mirror of
https://github.com/neoarz/Syntrel.git
synced 2025-12-25 03:40:11 +01:00
169
cogs/media/tts.py
Normal file
169
cogs/media/tts.py
Normal file
@@ -0,0 +1,169 @@
|
||||
import asyncio
|
||||
import io
|
||||
import tempfile
|
||||
from typing import Optional
|
||||
|
||||
import discord
|
||||
from discord import app_commands
|
||||
from discord.ext import commands
|
||||
from gtts import gTTS
|
||||
|
||||
|
||||
DEFAULT_LANG = "en"
|
||||
|
||||
def tts_command():
|
||||
|
||||
async def send_embed(
|
||||
context: commands.Context,
|
||||
embed: discord.Embed,
|
||||
*,
|
||||
ephemeral: bool = False,
|
||||
file: Optional[discord.File] = None,
|
||||
) -> None:
|
||||
interaction = getattr(context, "interaction", None)
|
||||
if interaction is not None:
|
||||
if interaction.response.is_done():
|
||||
if file:
|
||||
await interaction.followup.send(embed=embed, file=file, ephemeral=ephemeral)
|
||||
else:
|
||||
await interaction.followup.send(embed=embed, ephemeral=ephemeral)
|
||||
else:
|
||||
if file:
|
||||
await interaction.response.send_message(embed=embed, file=file, ephemeral=ephemeral)
|
||||
else:
|
||||
await interaction.response.send_message(embed=embed, ephemeral=ephemeral)
|
||||
else:
|
||||
if file:
|
||||
await context.send(embed=embed, file=file)
|
||||
else:
|
||||
await context.send(embed=embed)
|
||||
|
||||
async def generate_tts_audio(text: str) -> tuple[Optional[bytes], Optional[str]]:
|
||||
try:
|
||||
loop = asyncio.get_event_loop()
|
||||
audio_bytes = await loop.run_in_executor(
|
||||
None,
|
||||
lambda: _generate_tts_sync(text)
|
||||
)
|
||||
return audio_bytes, None
|
||||
except Exception as e:
|
||||
return None, str(e)
|
||||
|
||||
def _generate_tts_sync(text: str) -> bytes:
|
||||
tts = gTTS(text=text, lang=DEFAULT_LANG, slow=False)
|
||||
fp = io.BytesIO()
|
||||
tts.write_to_fp(fp)
|
||||
fp.seek(0)
|
||||
return fp.read()
|
||||
|
||||
@commands.hybrid_command(
|
||||
name="tts",
|
||||
description="Convert text to speech using Google Text-to-Speech.",
|
||||
)
|
||||
@app_commands.describe(
|
||||
text="The text to convert to speech",
|
||||
)
|
||||
async def tts(context: commands.Context, text: Optional[str] = None):
|
||||
if not text or not text.strip():
|
||||
if context.message and context.message.reference and context.message.reference.resolved:
|
||||
referenced = context.message.reference.resolved
|
||||
if isinstance(referenced, discord.Message) and referenced.content:
|
||||
text = referenced.content
|
||||
if not text or not text.strip():
|
||||
embed = (
|
||||
discord.Embed(
|
||||
title="Error",
|
||||
description="Please provide text to convert or reply to a message containing text.",
|
||||
color=0xE02B2B,
|
||||
).set_author(name="Media", icon_url="https://yes.nighty.works/raw/y5SEZ9.webp")
|
||||
)
|
||||
await send_embed(context, embed, ephemeral=True)
|
||||
return
|
||||
|
||||
text = text.strip()
|
||||
if len(text) > 500:
|
||||
embed = (
|
||||
discord.Embed(
|
||||
title="Error",
|
||||
description="Text is too long. Please limit to 500 characters.",
|
||||
color=0xE02B2B,
|
||||
).set_author(name="Media", icon_url="https://yes.nighty.works/raw/y5SEZ9.webp")
|
||||
)
|
||||
await send_embed(context, embed, ephemeral=True)
|
||||
return
|
||||
|
||||
processing_embed = (
|
||||
discord.Embed(
|
||||
title="TTS (Processing)",
|
||||
description="<a:mariospin:1423677027013103709> Generating speech...",
|
||||
color=0x7289DA,
|
||||
).set_author(name="Media", icon_url="https://yes.nighty.works/raw/y5SEZ9.webp")
|
||||
)
|
||||
|
||||
interaction = getattr(context, "interaction", None)
|
||||
processing_message = None
|
||||
sent_initial_interaction_response = False
|
||||
|
||||
if interaction is not None:
|
||||
if interaction.response.is_done():
|
||||
processing_message = await interaction.followup.send(embed=processing_embed, ephemeral=True)
|
||||
else:
|
||||
await interaction.response.send_message(embed=processing_embed, ephemeral=True)
|
||||
sent_initial_interaction_response = True
|
||||
else:
|
||||
processing_message = await context.send(embed=processing_embed)
|
||||
|
||||
audio_bytes, error = await generate_tts_audio(text)
|
||||
|
||||
if error or not audio_bytes:
|
||||
embed = (
|
||||
discord.Embed(
|
||||
title="Error",
|
||||
description=f"Failed to generate speech. {error or 'Unknown error.'}",
|
||||
color=0xE02B2B,
|
||||
).set_author(name="Media", icon_url="https://yes.nighty.works/raw/y5SEZ9.webp")
|
||||
)
|
||||
await send_embed(context, embed, ephemeral=True)
|
||||
if interaction is not None and sent_initial_interaction_response:
|
||||
try:
|
||||
await interaction.delete_original_response()
|
||||
except Exception:
|
||||
pass
|
||||
if processing_message:
|
||||
try:
|
||||
await processing_message.delete()
|
||||
except Exception:
|
||||
pass
|
||||
return
|
||||
|
||||
audio_file = discord.File(
|
||||
io.BytesIO(audio_bytes),
|
||||
filename="audio.mp3",
|
||||
)
|
||||
|
||||
embed = (
|
||||
discord.Embed(
|
||||
title="Text-to-Speech",
|
||||
description=f"**Input:** {text}",
|
||||
color=0x7289DA,
|
||||
)
|
||||
.set_author(name="Media", icon_url="https://yes.nighty.works/raw/y5SEZ9.webp")
|
||||
.set_footer(
|
||||
text=f"Requested by {context.author.display_name}",
|
||||
icon_url=getattr(context.author.display_avatar, "url", None),
|
||||
)
|
||||
)
|
||||
|
||||
if interaction is not None:
|
||||
await context.channel.send(embed=embed)
|
||||
await context.channel.send(file=audio_file)
|
||||
try:
|
||||
await interaction.delete_original_response()
|
||||
except:
|
||||
pass
|
||||
else:
|
||||
await processing_message.delete()
|
||||
await context.channel.send(embed=embed)
|
||||
await context.channel.send(file=audio_file)
|
||||
|
||||
return tts
|
||||
Reference in New Issue
Block a user