cogs/media/tts.py

import asyncio
import io
import tempfile
from typing import Optional

import discord
from discord import app_commands
from discord.ext import commands
from gtts import gTTS


DEFAULT_LANG = "en"

def tts_command():

    async def send_embed(
        context: commands.Context,
        embed: discord.Embed,
        *,
        ephemeral: bool = False,
        file: Optional[discord.File] = None,
    ) -> None:
        interaction = getattr(context, "interaction", None)
        if interaction is not None:
            if interaction.response.is_done():
                if file:
                    await interaction.followup.send(embed=embed, file=file, ephemeral=ephemeral)
                else:
                    await interaction.followup.send(embed=embed, ephemeral=ephemeral)
            else:
                if file:
                    await interaction.response.send_message(embed=embed, file=file, ephemeral=ephemeral)
                else:
                    await interaction.response.send_message(embed=embed, ephemeral=ephemeral)
        else:
            if file:
                await context.send(embed=embed, file=file)
            else:
                await context.send(embed=embed)

    async def generate_tts_audio(text: str) -> tuple[Optional[bytes], Optional[str]]:
        try:
            loop = asyncio.get_event_loop()
            audio_bytes = await loop.run_in_executor(
                None,
                lambda: _generate_tts_sync(text)
            )
            return audio_bytes, None
        except Exception as e:
            return None, str(e)

    def _generate_tts_sync(text: str) -> bytes:
        tts = gTTS(text=text, lang=DEFAULT_LANG, slow=False)
        fp = io.BytesIO()
        tts.write_to_fp(fp)
        fp.seek(0)
        return fp.read()

    @commands.hybrid_command(
        name="tts",
        description="Convert text to speech using Google Text-to-Speech.",
    )
    @app_commands.describe(
        text="The text to convert to speech",
    )
    async def tts(context: commands.Context, text: Optional[str] = None):
        if not text or not text.strip():
            if context.message and context.message.reference and context.message.reference.resolved:
                referenced = context.message.reference.resolved
                if isinstance(referenced, discord.Message) and referenced.content:
                    text = referenced.content
        if not text or not text.strip():
            embed = (
                discord.Embed(
                    title="Error",
                    description="Please provide text to convert or reply to a message containing text.",
                    color=0xE02B2B,
                ).set_author(name="Media", icon_url="https://yes.nighty.works/raw/y5SEZ9.webp")
            )
            await send_embed(context, embed, ephemeral=True)
            return

        text = text.strip()
        if len(text) > 500:
            embed = (
                discord.Embed(
                    title="Error",
                    description="Text is too long. Please limit to 500 characters.",
                    color=0xE02B2B,
                ).set_author(name="Media", icon_url="https://yes.nighty.works/raw/y5SEZ9.webp")
            )
            await send_embed(context, embed, ephemeral=True)
            return

        processing_embed = (
            discord.Embed(
                title="TTS (Processing)",
                description="<a:mariospin:1423677027013103709> Generating speech...",
                color=0x7289DA,
            ).set_author(name="Media", icon_url="https://yes.nighty.works/raw/y5SEZ9.webp")
        )

        interaction = getattr(context, "interaction", None)
        processing_message = None
        sent_initial_interaction_response = False

        if interaction is not None:
            if interaction.response.is_done():
                processing_message = await interaction.followup.send(embed=processing_embed, ephemeral=True)
            else:
                await interaction.response.send_message(embed=processing_embed, ephemeral=True)
                sent_initial_interaction_response = True
        else:
            processing_message = await context.send(embed=processing_embed)

        audio_bytes, error = await generate_tts_audio(text)

        if error or not audio_bytes:
            embed = (
                discord.Embed(
                    title="Error",
                    description=f"Failed to generate speech. {error or 'Unknown error.'}",
                    color=0xE02B2B,
                ).set_author(name="Media", icon_url="https://yes.nighty.works/raw/y5SEZ9.webp")
            )
            await send_embed(context, embed, ephemeral=True)
            if interaction is not None and sent_initial_interaction_response:
                try:
                    await interaction.delete_original_response()
                except Exception:
                    pass
            if processing_message:
                try:
                    await processing_message.delete()
                except Exception:
                    pass
            return

        audio_file = discord.File(
            io.BytesIO(audio_bytes),
            filename="audio.mp3",
        )

        embed = (
            discord.Embed(
                title="Text-to-Speech",
                description=f"**Input:** {text}",
                color=0x7289DA,
            )
            .set_author(name="Media", icon_url="https://yes.nighty.works/raw/y5SEZ9.webp")
            .set_footer(
                text=f"Requested by {context.author.display_name}",
                icon_url=getattr(context.author.display_avatar, "url", None),
            )
        )

        if interaction is not None:
            await context.channel.send(embed=embed)
            await context.channel.send(file=audio_file)
            try:
                await interaction.delete_original_response()
            except:
                pass
        else:
            await processing_message.delete()
            await context.channel.send(embed=embed)
            await context.channel.send(file=audio_file)

    return tts
feat(tts): new command Co-authored-by: neoarz <tyrantneo740@gmail.com> 2025-10-15 06:35:19 +02:00			`import asyncio`
			`import io`
			`import tempfile`
			`from typing import Optional`

			`import discord`
			`from discord import app_commands`
			`from discord.ext import commands`
			`from gtts import gTTS`


			`DEFAULT_LANG = "en"`

			`def tts_command():`

			`async def send_embed(`
			`context: commands.Context,`
			`embed: discord.Embed,`
			`*,`
			`ephemeral: bool = False,`
			`file: Optional[discord.File] = None,`
			`) -> None:`
			`interaction = getattr(context, "interaction", None)`
			`if interaction is not None:`
			`if interaction.response.is_done():`
			`if file:`
			`await interaction.followup.send(embed=embed, file=file, ephemeral=ephemeral)`
			`else:`
			`await interaction.followup.send(embed=embed, ephemeral=ephemeral)`
			`else:`
			`if file:`
			`await interaction.response.send_message(embed=embed, file=file, ephemeral=ephemeral)`
			`else:`
			`await interaction.response.send_message(embed=embed, ephemeral=ephemeral)`
			`else:`
			`if file:`
			`await context.send(embed=embed, file=file)`
			`else:`
			`await context.send(embed=embed)`

			`async def generate_tts_audio(text: str) -> tuple[Optional[bytes], Optional[str]]:`
			`try:`
			`loop = asyncio.get_event_loop()`
			`audio_bytes = await loop.run_in_executor(`
			`None,`
			`lambda: _generate_tts_sync(text)`
			`)`
			`return audio_bytes, None`
			`except Exception as e:`
			`return None, str(e)`

			`def _generate_tts_sync(text: str) -> bytes:`
			`tts = gTTS(text=text, lang=DEFAULT_LANG, slow=False)`
			`fp = io.BytesIO()`
			`tts.write_to_fp(fp)`
			`fp.seek(0)`
			`return fp.read()`

			`@commands.hybrid_command(`
			`name="tts",`
			`description="Convert text to speech using Google Text-to-Speech.",`
			`)`
			`@app_commands.describe(`
			`text="The text to convert to speech",`
			`)`
			`async def tts(context: commands.Context, text: Optional[str] = None):`
			`if not text or not text.strip():`
			`if context.message and context.message.reference and context.message.reference.resolved:`
			`referenced = context.message.reference.resolved`
			`if isinstance(referenced, discord.Message) and referenced.content:`
			`text = referenced.content`
			`if not text or not text.strip():`
			`embed = (`
			`discord.Embed(`
			`title="Error",`
			`description="Please provide text to convert or reply to a message containing text.",`
			`color=0xE02B2B,`
			`).set_author(name="Media", icon_url="https://yes.nighty.works/raw/y5SEZ9.webp")`
			`)`
			`await send_embed(context, embed, ephemeral=True)`
			`return`

			`text = text.strip()`
			`if len(text) > 500:`
			`embed = (`
			`discord.Embed(`
			`title="Error",`
			`description="Text is too long. Please limit to 500 characters.",`
			`color=0xE02B2B,`
			`).set_author(name="Media", icon_url="https://yes.nighty.works/raw/y5SEZ9.webp")`
			`)`
			`await send_embed(context, embed, ephemeral=True)`
			`return`

			`processing_embed = (`
			`discord.Embed(`
			`title="TTS (Processing)",`
			`description="<a:mariospin:1423677027013103709> Generating speech...",`
			`color=0x7289DA,`
			`).set_author(name="Media", icon_url="https://yes.nighty.works/raw/y5SEZ9.webp")`
			`)`

			`interaction = getattr(context, "interaction", None)`
			`processing_message = None`
			`sent_initial_interaction_response = False`

			`if interaction is not None:`
			`if interaction.response.is_done():`
			`processing_message = await interaction.followup.send(embed=processing_embed, ephemeral=True)`
			`else:`
			`await interaction.response.send_message(embed=processing_embed, ephemeral=True)`
			`sent_initial_interaction_response = True`
			`else:`
			`processing_message = await context.send(embed=processing_embed)`

			`audio_bytes, error = await generate_tts_audio(text)`

			`if error or not audio_bytes:`
			`embed = (`
			`discord.Embed(`
			`title="Error",`
			`description=f"Failed to generate speech. {error or 'Unknown error.'}",`
			`color=0xE02B2B,`
			`).set_author(name="Media", icon_url="https://yes.nighty.works/raw/y5SEZ9.webp")`
			`)`
			`await send_embed(context, embed, ephemeral=True)`
			`if interaction is not None and sent_initial_interaction_response:`
			`try:`
			`await interaction.delete_original_response()`
			`except Exception:`
			`pass`
			`if processing_message:`
			`try:`
			`await processing_message.delete()`
			`except Exception:`
			`pass`
			`return`

			`audio_file = discord.File(`
			`io.BytesIO(audio_bytes),`
			`filename="audio.mp3",`
			`)`

			`embed = (`
			`discord.Embed(`
			`title="Text-to-Speech",`
			`description=f"Input: {text}",`
			`color=0x7289DA,`
			`)`
			`.set_author(name="Media", icon_url="https://yes.nighty.works/raw/y5SEZ9.webp")`
			`.set_footer(`
			`text=f"Requested by {context.author.display_name}",`
			`icon_url=getattr(context.author.display_avatar, "url", None),`
			`)`
			`)`

			`if interaction is not None:`
			`await context.channel.send(embed=embed)`
			`await context.channel.send(file=audio_file)`
			`try:`
			`await interaction.delete_original_response()`
			`except:`
			`pass`
			`else:`
			`await processing_message.delete()`
			`await context.channel.send(embed=embed)`
			`await context.channel.send(file=audio_file)`

			`return tts`