Edge-TTS-Text-to-Speech

Sleeping

App Files Files Community

EmRa228 committed on May 8, 2025

Commit

a257b37

verified ·

1 Parent(s): 3e4c239

Update app.py

Browse files

Files changed (1) hide show

app.py +34 -45

app.py CHANGED Viewed

@@ -1,81 +1,70 @@
 import os
 import gradio as gr
-import edge_tts
 import asyncio
 import tempfile
-# 1) Load voices once at startup
 def load_voices():
     loop = asyncio.get_event_loop()
     voices = loop.run_until_complete(edge_tts.list_voices())
-    return {
-        f"{v['ShortName']} - {v['Locale']} ({v['Gender']})": v['ShortName']
-        for v in voices
-    }
 VOICES = load_voices()
-# 2) Async TTS worker
-async def _text_to_speech(text, short_name, rate_str, pitch_str):
     comm = edge_tts.Communicate(text, short_name, rate=rate_str, pitch=pitch_str)
     with tempfile.NamedTemporaryFile(delete=False, suffix=".mp3") as tmp:
         await comm.save(tmp.name)
         return tmp.name
-# 3) Sync wrapper for Gradio callback
-def tts_interface(text, voice_choice, rate, pitch):
     if not text.strip():
-        return None, "🚨 Please enter text."
-    if not voice_choice:
-        return None, "🚨 Please select a voice."
-    short_name = voice_choice.split(" - ")[0]
-    rate_str  = f"{rate:+d}%"
-    pitch_str = f"{pitch:+d}Hz"
     try:
-        audio_path = asyncio.get_event_loop().run_until_complete(
-            _text_to_speech(text, short_name, rate_str, pitch_str)
         )
-        return audio_path, ""
     except Exception as e:
-        return None, f"❌ TTS error: {e}"
-# 4) Build the Gradio UI
-def create_demo():
     with gr.Blocks(analytics_enabled=False) as demo:
-        gr.Markdown("# 🎙️ Edge TTS on Hugging Face Spaces")
-        gr.Markdown(
-            "**Convert your text to speech** using Microsoft Edge’s neural voices. "
-            "Adjust rate and pitch to fine-tune the output."
-        )
         with gr.Row():
-            txt   = gr.Textbox(label="Input Text", lines=5, placeholder="Type here…")
-            vox   = gr.Dropdown(choices=list(VOICES.keys()), label="Voice")
-            rate  = gr.Slider(-50, 50, value=0, label="Rate (%)")
-            pitch = gr.Slider(-20, 20, value=0, label="Pitch (Hz)")
-        btn       = gr.Button("Generate Speech")
-        audio_out = gr.Audio(type="filepath", label="Output Audio")
-        warn_md   = gr.Markdown("", label="Warnings / Errors")
         btn.click(
             fn=tts_interface,
-            inputs=[txt, vox, rate, pitch],
-            outputs=[audio_out, warn_md]
         )
-        # Register API endpoints
-        demo.queue()
     return demo
 if __name__ == "__main__":
-    demo = create_demo()
-    # 5) Bind to 0.0.0.0 and the port provided by HF Spaces (defaults to 7860 internally)
     port = int(os.environ.get("PORT", 7860))
     demo.launch(
         server_name="0.0.0.0",
         server_port=port,
-        share=False
     )

 import os
 import gradio as gr
 import asyncio
+import edge_tts
 import tempfile
def load_voices():
    """Fetch the edge-tts voice list and index it by a display label.

    Returns:
        dict: maps ``"<ShortName> - <Locale> (<Gender>)"`` to the voice's
        ``ShortName``, built from the entries returned by
        ``edge_tts.list_voices()``.
    """
    # asyncio.run() creates and tears down its own event loop. Calling
    # asyncio.get_event_loop() with no running loop is deprecated and raises
    # RuntimeError on newer Python versions.
    voices = asyncio.run(edge_tts.list_voices())
    return {
        f"{v['ShortName']} - {v['Locale']} ({v['Gender']})": v["ShortName"]
        for v in voices
    }


# Loaded once at import time; the UI dropdown is populated from these labels.
VOICES = load_voices()
async def _tts(text, short_name, rate_str, pitch_str):
    """Synthesise *text* with edge-tts and save it to a temporary .mp3 file.

    Args:
        text: The text to speak.
        short_name: Voice identifier passed to ``edge_tts.Communicate``.
        rate_str: Rate offset string passed as ``rate=`` (e.g. ``"+0%"``).
        pitch_str: Pitch offset string passed as ``pitch=`` (e.g. ``"+0Hz"``).

    Returns:
        str: Path of the saved audio file. The file is created with
        ``delete=False``, so removing it later is the caller's concern.

    Raises:
        Whatever ``Communicate.save`` raises; the temporary file is removed
        before the exception propagates.
    """
    comm = edge_tts.Communicate(text, short_name, rate=rate_str, pitch=pitch_str)

    # Reserve a unique path, then close our own handle before edge-tts writes
    # to that path.
    with tempfile.NamedTemporaryFile(delete=False, suffix=".mp3") as tmp:
        path = tmp.name

    try:
        await comm.save(path)
    except BaseException:
        # Includes task cancellation: do not leave an orphaned file behind
        # for every failed request.
        try:
            os.unlink(path)
        except OSError:
            pass
        raise
    return path
def tts_interface(text, voice, rate, pitch):
    """Synchronous Gradio callback that turns *text* into an audio file.

    Args:
        text: Text to speak; ``None``, empty or whitespace-only is rejected.
        voice: Dropdown label of the form
            ``"<ShortName> - <Locale> (<Gender>)"``; only the part before the
            first ``" - "`` is used.
        rate: Speaking-rate offset in percent (int or float).
        pitch: Pitch offset in Hz (int or float).

    Returns:
        tuple: ``(path, "")`` on success, or ``(None, message)`` when the
        input is invalid or synthesis fails.
    """
    if not text or not text.strip():
        return None, "🚨 Enter some text."
    if not voice:
        return None, "🚨 Select a voice."

    name = voice.split(" - ")[0]

    # Slider values may arrive as floats, and the "d" format code raises
    # ValueError for floats, so round to a whole number first.
    rate_s = f"{int(round(rate)):+d}%"
    pitch_s = f"{int(round(pitch)):+d}Hz"

    try:
        # asyncio.run() makes a fresh event loop, so this also works when the
        # callback runs in a thread that has no current loop (where
        # asyncio.get_event_loop() raises RuntimeError).
        path = asyncio.run(_tts(text, name, rate_s, pitch_s))
    except Exception as e:
        # UI boundary: report the failure to the user instead of crashing.
        return None, f"❌ TTS failed: {e}"
    return path, ""
def create_app():
    """Build the Gradio Blocks UI for the text-to-speech demo.

    Layout: a row with the text box, voice dropdown and rate/pitch sliders,
    followed by a button, an audio output and a Markdown area for messages.
    The button is wired to ``tts_interface``.

    Returns:
        gr.Blocks: the assembled app with its queue enabled (not launched).
    """
    with gr.Blocks(analytics_enabled=False) as demo:
        gr.Markdown("# 🎙️ Edge TTS in Hugging Face Space")
        gr.Markdown("Convert text to speech with Microsoft Edge voices.")

        with gr.Row():
            txt = gr.Textbox(lines=5, label="Input Text")
            vox = gr.Dropdown(list(VOICES), label="Voice")
            # step=1 keeps both sliders on whole numbers, matching the
            # integer "+N%" / "+NHz" strings the handler formats.
            rate = gr.Slider(-50, 50, value=0, step=1, label="Rate (%)")
            pit = gr.Slider(-20, 20, value=0, step=1, label="Pitch (Hz)")

        btn = gr.Button("Generate")
        out_audio = gr.Audio(type="filepath", label="Audio")
        warn = gr.Markdown("", label="Warning")

        btn.click(
            fn=tts_interface,
            inputs=[txt, vox, rate, pit],
            outputs=[out_audio, warn],
        )

        # Enable Gradio's request queue (original author's note: registers
        # the /api endpoints).
        demo.queue()
    return demo
 if __name__ == "__main__":
+    demo = create_app()
     port = int(os.environ.get("PORT", 7860))
     demo.launch(
         server_name="0.0.0.0",
         server_port=port,
+        ssr_mode=False  # disable SSR introspection errors
     )