Edge-TTS-Text-to-Speech

Sleeping

App Files Community

EmRa228 committed on May 8

Commit

ac7fa1f

verified ·

1 Parent(s): 6b78aa7

Update app.py

Browse files

Files changed (1) hide show

app.py +18 -21

app.py CHANGED Viewed

@@ -3,7 +3,7 @@ import edge_tts
 import asyncio
 import tempfile
-# 1) Fetch voices once, synchronously at startup
 def load_voices():
     loop = asyncio.get_event_loop()
     voices = loop.run_until_complete(edge_tts.list_voices())
@@ -14,14 +14,14 @@ def load_voices():
 VOICES = load_voices()
-# 2) Async function to drive Edge TTS
 async def _text_to_speech(text, short_name, rate_str, pitch_str):
-    communicate = edge_tts.Communicate(text, short_name, rate=rate_str, pitch=pitch_str)
     with tempfile.NamedTemporaryFile(delete=False, suffix=".mp3") as tmp:
-        await communicate.save(tmp.name)
         return tmp.name
-# 3) Sync wrapper for the click callback
 def tts_interface(text, voice_choice, rate, pitch):
     if not text.strip():
         return None, "🚨 Please enter some text."
@@ -31,7 +31,6 @@ def tts_interface(text, voice_choice, rate, pitch):
     rate_str  = f"{rate:+d}%"
     pitch_str = f"{pitch:+d}Hz"
     try:
-        # Run the async TTS call synchronously
         audio_path = asyncio.get_event_loop().run_until_complete(
             _text_to_speech(text, short_name, rate_str, pitch_str)
         )
@@ -39,35 +38,34 @@ def tts_interface(text, voice_choice, rate, pitch):
     except Exception as e:
         return None, f"❌ TTS failed: {e}"
-# 4) Build the Gradio Blocks UI
 def create_demo():
     with gr.Blocks(analytics_enabled=False) as demo:
         gr.Markdown("# 🎙️ Edge TTS on Hugging Face Spaces")
-        with gr.Row():
-            gr.Markdown("""
-**Convert your text to speech** using Microsoft Edge's neural voices.
-Adjust rate and pitch to fine-tune the output.
-""")
         with gr.Row():
-            txt = gr.Textbox(label="Input Text", lines=5, placeholder="Type something…")
-            vox = gr.Dropdown(choices=list(VOICES.keys()), label="Voice")
-            rate = gr.Slider(-50, 50, value=0, label="Rate (%)")
             pitch = gr.Slider(-20, 20, value=0, label="Pitch (Hz)")
-        btn = gr.Button("Generate Speech")
         audio_out = gr.Audio(type="filepath", label="Audio Output")
-        warn_md  = gr.Markdown("", label="Warnings / Errors")
-        # IMPORTANT: wire queue here so the frontend finds /api/predict
         btn.click(
             fn=tts_interface,
             inputs=[txt, vox, rate, pitch],
             outputs=[audio_out, warn_md]
         )
-        # Enable the queue on the entire app
         demo.queue()
     return demo
@@ -75,5 +73,4 @@ Adjust rate and pitch to fine-tune the output.
 # 5) Launch
 if __name__ == "__main__":
     demo = create_demo()
-    # On Spaces, this will serve on 0.0.0.0:7860 automatically
-    demo.launch()

 import asyncio
 import tempfile
+# 1) Load voices once at startup
 def load_voices():
     loop = asyncio.get_event_loop()
     voices = loop.run_until_complete(edge_tts.list_voices())
 VOICES = load_voices()
+# 2) Async TTS worker
 async def _text_to_speech(text, short_name, rate_str, pitch_str):
+    comm = edge_tts.Communicate(text, short_name, rate=rate_str, pitch=pitch_str)
     with tempfile.NamedTemporaryFile(delete=False, suffix=".mp3") as tmp:
+        await comm.save(tmp.name)
         return tmp.name
+# 3) Synchronous wrapper for Gradio callback
 def tts_interface(text, voice_choice, rate, pitch):
     if not text.strip():
         return None, "🚨 Please enter some text."
     rate_str  = f"{rate:+d}%"
     pitch_str = f"{pitch:+d}Hz"
     try:
         audio_path = asyncio.get_event_loop().run_until_complete(
             _text_to_speech(text, short_name, rate_str, pitch_str)
         )
     except Exception as e:
         return None, f"❌ TTS failed: {e}"
+# 4) Build Gradio Blocks UI
 def create_demo():
     with gr.Blocks(analytics_enabled=False) as demo:
         gr.Markdown("# 🎙️ Edge TTS on Hugging Face Spaces")
+        gr.Markdown(
+            "**Convert your text to speech** using Microsoft Edge's neural voices. "
+            "Adjust rate and pitch to fine-tune the output."
+        )
         with gr.Row():
+            txt   = gr.Textbox(label="Input Text", lines=5, placeholder="Type something…")
+            vox   = gr.Dropdown(choices=list(VOICES.keys()), label="Voice")
+            rate  = gr.Slider(-50, 50, value=0, label="Rate (%)")
             pitch = gr.Slider(-20, 20, value=0, label="Pitch (Hz)")
+        btn       = gr.Button("Generate Speech")
         audio_out = gr.Audio(type="filepath", label="Audio Output")
+        warn_md   = gr.Markdown("", label="Warnings / Errors")
+        # Wire the callback and register the /api endpoints
         btn.click(
             fn=tts_interface,
             inputs=[txt, vox, rate, pitch],
             outputs=[audio_out, warn_md]
         )
+        # Enable queuing so that Gradio registers its API
         demo.queue()
     return demo
 # 5) Launch
 if __name__ == "__main__":
     demo = create_demo()
+    demo.launch()