Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
@@ -1,4 +1,4 @@
|
|
1 |
-
# Text → Translate → Speech
|
2 |
|
3 |
import tempfile
|
4 |
from pathlib import Path
|
@@ -10,9 +10,9 @@ from TTS.api import TTS
|
|
10 |
import gradio as gr
|
11 |
|
12 |
# ─────────────────────────────
|
13 |
-
# 1. Allow-list Coqui
|
14 |
# ─────────────────────────────
|
15 |
-
torch.serialization.add_safe_globals({
|
16 |
|
17 |
# ─────────────────────────────
|
18 |
# 2. Translation pipelines
|
@@ -21,13 +21,13 @@ PIPE_EN_ES = pipeline("translation", model="Helsinki-NLP/opus-mt-en-es", device=
|
|
21 |
PIPE_ES_EN = pipeline("translation", model="Helsinki-NLP/opus-mt-es-en", device=-1)
|
22 |
|
23 |
# ─────────────────────────────
|
24 |
-
# 3. TTS models
|
25 |
# ─────────────────────────────
|
26 |
TTS_EN = TTS(model_name="tts_models/en/ljspeech/tacotron2-DDC", progress_bar=False)
|
27 |
TTS_ES = TTS(model_name="tts_models/es/mai/tacotron2-DDC", progress_bar=False)
|
28 |
|
29 |
# ─────────────────────────────
|
30 |
-
# 4. Helper: synthesize WAV
|
31 |
# ─────────────────────────────
|
32 |
def synthesize(tts_model: TTS, text: str) -> str:
|
33 |
with tempfile.NamedTemporaryFile(suffix=".wav", delete=False) as tmp:
|
@@ -36,7 +36,7 @@ def synthesize(tts_model: TTS, text: str) -> str:
|
|
36 |
return str(wav_path)
|
37 |
|
38 |
# ─────────────────────────────
|
39 |
-
# 5. Core translate-and-speak
|
40 |
# ─────────────────────────────
|
41 |
def translate_and_speak(txt: str, target_lang: str):
|
42 |
if not txt.strip():
|
@@ -45,7 +45,7 @@ def translate_and_speak(txt: str, target_lang: str):
|
|
45 |
if target_lang == "Spanish":
|
46 |
translated = PIPE_EN_ES(txt)[0]["translation_text"]
|
47 |
audio_file = synthesize(TTS_ES, translated)
|
48 |
-
else:
|
49 |
translated = PIPE_ES_EN(txt)[0]["translation_text"]
|
50 |
audio_file = synthesize(TTS_EN, translated)
|
51 |
|
@@ -57,18 +57,18 @@ def translate_and_speak(txt: str, target_lang: str):
|
|
57 |
with gr.Blocks(title="Translator & TTS") as demo:
|
58 |
gr.Markdown(
|
59 |
"# 🌍💬 Text → Translate → Speech\n"
|
60 |
-
"Type a sentence, choose target language, and hear it spoken."
|
61 |
)
|
62 |
|
63 |
-
|
64 |
-
lang
|
65 |
|
66 |
-
run_btn
|
67 |
|
68 |
-
|
69 |
-
|
70 |
|
71 |
-
run_btn.click(translate_and_speak, [
|
72 |
|
73 |
if __name__ == "__main__":
|
74 |
demo.launch(server_name="0.0.0.0")
|
|
|
1 |
+
# Text → Translate → Speech | CPU-only Hugging-Face Space
|
2 |
|
3 |
import tempfile
|
4 |
from pathlib import Path
|
|
|
10 |
import gradio as gr
|
11 |
|
12 |
# ─────────────────────────────
|
13 |
+
# 1. Allow-list Coqui-TTS custom class (PyTorch ≥ 2.6)
|
14 |
# ─────────────────────────────
|
15 |
+
torch.serialization.add_safe_globals({tts_radam.RAdam}) # ← must pass the class object
|
16 |
|
17 |
# ─────────────────────────────
|
18 |
# 2. Translation pipelines
|
|
|
21 |
PIPE_ES_EN = pipeline("translation", model="Helsinki-NLP/opus-mt-es-en", device=-1)
|
22 |
|
23 |
# ─────────────────────────────
|
24 |
+
# 3. TTS models
|
25 |
# ─────────────────────────────
|
26 |
TTS_EN = TTS(model_name="tts_models/en/ljspeech/tacotron2-DDC", progress_bar=False)
|
27 |
TTS_ES = TTS(model_name="tts_models/es/mai/tacotron2-DDC", progress_bar=False)
|
28 |
|
29 |
# ─────────────────────────────
|
30 |
+
# 4. Helper: synthesize WAV
|
31 |
# ─────────────────────────────
|
32 |
def synthesize(tts_model: TTS, text: str) -> str:
|
33 |
with tempfile.NamedTemporaryFile(suffix=".wav", delete=False) as tmp:
|
|
|
36 |
return str(wav_path)
|
37 |
|
38 |
# ─────────────────────────────
|
39 |
+
# 5. Core translate-and-speak
|
40 |
# ─────────────────────────────
|
41 |
def translate_and_speak(txt: str, target_lang: str):
|
42 |
if not txt.strip():
|
|
|
45 |
if target_lang == "Spanish":
|
46 |
translated = PIPE_EN_ES(txt)[0]["translation_text"]
|
47 |
audio_file = synthesize(TTS_ES, translated)
|
48 |
+
else:
|
49 |
translated = PIPE_ES_EN(txt)[0]["translation_text"]
|
50 |
audio_file = synthesize(TTS_EN, translated)
|
51 |
|
|
|
57 |
with gr.Blocks(title="Translator & TTS") as demo:
|
58 |
gr.Markdown(
|
59 |
"# 🌍💬 Text → Translate → Speech\n"
|
60 |
+
"Type a sentence, choose the target language, and hear it spoken."
|
61 |
)
|
62 |
|
63 |
+
sentence = gr.Textbox(label="Sentence (English or Spanish)", lines=2)
|
64 |
+
lang = gr.Radio(["Spanish", "English"], value="Spanish", label="Translate to")
|
65 |
|
66 |
+
run_btn = gr.Button("Translate & Speak", variant="primary")
|
67 |
|
68 |
+
translated_txt = gr.Textbox(label="Translated text", interactive=False)
|
69 |
+
audio_out = gr.Audio(label="Speech output", type="filepath")
|
70 |
|
71 |
+
run_btn.click(translate_and_speak, [sentence, lang], [translated_txt, audio_out])
|
72 |
|
73 |
if __name__ == "__main__":
|
74 |
demo.launch(server_name="0.0.0.0")
|