Spaces:

sulaimank
/

luganda-TTS

Sleeping

App Files Files Community

sulaimank committed on 27 days ago

Commit

fa96784

verified ·

1 Parent(s): d3ac76b

Update app.py

Browse files

Files changed (1) hide show

app.py +28 -15

app.py CHANGED Viewed

@@ -7,44 +7,57 @@ from TTS.utils.synthesizer import Synthesizer
 # Max input text length
 MAX_TXT_LEN = 400
-# Use a single checkpoint from your repo
-MODEL_FILE = "checkpoint_2080000.pth"
-# Download config and checkpoint once
 config_path = hf_hub_download("sulaimank/luganda_LMs", filename="config.json")
-model_path = hf_hub_download("sulaimank/luganda_LMs", filename=MODEL_FILE)
-# Load synthesizer at startup
-synthesizer = Synthesizer(
-    tts_checkpoint=model_path,
-    tts_config_path=config_path
-)
-def tts(text: str):
     if len(text) > MAX_TXT_LEN:
         text = text[:MAX_TXT_LEN]
         print(f"⚠️ Input truncated to {MAX_TXT_LEN} characters.")
     wav = synthesizer.tts(text)
-    # Save temp wav for playback
     with tempfile.NamedTemporaryFile(suffix=".wav", delete=False) as fp:
         synthesizer.save_wav(wav, fp.name)
         return fp.name
 # Example sentences
 examples = [
-    ["Nalubaale y'ennyanja esinga obunene mu Uganda."],
 ]
 description = """
-🗣️ **Luganda TTS Demo** 🗣️
-Convert Luganda text into speech using a VITS model trained with Coqui TTS.
 """
 iface = gr.Interface(
     fn=tts,
-    inputs=gr.Textbox(label="Enter Luganda Text", value="Kampala kye kibuga kya Uganda ekikulu."),
     outputs=gr.Audio(label="Generated Speech", type="filepath"),
     examples=examples,
     title="Luganda TTS",

 # Max input text length
 MAX_TXT_LEN = 400
+# Map simple names (Model 1, Model 2...) to checkpoint files
+MODEL_INFO = {
+    "Model 1": "checkpoint_2080000.pth",
+    "Model 2": "checkpoint_2085000.pth",
+    "Model 3": "checkpoint_2090000.pth",
+    "Model 4": "checkpoint_2095000.pth",
+    "Model 5": "checkpoint_2100000.pth",
+}
+# Download config once
 config_path = hf_hub_download("sulaimank/luganda_LMs", filename="config.json")
+def load_synth(model_file):
+    """Download and initialize the chosen synthesizer"""
+    model_path = hf_hub_download("sulaimank/luganda_LMs", filename=model_file)
+    return Synthesizer(
+        tts_checkpoint=model_path,
+        tts_config_path=config_path
+    )
+def tts(text: str, model_choice: str):
     if len(text) > MAX_TXT_LEN:
         text = text[:MAX_TXT_LEN]
         print(f"⚠️ Input truncated to {MAX_TXT_LEN} characters.")
+    synthesizer = load_synth(MODEL_INFO[model_choice])
     wav = synthesizer.tts(text)
+    # Save temp wav file for playback
     with tempfile.NamedTemporaryFile(suffix=".wav", delete=False) as fp:
         synthesizer.save_wav(wav, fp.name)
         return fp.name
 # Example sentences
 examples = [
+    ["Nnalubaale egabirirwa emigga mingi nnyo, nga mu gino, egisinga obunene mulimu Katonga, nga guno gusibuka mu bitundu eby'obugwanjuba bwa Uganda.", "Model 1"],
+    ["Kampala kye kibuga kya Uganda ekikulu.", "Model 5"],
 ]
 description = """
+🗣️ **Luganda TTS** 🗣️
+Convert Luganda text into speech using VITS models.
+Choose one of the available models to compare synthesis quality.
 """
 iface = gr.Interface(
     fn=tts,
+    inputs=[
+        gr.Textbox(label="Enter Luganda Text", value="Gyebale ko ssebo."),
+        gr.Radio(label="Choose Model", choices=list(MODEL_INFO.keys()), value="Model 1"),
+    ],
     outputs=gr.Audio(label="Generated Speech", type="filepath"),
     examples=examples,
     title="Luganda TTS",