Spaces:

MALIBA-AI
/

BambaraText2Speech

Running on Zero

App Files Files Community

sudoping01 committed 8 days ago

Commit

9b1a61d

verified ·

1 Parent(s): e347941

Update app.py

Browse files

Files changed (1) hide show

app.py +38 -36

app.py CHANGED Viewed

@@ -104,7 +104,7 @@ def initialize_model_once():
         start_time = time.time()
         # Use the new import structure from the README
-        from maliba_ai.tts import BambaraTTSInference
         model = BambaraTTSInference()
         speakers = get_speakers_dict()
@@ -233,7 +233,7 @@ def get_speaker_names():
 SPEAKER_NAMES = get_speaker_names()
-# Examples with variety of lengths - use only available speakers with fallbacks
 examples = [
     ["Aw ni ce", "Adama"],  # Natural conversational greeting
     ["Mali bɛna diya kɔsɛbɛ, ka a da a kan baara bɛ ka kɛ.", "Moussa"],  # Clear pronunciation for informative content
@@ -244,32 +244,37 @@ examples = [
     ["Aw ni ce. Ne tɔgɔ ye Adama. Awɔ, ne ye maliden de ye. Aw Sanbɛ Sanbɛ. San min tɛ ɲinan ye, an bɛɛ ka jɛ ka o seli ɲɔgɔn fɛ, hɛɛrɛ ni lafiya la. Ala ka Mali suma. Ala ka Mali yiriwa. Ala ka Mali taa ɲɛ. Ala ka an ka seliw caya. Ala ka yafa an bɛɛ ma.", "Moussa"],  # Clear pronunciation for heartfelt long message
     ["An dɔlakelen bɛ masike bilenman don ka tɔw gɛn.", "Bourama"],  # Most stable for complex statement
     ["Aw ni ce. Seidu bɛ aw fo wa aw ka yafa a ma, ka da a kan tuma dɔw la kow ka can.", "Modibo"],  # Expressive delivery for personal greeting
 ]
-# Additional examples for when all 10 speakers are available
-def get_examples_for_available_speakers():
-    """Generate examples based on available speakers"""
-    base_examples = examples.copy()
-    # Add more examples if we have more speakers available
-    if len(SPEAKER_NAMES) > 5:
-        additional_examples = []
-        # Add examples for additional speakers if they exist
-        if "Amadou" in SPEAKER_NAMES:
-            additional_examples.append(["To tɔ nantan ni lafiya, o ka fisa ni so fa dumuniba kɛlɛma ye.", "Amadou"])
-        if "Bakary" in SPEAKER_NAMES:
-            additional_examples.append(["Mali ye jamana ɲuman ye!", "Bakary"])
-        if "Ngolo" in SPEAKER_NAMES:
-            additional_examples.append(["An ka ɲɔgɔn dɛmɛ ka baara kɛ ɲɔgɔn fɛ", "Ngolo"])
-        if "Ibrahima" in SPEAKER_NAMES:
-            additional_examples.append(["Hakili to yɔrɔ min na, sabali bɛ yen", "Ibrahima"])
-        if "Amara" in SPEAKER_NAMES:
-            additional_examples.append(["Dɔnko ɲuman ye, a bɛ dɔn mɔgɔ kɔnɔ", "Amara"])
-        base_examples.extend(additional_examples)
-    return base_examples
 def build_interface():
     """Build the Gradio interface - simplified like your old working version"""
@@ -369,17 +374,15 @@ def build_interface():
             gr.Markdown("**Click any example below:**")
-            # Use dynamic examples based on available speakers
-            current_examples = get_examples_for_available_speakers()
-            for i, (text, speaker) in enumerate(current_examples):
-                # Only show examples for speakers that are actually available
-                if speaker in SPEAKER_NAMES:
-                    btn = gr.Button(f"{text[:30]}{'...' if len(text) > 30 else ''}", size="sm")
-                    btn.click(
-                        fn=lambda t=text, s=speaker: load_example(t, s),
-                        outputs=[text_input, speaker_dropdown, use_advanced, temperature, top_k, top_p, max_tokens]
-                    )
         with gr.Accordion("About", open=False):
             gr.Markdown(f"""
@@ -441,8 +444,7 @@ def build_interface():
 def main():
     """Main function to launch the Gradio interface"""
     logger.info("Starting Bambara TTS Gradio interface.")
-    # DO NOT preload - let it initialize on first request only (like your working version)
     interface = build_interface()
     interface.launch(
         server_name="0.0.0.0",

         start_time = time.time()
         # Use the new import structure from the README
+        from maliba_ai.tts.inference import BambaraTTSInference
         model = BambaraTTSInference()
         speakers = get_speakers_dict()
 SPEAKER_NAMES = get_speaker_names()
+# Examples covering nine speakers (there is no example for Seydou) - with fallbacks for missing speakers
 examples = [
     ["Aw ni ce", "Adama"],  # Natural conversational greeting
     ["Mali bɛna diya kɔsɛbɛ, ka a da a kan baara bɛ ka kɛ.", "Moussa"],  # Clear pronunciation for informative content
     ["Aw ni ce. Ne tɔgɔ ye Adama. Awɔ, ne ye maliden de ye. Aw Sanbɛ Sanbɛ. San min tɛ ɲinan ye, an bɛɛ ka jɛ ka o seli ɲɔgɔn fɛ, hɛɛrɛ ni lafiya la. Ala ka Mali suma. Ala ka Mali yiriwa. Ala ka Mali taa ɲɛ. Ala ka an ka seliw caya. Ala ka yafa an bɛɛ ma.", "Moussa"],  # Clear pronunciation for heartfelt long message
     ["An dɔlakelen bɛ masike bilenman don ka tɔw gɛn.", "Bourama"],  # Most stable for complex statement
     ["Aw ni ce. Seidu bɛ aw fo wa aw ka yafa a ma, ka da a kan tuma dɔw la kow ka can.", "Modibo"],  # Expressive delivery for personal greeting
+    ["To tɔ nantan ni lafiya, o ka fisa ni so fa dumuniba kɛlɛma ye.", "Amadou"],  # Warm and friendly voice for wisdom saying
+    ["Mali ye jamana ɲuman ye!", "Bakary"],  # Deep, authoritative tone for patriotic statement
+    ["An ka ɲɔgɔn dɛmɛ ka baara kɛ ɲɔgɔn fɛ", "Ngolo"],  # Youthful and energetic for collaboration
+    ["Hakili bɛ yɔrɔ min na, sabali bɛ yen", "Ibrahima"],  # Calm and measured for philosophical thought
+    ["Aw ni ce. Seidu bɛ aw fo wa aw ka yafa a ma, ka da a kan tuma dɔw la kow ka can.", "Amara"],  # Melodic and smooth for poetic expression
 ]
+def get_safe_examples():
+    """Get examples with speaker fallbacks for missing speakers"""
+    safe_examples = []
+    # Fallback mapping for missing speakers
+    fallback_speakers = {
+        "Amadou": "Adama",    # Warm -> Natural conversational
+        "Bakary": "Modibo",   # Authoritative -> Expressive
+        "Ngolo": "Adama",     # Youthful -> Natural conversational
+        "Ibrahima": "Seydou", # Calm -> Balanced
+        "Amara": "Moussa"     # Melodic -> Clear pronunciation
+    }
+    for text, speaker in examples:
+        # Use original speaker if available, otherwise use fallback
+        if speaker in SPEAKER_NAMES:
+            safe_examples.append([text, speaker])
+        elif speaker in fallback_speakers and fallback_speakers[speaker] in SPEAKER_NAMES:
+            safe_examples.append([text, fallback_speakers[speaker]])
+        else:
+            # Final fallback to first available speaker
+            safe_examples.append([text, SPEAKER_NAMES[0]])
+    return safe_examples
 def build_interface():
     """Build the Gradio interface - simplified like your old working version"""
             gr.Markdown("**Click any example below:**")
+            # Use safe examples with fallbacks for missing speakers
+            safe_examples = get_safe_examples()
+            for i, (text, speaker) in enumerate(safe_examples):
+                btn = gr.Button(f"{text[:30]}{'...' if len(text) > 30 else ''}", size="sm")
+                btn.click(
+                    fn=lambda t=text, s=speaker: load_example(t, s),
+                    outputs=[text_input, speaker_dropdown, use_advanced, temperature, top_k, top_p, max_tokens]
+                )
         with gr.Accordion("About", open=False):
             gr.Markdown(f"""
 def main():
     """Main function to launch the Gradio interface"""
     logger.info("Starting Bambara TTS Gradio interface.")
     interface = build_interface()
     interface.launch(
         server_name="0.0.0.0",