Spaces:

MALIBA-AI
/

BambaraText2Speech

Running on Zero

App Files Community

sudoping01 committed 8 days ago

Commit

61df640

verified ·

1 Parent(s): e886350

Update app.py

Browse files

Files changed (1) hide show

app.py +27 -9

app.py CHANGED Viewed

@@ -31,9 +31,9 @@ _model_initialized = False
 _initialization_in_progress = False
 def get_speakers_dict():
-    """Get speakers dictionary using the correct import structure"""
     try:
-        # Try new structure first
         from maliba_ai.config.settings import Speakers
         return {
             "Adama": Speakers.Adama,
@@ -48,8 +48,8 @@ def get_speakers_dict():
             "Amara": Speakers.Amara
         }
     except Exception as e:
-        logger.error(f"Failed to import from settings: {e}")
-        # Fallback to old structure (like your working version)
         try:
             from maliba_ai.config.speakers import Adame, Moussa, Bourama, Modibo, Seydou
             return {
@@ -85,7 +85,7 @@ def initialize_model_once():
         logger.info("Initializing Bambara TTS model...")
         start_time = time.time()
-        # Use the same import as your old working version
         from maliba_ai.tts.inference import BambaraTTSInference
         model = BambaraTTSInference()
@@ -174,12 +174,18 @@ def generate_speech(text, speaker_name, use_advanced, temperature, top_k, top_p,
         logger.error(f"Speech generation failed: {e}")
         return None, f"❌ Error: {str(e)}"
-# Use available speakers (try to get 10, fallback to 5)
 def get_speaker_names():
     speakers = get_speakers_dict()
-    if speakers:
         return list(speakers.keys())
-    return ["Adama", "Moussa", "Bourama", "Modibo", "Seydou"]
 SPEAKER_NAMES = get_speaker_names()
@@ -224,7 +230,7 @@ def build_interface():
                     choices=SPEAKER_NAMES,
                     value="Bourama" if "Bourama" in SPEAKER_NAMES else SPEAKER_NAMES[0],
                     label="🗣️ Speaker Voice",
-                    info=f"Choose from {len(SPEAKER_NAMES)} authentic voices"
                 )
                 generate_btn = gr.Button("🎵 Generate Speech", variant="primary", size="lg")
@@ -313,6 +319,18 @@ def build_interface():
             ### 🎭 Available Speakers:
             {', '.join(SPEAKER_NAMES)}
             **License**: Creative Commons Attribution-NonCommercial-ShareAlike 4.0 (CC BY-NC-SA 4.0)
             ---

 _initialization_in_progress = False
 def get_speakers_dict():
+    """Get speakers dictionary using the new SDK structure"""
     try:
+        # Use new structure from maliba_ai.config.settings (as shown in README)
         from maliba_ai.config.settings import Speakers
         return {
             "Adama": Speakers.Adama,
             "Amara": Speakers.Amara
         }
     except Exception as e:
+        logger.error(f"Failed to import from new settings structure: {e}")
+        # Fallback to old structure if new one fails
         try:
             from maliba_ai.config.speakers import Adame, Moussa, Bourama, Modibo, Seydou
             return {
         logger.info("Initializing Bambara TTS model...")
         start_time = time.time()
+        # Use the new import structure from the README
         from maliba_ai.tts.inference import BambaraTTSInference
         model = BambaraTTSInference()
         logger.error(f"Speech generation failed: {e}")
         return None, f"❌ Error: {str(e)}"
+# Use available speakers (prioritize new SDK structure with 10 speakers)
 def get_speaker_names():
     speakers = get_speakers_dict()
+    if speakers and len(speakers) >= 10:
+        # New SDK with all 10 speakers
+        return ["Bourama", "Adama", "Moussa", "Modibo", "Seydou", "Amadou", "Bakary", "Ngolo", "Ibrahima", "Amara"]
+    elif speakers:
+        # Return whatever speakers are available
         return list(speakers.keys())
+    else:
+        # Fallback to old 5 speakers
+        return ["Adama", "Moussa", "Bourama", "Modibo", "Seydou"]
 SPEAKER_NAMES = get_speaker_names()
                     choices=SPEAKER_NAMES,
                     value="Bourama" if "Bourama" in SPEAKER_NAMES else SPEAKER_NAMES[0],
                     label="🗣️ Speaker Voice",
+                    info=f"Choose from {len(SPEAKER_NAMES)} authentic voices (Bourama recommended)"
                 )
                 generate_btn = gr.Button("🎵 Generate Speech", variant="primary", size="lg")
             ### 🎭 Available Speakers:
             {', '.join(SPEAKER_NAMES)}
+            ### 🎯 Speaker Characteristics:
+            - **Bourama**: Most stable and accurate (recommended)
+            - **Adama**: Natural conversational tone
+            - **Moussa**: Clear pronunciation for educational content
+            - **Modibo**: Expressive delivery for storytelling
+            - **Seydou**: Balanced characteristics for general use
+            - **Amadou**: Warm and friendly voice
+            - **Bakary**: Deep, authoritative tone
+            - **Ngolo**: Youthful and energetic
+            - **Ibrahima**: Calm and measured delivery
+            - **Amara**: Melodic and smooth
             **License**: Creative Commons Attribution-NonCommercial-ShareAlike 4.0 (CC BY-NC-SA 4.0)
             ---