Spaces:

MALIBA-AI
/

BambaraText2Speech

Running

App Files Files Community

sudoping01 committed 9 days ago

Commit

0c96c25

verified ·

1 Parent(s): aa84c77

Update app.py

Browse files

Files changed (1) hide show

app.py +25 -55

app.py CHANGED Viewed

@@ -24,67 +24,38 @@ hf_token = os.getenv("HF_TOKEN")
 if hf_token:
     login(token=hf_token)
-# Global variables for model caching (like your old working version)
 _tts_model = None
 _speakers_dict = None
 _model_initialized = False
 _initialization_in_progress = False
 def get_speakers_dict():
-    """Get speakers dictionary using the correct new SDK structure"""
     try:
-        # Use the correct new structure as shown in your example
         from maliba_ai.config.settings import Speakers
-        # Try to get all 10 speakers, but handle gracefully if some don't exist
-        available_speakers = {}
-        all_speakers = {
-            "Bourama": "Bourama",
-            "Adama": "Adama",
-            "Moussa": "Moussa",
-            "Modibo": "Modibo",
-            "Seydou": "Seydou",
-            "Amadou": "Amadou",
-            "Bakary": "Bakary",
-            "Ngolo": "Ngolo",
-            "Ibrahima": "Ibrahima",
-            "Amara": "Amara"
         }
-        for name, attr_name in all_speakers.items():
-            try:
-                if hasattr(Speakers, attr_name):
-                    available_speakers[name] = getattr(Speakers, attr_name)
-            except:
-                continue
-        if available_speakers:
-            logger.info(f"Loaded {len(available_speakers)} speakers from new structure: {list(available_speakers.keys())}")
-            return available_speakers
-        else:
-            raise AttributeError("No speakers found in new structure")
     except Exception as e:
-        logger.error(f"Failed to import from new settings structure: {e}")
-        # Fallback to old structure if new one fails
-        try:
-            from maliba_ai.config.speakers import Adame, Moussa, Bourama, Modibo, Seydou, Amadou, Bakary, Ngolo, Ibrahima, Amara
-            logger.info("Using fallback old speaker structure")
-            return {
-                "Adama": Adame,
-                "Moussa": Moussa,
-                "Bourama": Bourama,
-                "Modibo": Modibo,
-                "Seydou": Seydou,
-                "Amadou": Amadou,
-                "Bakary": Bakary,
-                "Ngolo": Ngolo,
-                "Ibrahima": Ibrahima,
-                "Amara": Amara
-            }
-        except Exception as e2:
-            logger.error(f"Failed to import speakers: {e2}")
-            return {}
 @spaces.GPU()
 def initialize_model_once():
@@ -108,8 +79,8 @@ def initialize_model_once():
         logger.info("Initializing Bambara TTS model...")
         start_time = time.time()
-        # Use the new import structure from the README
-        from maliba_ai.tts import BambaraTTSInference
         model = BambaraTTSInference()
         speakers = get_speakers_dict()
@@ -288,9 +259,9 @@ def build_interface():
         gr.Markdown("""
         # 🎤 Bambara Text-to-Speech
-        **Powered by MALIBA-AI**
-        Convert Bambara text to speech using our state-of-the-art TTS model.
         **Bambara** is spoken by millions of people in Mali and West Africa.
         """)
@@ -363,7 +334,7 @@ def build_interface():
             label="Generated Speech",
             type="numpy",
             interactive=False,
-            format="wav"  # Specify WAV format to help with conversion
         )
         status_output = gr.Textbox(
@@ -437,8 +408,7 @@ def build_interface():
 def main():
     """Main function to launch the Gradio interface"""
     logger.info("Starting Bambara TTS Gradio interface.")
-    # DO NOT preload - let it initialize on first request only (like your working version)
     interface = build_interface()
     interface.launch(
         server_name="0.0.0.0",

 if hf_token:
     login(token=hf_token)
+# Global variables for model caching
 _tts_model = None
 _speakers_dict = None
 _model_initialized = False
 _initialization_in_progress = False
 def get_speakers_dict():
+    """Get speakers dictionary using the correct SDK structure"""
     try:
+        # Import the Speakers class (not individual speakers)
         from maliba_ai.config.settings import Speakers
+        # Access all 10 speakers through the Speakers class
+        speakers_dict = {
+            "Adama": Speakers.Adama,
+            "Moussa": Speakers.Moussa,
+            "Bourama": Speakers.Bourama,
+            "Modibo": Speakers.Modibo,
+            "Seydou": Speakers.Seydou,
+            "Amadou": Speakers.Amadou,
+            "Bakary": Speakers.Bakary,
+            "Ngolo": Speakers.Ngolo,
+            "Amara": Speakers.Amara,
+            "Ibrahima": Speakers.Ibrahima
         }
+        logger.info(f"🎤 Successfully loaded {len(speakers_dict)} speakers: {list(speakers_dict.keys())}")
+        return speakers_dict
     except Exception as e:
+        logger.error(f"❌ Failed to import Speakers class: {e}")
+        return {}
 @spaces.GPU()
 def initialize_model_once():
         logger.info("Initializing Bambara TTS model...")
         start_time = time.time()
+        # Use the correct import path
+        from maliba_ai.tts.inference import BambaraTTSInference
         model = BambaraTTSInference()
         speakers = get_speakers_dict()
         gr.Markdown("""
         # 🎤 Bambara Text-to-Speech
+        **Powered by MALIBA-AI** | *First Open-Source Bambara TTS*
+        Convert Bambara text to natural-sounding speech using our state-of-the-art neural TTS system.
         **Bambara** is spoken by millions of people in Mali and West Africa.
         """)
             label="Generated Speech",
             type="numpy",
             interactive=False,
+            format="wav"
         )
         status_output = gr.Textbox(
 def main():
     """Main function to launch the Gradio interface"""
     logger.info("Starting Bambara TTS Gradio interface.")
     interface = build_interface()
     interface.launch(
         server_name="0.0.0.0",