Spaces:

milwright
/

speech-buddy

Sleeping

App Files Files Community

milwright committed on 4 days ago

Commit

71a2826

verified ·

1 Parent(s): 65c037b

Update app.py

Browse files

Files changed (1) hide show

app.py +5 -151

app.py CHANGED Viewed

@@ -9,16 +9,6 @@ from datetime import datetime
 import urllib.parse
 from pathlib import Path
 from typing import List, Dict, Optional, Any, Tuple
-import base64
-import io
-# Try to import gradio_client for TTS support
-try:
-    from gradio_client import Client
-    GRADIO_CLIENT_AVAILABLE = True
-except ImportError:
-    GRADIO_CLIENT_AVAILABLE = False
-    print("Warning: gradio_client not available. TTS features will be disabled.")
 # Configuration
@@ -32,7 +22,7 @@ DEFAULT_CONFIG = {
     'system_prompt': "You are Domenico from Sicily, a Juventus football fan, native Italian speaker serving as a conversational partner for university students in an Italian 101 class. Students will interact and converse with you in Italian, and you must respond EXCLUSIVELY IN ITALIAN without providing English translations, using vocabulary appropriate for beginner-level Italian 101 students. Focus your responses on topics suitable for beginners such as sports, daily life, routines, food, numbers, and hobbies. When students make errors, model the correct forms naturally in your response without explicitly pointing out mistakes, allowing them to learn through exposure to proper usage. Recognize when students demonstrate more advanced abilities and adjust your language complexity accordingly, while ensuring your Italian remains error-free. Keep all responses between 5-50 words, making sure sentences are grammatically complete. Limit all verb conjugations to the present tense only, avoiding all other verb forms and tenses. Address students using the informal second-person singular 'tu' form.",
     'temperature': 0.5,
     'max_tokens': 250,
-    'model': 'google/gemma-3-27b-it',
     'api_key_var': 'API_KEY',
     'theme': 'Default',
     'grounding_urls': ["https://www.pnac.org/wp-content/uploads/Italian-Study-Guide.pdf"],
@@ -40,8 +30,6 @@ DEFAULT_CONFIG = {
     'enable_file_upload': True,
     'examples': ['Ciao! Come stai oggi?', 'Mi piace giocare a calcio. E tu?', 'Cosa mangi di solito a colazione?', 'A che ora ti svegli la mattina?', 'Qual è il tuo sport preferito?'],
     'language': 'Italian',
-    'enable_tts': False,
-    'tts_spaces': ['facebook/mms-tts-eng', 'microsoft/speecht5-tts-demo'],
     'locked': False
 }
@@ -294,80 +282,6 @@ def process_file_upload(file_path: str) -> str:
 _url_content_cache = {}
-def generate_tts(text: str, hf_token: Optional[str] = None) -> Optional[Tuple[int, Any]]:
-    """
-    Generate text-to-speech audio using HuggingFace Spaces via gradio_client.
-    Uses multiple fallback options for maximum reliability.
-    Returns: Tuple of (sample_rate, audio_array) or None if failed
-    """
-    if not GRADIO_CLIENT_AVAILABLE:
-        return None
-    if not text or not text.strip():
-        return None
-    # Get HF token from environment if not provided
-    if not hf_token:
-        hf_token = os.getenv("HF_TOKEN")
-    # Get TTS spaces from config
-    tts_spaces = DEFAULT_CONFIG.get('tts_spaces', [])
-    if not tts_spaces:
-        # Default fallback spaces if none configured
-        tts_spaces = [
-            "facebook/mms-tts-eng",
-            "microsoft/speecht5-tts-demo",
-            "coqui/XTTS",
-            "myshell-ai/OpenVoice"
-        ]
-    # Limit text length for TTS
-    max_text_length = 500
-    if len(text) > max_text_length:
-        text = text[:max_text_length] + "..."
-    # Try each TTS space in order
-    for space_name in tts_spaces:
-        try:
-            print(f"Trying TTS space: {space_name}")
-            client = Client(space_name, hf_token=hf_token)
-            # Different spaces have different APIs, try common patterns
-            try:
-                # Pattern 1: Simple text input
-                result = client.predict(text, api_name="/predict")
-            except:
-                try:
-                    # Pattern 2: Text + language
-                    result = client.predict(text, "en", api_name="/predict")
-                except:
-                    try:
-                        # Pattern 3: Text + voice/speaker
-                        result = client.predict(text, "default", api_name="/predict")
-                    except:
-                        continue
-            # Handle different return types
-            if isinstance(result, str) and os.path.exists(result):
-                # Result is a file path
-                import soundfile as sf
-                audio_data, sample_rate = sf.read(result)
-                return (sample_rate, audio_data)
-            elif isinstance(result, tuple) and len(result) >= 2:
-                # Result is (sample_rate, audio_array)
-                return result
-            elif hasattr(result, 'get') and 'audio' in result:
-                # Result is a dict with audio key
-                return result['audio']
-        except Exception as e:
-            print(f"TTS failed with {space_name}: {str(e)}")
-            continue
-    return None
 def get_grounding_context() -> str:
     """Get grounding context from configured URLs with caching"""
     urls = GROUNDING_URLS
@@ -556,11 +470,8 @@ Get your API key at: https://openrouter.ai/keys"""
         )
         if response.status_code == 200:
-            try:
-                result = response.json()
-                ai_response = result['choices'][0]['message']['content']
-            except (json.JSONDecodeError, KeyError) as e:
-                return f"❌ Error parsing API response: {str(e)}"
             # Add file notification if files were uploaded
             if file_notification:
@@ -568,11 +479,8 @@ Get your API key at: https://openrouter.ai/keys"""
             return ai_response
         else:
-            try:
-                error_data = response.json()
-                error_message = error_data.get('error', {}).get('message', 'Unknown error')
-            except:
-                error_message = response.text if response.text else 'Unknown error'
             return f"❌ API Error ({response.status_code}): {error_message}"
     except requests.exceptions.Timeout:
@@ -610,7 +518,6 @@ def verify_hf_token_access() -> Tuple[bool, str]:
         return False, f"Error verifying HF token: {str(e)}"
 # Create main interface with clean tab structure
 def create_interface():
     """Create the Gradio interface with clean tab structure"""
@@ -683,19 +590,6 @@ def create_interface():
                             size="sm"
                         )
-                    # TTS functionality
-                    if DEFAULT_CONFIG.get('enable_tts', False) and GRADIO_CLIENT_AVAILABLE:
-                        with gr.Row():
-                            tts_btn = gr.Button("🔊 Read Last Response", variant="secondary", size="sm")
-                            tts_status = gr.Textbox(label="TTS Status", visible=False, interactive=False)
-                        audio_output = gr.Audio(
-                            label="TTS Output",
-                            visible=False,
-                            autoplay=True,
-                            type="numpy"
-                        )
                     # Export handler
                     def prepare_export():
                         if not chat_history_store:
@@ -719,46 +613,6 @@ def create_interface():
                         outputs=[export_btn]
                     )
-                    # TTS handler
-                    if DEFAULT_CONFIG.get('enable_tts', False) and GRADIO_CLIENT_AVAILABLE:
-                        def handle_tts(chat_history):
-                            """Generate TTS for the last assistant message"""
-                            if not chat_history:
-                                return None, gr.update(value="No messages to read", visible=True)
-                            # Find last assistant message
-                            last_assistant_msg = None
-                            for msg in reversed(chat_history):
-                                if msg.get("role") == "assistant":
-                                    last_assistant_msg = msg.get("content", "")
-                                    break
-                            if not last_assistant_msg:
-                                return None, gr.update(value="No assistant message found", visible=True)
-                            # Update status
-                            status_msg = "🎯 Generating audio..."
-                            # Generate TTS
-                            audio_result = generate_tts(last_assistant_msg)
-                            if audio_result:
-                                return (
-                                    gr.update(value=audio_result, visible=True),
-                                    gr.update(value="✅ Audio generated successfully", visible=True)
-                                )
-                            else:
-                                return (
-                                    None,
-                                    gr.update(value="❌ TTS generation failed", visible=True)
-                                )
-                        tts_btn.click(
-                            handle_tts,
-                            inputs=[chatbot],
-                            outputs=[audio_output, tts_status]
-                        )
                     # Examples section
                     if examples:
                         gr.Examples(examples=examples, inputs=msg)

 import urllib.parse
 from pathlib import Path
 from typing import List, Dict, Optional, Any, Tuple
 # Configuration
     'system_prompt': "You are Domenico from Sicily, a Juventus football fan, native Italian speaker serving as a conversational partner for university students in an Italian 101 class. Students will interact and converse with you in Italian, and you must respond EXCLUSIVELY IN ITALIAN without providing English translations, using vocabulary appropriate for beginner-level Italian 101 students. Focus your responses on topics suitable for beginners such as sports, daily life, routines, food, numbers, and hobbies. When students make errors, model the correct forms naturally in your response without explicitly pointing out mistakes, allowing them to learn through exposure to proper usage. Recognize when students demonstrate more advanced abilities and adjust your language complexity accordingly, while ensuring your Italian remains error-free. Keep all responses between 5-50 words, making sure sentences are grammatically complete. Limit all verb conjugations to the present tense only, avoiding all other verb forms and tenses. Address students using the informal second-person singular 'tu' form.",
     'temperature': 0.5,
     'max_tokens': 250,
+    'model': 'openai/gpt-oss-120b',
     'api_key_var': 'API_KEY',
     'theme': 'Default',
     'grounding_urls': ["https://www.pnac.org/wp-content/uploads/Italian-Study-Guide.pdf"],
     'enable_file_upload': True,
     'examples': ['Ciao! Come stai oggi?', 'Mi piace giocare a calcio. E tu?', 'Cosa mangi di solito a colazione?', 'A che ora ti svegli la mattina?', 'Qual è il tuo sport preferito?'],
     'language': 'Italian',
     'locked': False
 }
 _url_content_cache = {}
 def get_grounding_context() -> str:
     """Get grounding context from configured URLs with caching"""
     urls = GROUNDING_URLS
         )
         if response.status_code == 200:
+            result = response.json()
+            ai_response = result['choices'][0]['message']['content']
             # Add file notification if files were uploaded
             if file_notification:
             return ai_response
         else:
+            error_data = response.json()
+            error_message = error_data.get('error', {}).get('message', 'Unknown error')
             return f"❌ API Error ({response.status_code}): {error_message}"
     except requests.exceptions.Timeout:
         return False, f"Error verifying HF token: {str(e)}"
 # Create main interface with clean tab structure
 def create_interface():
     """Create the Gradio interface with clean tab structure"""
                             size="sm"
                         )
                     # Export handler
                     def prepare_export():
                         if not chat_history_store:
                         outputs=[export_btn]
                     )
                     # Examples section
                     if examples:
                         gr.Examples(examples=examples, inputs=msg)