Spaces:

Pragnakal
/

ok

Sleeping

Pragnakal committed on Aug 16, 2024

Commit

524b29a

verified ·

1 Parent(s): 6858fd8

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,6 +1,31 @@
 import gradio as gr
 def respond(audio_input):
     user_input = transcribe_audio(audio_input)
     text_response, output_path = generate_response(user_input)
@@ -23,7 +48,7 @@ input_audio = gr.Audio(
 gr.Interface(
     fn=respond,
     inputs=input_audio,
-    outputs="text",
     title="Tommy Vercetti Chatbot",
     description="Chat with Tommy Vercetti from GTA Vice City. Get responses in both text and voice!"
 ).launch(debug=True)

 import gradio as gr
+import speech_recognition as sr
+from pydub import AudioSegment
+# Function to transcribe audio to text
+def transcribe_audio(audio_input):
+    # Transcribe the audio referenced by `audio_input` and return the text.
+    # The two recognition errors handled below are converted into apology
+    # strings, so on those paths the caller still receives a plain string.
+    # NOTE(review): presumably `audio_input` is a file path supplied by the
+    # Gradio audio component - confirm against the `input_audio` definition.
+    recognizer = sr.Recognizer()
+    audio_file = sr.AudioFile(audio_input)
+    with audio_file as source:
+        # Capture the audio data from the opened source for recognition.
+        audio_data = recognizer.record(source)
+    try:
+        text = recognizer.recognize_google(audio_data)
+    except sr.UnknownValueError:
+        # Recognition produced no usable result; report it as text.
+        text = "Sorry, I couldn't understand the audio."
+    except sr.RequestError:
+        # The recognition request itself failed; report it as text.
+        text = "Sorry, there was a problem with the request."
+    return text
+# Function to generate a response (you'll need to implement this)
+def generate_response(user_input):
+    # Build the reply for `user_input` and return it as a
+    # (text_response, output_path) tuple.
+    # NOTE(review): nothing in this function writes audio to `output_path`;
+    # the TTS step is still a placeholder, so the file may not exist when the
+    # caller hands the path to the audio output - confirm before relying on it.
+    # Placeholder for the text response generation and TTS part
+    text_response = f"Responding as Tommy Vercetti: {user_input}"
+    # Fixed placeholder path; it is not yet derived from text_response
+    output_path = "response.wav"  # Placeholder path
+    # Implement TTS and save to output_path
+    return text_response, output_path
+# Function to process the audio input and return both text and audio response
 def respond(audio_input):
     user_input = transcribe_audio(audio_input)
     text_response, output_path = generate_response(user_input)
 gr.Interface(
     fn=respond,
     inputs=input_audio,
+    outputs=["text", "audio"],
     title="Tommy Vercetti Chatbot",
     description="Chat with Tommy Vercetti from GTA Vice City. Get responses in both text and voice!"
 ).launch(debug=True)