DHEIVER committed
Commit d63ff40 · verified · 1 Parent(s): 625f934

Update app.py

Files changed (1):
  1. app.py +48 -11
app.py CHANGED
@@ -130,21 +130,58 @@ def model(text, web_search):
     stream = client1.text_generation(formatted_prompt, max_new_tokens=300, stream=True, details=True, return_full_text=False)
     return "".join([response.token.text for response in stream if response.token.text != "</s>"])
 
-async def respond(audio, web_search):
+async def respond(audio, web_search, voice):
     user = transcribe(audio)
     reply = model(user, web_search)
-    communicate = edge_tts.Communicate(reply)
+    communicate = edge_tts.Communicate(reply, voice=voice)
     with tempfile.NamedTemporaryFile(delete=False, suffix=".wav") as tmp_file:
         tmp_path = tmp_file.name
     await communicate.save(tmp_path)
-    return tmp_path
-
-with gr.Blocks() as demo:
-    with gr.Row():
-        web_search = gr.Checkbox(label="Web Search", value=False)
-        input = gr.Audio(label="User Input", sources="microphone", type="filepath")
-        output = gr.Audio(label="AI", autoplay=True)
-    gr.Interface(fn=respond, inputs=[input, web_search], outputs=[output], live=True)
+    return tmp_path, user, reply
+
+# List of available voices for edge_tts
+voices = ["en-US-JennyNeural", "en-US-GuyNeural", "en-GB-SoniaNeural", "en-AU-NatashaNeural"]
+
+with gr.Blocks(theme=gr.themes.Soft()) as demo:
+    gr.Markdown("# 🎙️ **OpenGPT 4o - Advanced Voice Assistant**")
+    with gr.Tabs():
+        with gr.TabItem("Conversation"):
+            with gr.Row():
+                with gr.Column():
+                    audio_input = gr.Audio(label="🎤 Speak or Upload Audio", sources="microphone", type="filepath")
+                    web_search = gr.Checkbox(label="🔍 Enable Web Search", value=False)
+                    voice = gr.Dropdown(label="🎤 Choose Voice", choices=voices, value="en-US-JennyNeural")
+                    submit_btn = gr.Button("🚀 Submit")
+                with gr.Column():
+                    audio_output = gr.Audio(label="🤖 AI Response", autoplay=True)
+                    user_text = gr.Textbox(label="👤 You Said", interactive=False)
+                    ai_text = gr.Textbox(label="🤖 AI Response", interactive=False)
+
+        with gr.TabItem("History"):
+            history = gr.Dataframe(headers=["User Input", "AI Response"], interactive=False)
+
+        with gr.TabItem("Settings"):
+            gr.Markdown("### ⚙️ Settings")
+            max_tokens = gr.Slider(minimum=50, maximum=500, value=300, label="Max Tokens")
+            temperature = gr.Slider(minimum=0.1, maximum=1.0, value=0.7, label="Temperature")
+            gr.Markdown("Adjust the parameters to customize the AI's behavior.")
+
+    # Store conversation history
+    conversation_history = []
+
+    def update_history(user_input, ai_response):
+        conversation_history.append([user_input, ai_response])
+        return conversation_history
+
+    submit_btn.click(
+        fn=respond,
+        inputs=[audio_input, web_search, voice],
+        outputs=[audio_output, user_text, ai_text]
+    ).then(
+        fn=update_history,
+        inputs=[user_text, ai_text],
+        outputs=history
+    )
 
 if __name__ == "__main__":
-demo.queue(max_size=200).launch()
+    demo.queue(max_size=200).launch()
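
For reference, the edge_tts flow inside the new respond() can be exercised on its own. A minimal sketch, assuming edge-tts is installed (pip install edge-tts); the function name synthesize, the sample text, and the default voice are illustrative only and do not appear in app.py:

    import asyncio
    import tempfile

    import edge_tts

    async def synthesize(text: str, voice: str = "en-US-JennyNeural") -> str:
        # Communicate requests speech for `text` in the given neural voice.
        communicate = edge_tts.Communicate(text, voice=voice)
        # edge_tts emits MP3 by default; app.py saves the same bytes under a
        # .wav suffix, but .mp3 matches the actual encoding.
        with tempfile.NamedTemporaryFile(delete=False, suffix=".mp3") as tmp_file:
            tmp_path = tmp_file.name
        await communicate.save(tmp_path)  # write the synthesized audio to disk
        return tmp_path

    if __name__ == "__main__":
        path = asyncio.run(synthesize("Hello from the voice assistant."))
        print(f"Audio written to {path}")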
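The submit wiring above relies on Gradio event chaining: .click() runs respond first, and .then() runs update_history only after that callback finishes, reading the freshly populated textboxes. A self-contained sketch of the same pattern, with hypothetical component names that are not from app.py:

    import gradio as gr

    with gr.Blocks() as chain_demo:
        box = gr.Textbox(label="Input")
        step1 = gr.Textbox(label="Step 1: uppercased")
        step2 = gr.Textbox(label="Step 2: annotated")
        btn = gr.Button("Run")

        # .click() returns an event reference; .then() attaches a follow-up
        # callback that fires once the first one has completed.
        btn.click(fn=lambda s: s.upper(), inputs=box, outputs=step1).then(
            fn=lambda s: f"done: {s}", inputs=step1, outputs=step2
        )

    if __name__ == "__main__":
        chain_demo.launch()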