Futuresony committed
Commit 179f501 (verified)
1 Parent(s): a2f2a2c

Update app.py

Files changed (1)
  1. app.py +3 -6
app.py CHANGED
@@ -1,8 +1,8 @@
 import gradio as gr
 from huggingface_hub import InferenceClient
-import soundfile as sf
 import torch
 from transformers import pipeline
+from datasets import load_dataset
 
 # Set up your TTS model (as before)
 synthesiser = pipeline("text-to-speech", "Futuresony/output")
@@ -49,11 +49,8 @@ def respond(
     # Generate speech from the text response
     speech = synthesiser(response, forward_params={"speaker_embeddings": speaker_embedding})
 
-    # Save the speech to a file (you can play it on the fly or return it in other formats like MP3)
-    sf.write("generated_speech.wav", speech["audio"], samplerate=speech["sampling_rate"])
-
-    return response, "generated_speech.wav"
-    # You can return the text along with speech if needed
+    # Return the audio as a Gradio audio component
+    return response, speech["audio"]
 
 
 # Create the Gradio interface
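
For context, a minimal sketch of how the pieces touched by this diff could fit together. The new import of load_dataset is typically used to fetch a speaker x-vector for a SpeechT5-style text-to-speech pipeline; the dataset name and index below are assumptions, since the code that builds speaker_embedding is outside these hunks. Likewise, the audio array returned by the pipeline can be handed to a gr.Audio output, commonly as a (sampling_rate, array) tuple, which is what removing the soundfile round-trip relies on. This is a sketch under those assumptions, not the full app.py.

# Sketch only: wiring assumed from the diff, not taken from the rest of app.py.
import gradio as gr
import torch
from datasets import load_dataset
from transformers import pipeline

# TTS pipeline as in the diff.
synthesiser = pipeline("text-to-speech", "Futuresony/output")

# Assumed source of speaker_embedding: a CMU Arctic x-vector, the usual
# companion dataset for SpeechT5 voices (index 7306 is one arbitrary speaker).
embeddings_dataset = load_dataset("Matthijs/cmu-arctic-xvectors", split="validation")
speaker_embedding = torch.tensor(embeddings_dataset[7306]["xvector"]).unsqueeze(0)

def respond(message: str):
    # The text-to-speech pipeline returns {"audio": np.ndarray, "sampling_rate": int}.
    speech = synthesiser(message, forward_params={"speaker_embeddings": speaker_embedding})
    # gr.Audio accepts in-memory audio as a (sampling_rate, array) tuple,
    # so no intermediate WAV file is needed.
    return message, (speech["sampling_rate"], speech["audio"])

demo = gr.Interface(
    fn=respond,
    inputs=gr.Textbox(label="Message"),
    outputs=[gr.Textbox(label="Response"), gr.Audio(label="Generated speech")],
)

if __name__ == "__main__":
    demo.launch()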