Spaces:

Kvikontent
/

text2speech

Runtime error

Kvikontent committed on Oct 8, 2023

Commit

78f9221

1 Parent(s): 4151c7e

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,13 +1,21 @@
 import gradio as gr
-from transformers import pipeline
-# Load the text-to-speech pipeline from Hugging Face
-pipe = pipeline("text2speech", model="suno/bark-small")
 # Define the Gradio interface
 def text_to_speech(text):
-    # Generate speech from the input text using the loaded pipeline
-    speech = pipe(text)[0]["speech"]
     return speech
@@ -17,4 +25,4 @@ iface = gr.Interface(fn=text_to_speech, inputs="text", outputs="audio",
                      description="Enter text to hear the speech")
 # Launch the Gradio interface
-iface.launch()

 import gradio as gr
+from transformers import AutoModelForCausalLM, AutoTokenizer
+# Load the model and tokenizer
+model_name = "suno/bark-small"
+tokenizer = AutoTokenizer.from_pretrained(model_name)
+model = AutoModelForCausalLM.from_pretrained(model_name)
 # Define the Gradio interface
 def text_to_speech(text):
+    # Tokenize the input text
+    inputs = tokenizer.encode(text, return_tensors="pt")
+    # Generate speech from the input text using the loaded model
+    outputs = model.generate(inputs)
+    # Convert the generated speech tensor to audio format
+    speech = gradio.inputs.Audio(outputs)
     return speech
                      description="Enter text to hear the speech")
 # Launch the Gradio interface
+iface.launch()