"""Gradio text-to-speech demo backed by the Suno Bark model."""

import gradio as gr
from transformers import AutoProcessor, BarkModel

# Load the checkpoint once at start-up so every request reuses the same
# weights. Bark is not a causal-LM checkpoint: it needs its own model class
# and a processor that prepares the text prompt in the format Bark expects.
model_name = "suno/bark-small"
processor = AutoProcessor.from_pretrained(model_name)
model = BarkModel.from_pretrained(model_name)


def text_to_speech(text):
    """Synthesize speech for *text* with the loaded Bark model.

    Args:
        text: The sentence(s) to speak.

    Returns:
        A ``(sample_rate, samples)`` tuple, the format Gradio's ``"audio"``
        output accepts, where ``samples`` is a 1-D NumPy waveform. Returns
        ``None`` (no audio) when *text* is empty or only whitespace.
    """
    # Nothing to synthesize; avoid running the model on an empty prompt.
    if not text or not text.strip():
        return None

    # The processor tokenizes the prompt and builds the attention mask.
    inputs = processor(text, return_tensors="pt")

    # Bark generates the audio waveform directly as a (batch, samples) tensor.
    waveform = model.generate(**inputs)

    # Gradio wants a NumPy array, so move to CPU and drop the batch dimension.
    samples = waveform.cpu().numpy().squeeze()

    # The sample rate is defined by the checkpoint's generation config.
    return model.generation_config.sample_rate, samples


# Create the Gradio interface
iface = gr.Interface(
    fn=text_to_speech,
    inputs="text",
    outputs="audio",
    title="Text-to-Speech App",
    description="Enter text to hear the speech",
)

# Launch the Gradio interface
iface.launch()