File size: 804 Bytes
df165b9
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
import gradio as gr
from transformers import AutoModelForTextToSpeech, AutoTokenizer
import torch

# Load the model and tokenizer
model = AutoModelForTextToSpeech.from_pretrained("parler-tts/parler_tts")
tokenizer = AutoTokenizer.from_pretrained("parler-tts/parler_tts")

# Define the TTS function
def text_to_speech(text):
    inputs = tokenizer(text, return_tensors="pt")
    speech = model.generate(**inputs)
    
    # Convert to an audio format, e.g., 16kHz waveform
    audio = speech[0].cpu().detach().numpy()
    return 16000, audio  # Sample rate, waveform

# Gradio interface
interface = gr.Interface(
    fn=text_to_speech,
    inputs="text",
    outputs="audio",
    title="Text to Speech",
    description="Convert text to speech using the parler-tts/parler_tts model"
)

interface.launch()