from transformers import pipeline

# Build the speech-recognition pipeline once at import time so that every
# call to the transcription function reuses the same loaded model instead of
# reloading it per request.
asr = pipeline(
    "automatic-speech-recognition",
    model="ZeeshanGeoPk/haitian-speech-to-text",
)
def transcribe(audio):
    """Return the transcription of an audio recording.

    Args:
        audio: Input forwarded to the module-level ``asr`` pipeline. The UI
            in this file configures its audio input with ``type="filepath"``,
            so this is expected to be a path to an audio file, or ``None``
            when nothing was recorded or uploaded.

    Returns:
        The ``"text"`` entry of the pipeline result, or an empty string when
        ``audio`` is ``None``.
    """
    # A submit with no audio arrives as None; the pipeline cannot process
    # that, so answer with an empty transcript instead of raising.
    if audio is None:
        return ""
    return asr(audio)["text"]
import gradio as gr

# Wire the transcription function into a simple web UI: one audio input
# (handed to the function as a file path) and one text output, then start
# serving it.
gr.Interface(
    fn=transcribe,
    inputs=gr.Audio(type="filepath"),
    outputs="text",
).launch()