bgtts / app.py
englissi's picture
Update app.py
8d444a7 verified
raw
history blame
727 Bytes
import gradio as gr
import torch
from transformers import pipeline
# Initialize the ASR pipeline for Bulgarian
# Built once at module import so the loaded model is shared by all calls.
asr_pipeline = pipeline(
    task="automatic-speech-recognition",
    model="infinitejoy/wav2vec2-large-xls-r-300m-bulgarian",
)
# ASR conversion function (speech-to-text conversion)
def asr_generate(audio):
    """Transcribe an audio recording to text with the module-level ASR pipeline.

    Args:
        audio: The audio input forwarded to ``asr_pipeline``. The Gradio
            interface in this file supplies it as a file path
            (``type="filepath"``). May be ``None`` when the user submits
            without recording anything.

    Returns:
        The ``"text"`` field of the pipeline result, or an empty string when
        no audio was provided.
    """
    # Guard against an empty submission: passing None to the pipeline would
    # raise instead of producing a transcription.
    if audio is None:
        return ""
    return asr_pipeline(audio)["text"]
# Create the Gradio interface
# NOTE(review): `source="microphone"` is the Gradio 3.x spelling; Gradio 4+
# renamed this parameter to `sources` (a list). Confirm the pinned Gradio
# version before upgrading.
iface = gr.Interface(
    fn=asr_generate,
    # Microphone recording only; the recording reaches `fn` as a file path.
    inputs=gr.Audio(source="microphone", type="filepath"),
    outputs="text",
    title="Bulgarian Speech Recognition",
    # The input above does not accept uploads, so the description must not
    # advertise them.
    description="Record audio in Bulgarian to get the transcription.",
)
# μΈν„°νŽ˜μ΄μŠ€ μ‹€ν–‰
if __name__ == "__main__":
    # Start the web UI only when run as a script, not when imported.
    iface.launch()