File size: 727 Bytes
6a81069
740beea
 
6a81069
8d444a7
 
1f036ab
6a81069
8d444a7
 
 
 
6a81069
740beea
8d444a7
 
 
 
 
 
 
6a81069
740beea
 
 
8d444a7
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
import gradio as gr
import torch
from transformers import pipeline

# Hugging Face Hub id of the wav2vec2 checkpoint used for Bulgarian speech.
_BULGARIAN_ASR_MODEL = "infinitejoy/wav2vec2-large-xls-r-300m-bulgarian"

# Build the speech-recognition pipeline once at import time so every
# request handled by the UI reuses the same loaded model.
asr_pipeline = pipeline(
    task="automatic-speech-recognition",
    model=_BULGARIAN_ASR_MODEL,
)


# ASR conversion function (speech-to-text conversion)
def asr_generate(audio):
    """Transcribe an audio clip to text with the module-level ASR pipeline.

    Args:
        audio: The value handed over by the Gradio ``Audio`` input. With
            ``type="filepath"`` this is a path to the recorded file, or
            ``None`` when the user submits without recording anything.

    Returns:
        The ``"text"`` entry of the pipeline result, or an empty string
        when no audio was provided.
    """
    # Nothing was recorded: return an empty transcription instead of
    # forwarding None to the pipeline and surfacing a traceback in the UI.
    if audio is None:
        return ""
    return asr_pipeline(audio)["text"]

# Create the Gradio interface.
# The audio input is microphone-only and is delivered to the callback as a
# file path, so the description must not promise an upload option.
# NOTE(review): `source=` is the Gradio 3.x spelling; newer releases use
# `sources=[...]` — confirm against the pinned Gradio version before upgrading.
iface = gr.Interface(
    fn=asr_generate,
    inputs=gr.Audio(source="microphone", type="filepath"),
    outputs="text",
    title="Bulgarian Speech Recognition",
    description="Record audio in Bulgarian to get the transcription.",
)

# Run the interface: launch the Gradio app only when this file is executed
# directly as a script, not when it is imported as a module.
if __name__ == "__main__":
    iface.launch()