Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
@@ -14,13 +14,9 @@ model = Wav2Vec2ForCTC.from_pretrained("jonatasgrosman/wav2vec2-large-xlsr-53-it
|
|
14 |
# Function to perform ASR on audio data
|
15 |
def transcribe_audio(audio_data):
|
16 |
# Convert audio data to mono and normalize
|
17 |
-
audio_data = torchaudio.transforms.
|
18 |
audio_data = torchaudio.functional.gain(audio_data, gain_db=5.0)
|
19 |
|
20 |
-
# Resample if needed (Wav2Vec2 model requires 16 kHz sampling rate)
|
21 |
-
if audio_data[1] != 16000:
|
22 |
-
audio_data = torchaudio.transforms.Resample(audio_data[1], 16000)(audio_data[0])
|
23 |
-
|
24 |
# Apply custom preprocessing to the audio data if needed
|
25 |
input_values = processor(audio_data[0].numpy(), return_tensors="pt").input_values
|
26 |
|
|
|
14 |
# Function to perform ASR on audio data
|
15 |
def transcribe_audio(audio_data):
|
16 |
# Convert audio data to mono and normalize
|
17 |
+
audio_data = torchaudio.transforms.Resample(audio_data[1], 16000)(audio_data[0])
|
18 |
audio_data = torchaudio.functional.gain(audio_data, gain_db=5.0)
|
19 |
|
|
|
|
|
|
|
|
|
20 |
# Apply custom preprocessing to the audio data if needed
|
21 |
input_values = processor(audio_data[0].numpy(), return_tensors="pt").input_values
|
22 |
|