MusIre committed on
Commit
a1917fb
·
1 Parent(s): 7d6796c

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +7 -3
app.py CHANGED
@@ -6,6 +6,7 @@ subprocess.run(["pip", "install", "torchaudio", "--upgrade"])
6
  import gradio as gr
7
  from transformers import Wav2Vec2ForCTC, Wav2Vec2Processor
8
  import torchaudio
 
9
 
10
  # Load model and processor
11
  processor = Wav2Vec2Processor.from_pretrained("jonatasgrosman/wav2vec2-large-xlsr-53-italian")
@@ -14,12 +15,15 @@ model = Wav2Vec2ForCTC.from_pretrained("jonatasgrosman/wav2vec2-large-xlsr-53-it
14
  # Function to perform ASR on audio data
15
  def transcribe_audio(audio_data):
16
  print("Received audio data:", audio_data) # Debug print
17
- if audio_data is None:
18
- return "No audio data received."
19
 
20
  try:
 
 
 
21
  # Convert audio data to mono and normalize
22
- audio_data = torchaudio.transforms.Resample(audio_data[1], 16000)(audio_data[0])
23
  audio_data = torchaudio.functional.gain(audio_data, gain_db=5.0)
24
 
25
  # Apply custom preprocessing to the audio data if needed
 
6
  import gradio as gr
7
  from transformers import Wav2Vec2ForCTC, Wav2Vec2Processor
8
  import torchaudio
9
+ import torch
10
 
11
  # Load model and processor
12
  processor = Wav2Vec2Processor.from_pretrained("jonatasgrosman/wav2vec2-large-xlsr-53-italian")
 
15
  # Function to perform ASR on audio data
16
  def transcribe_audio(audio_data):
17
  print("Received audio data:", audio_data) # Debug print
18
+ if audio_data is None or len(audio_data) != 2:
19
+ return "Invalid audio data format."
20
 
21
  try:
22
+ # Extract sample rate and audio waveform from the tuple
23
+ sample_rate, waveform = audio_data
24
+
25
  # Convert audio data to mono and normalize
26
+ audio_data = torchaudio.transforms.Resample(sample_rate, 16000)(waveform)
27
  audio_data = torchaudio.functional.gain(audio_data, gain_db=5.0)
28
 
29
  # Apply custom preprocessing to the audio data if needed