MusIre committed on
Commit
95dcc38
·
1 Parent(s): eb4d23a

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +6 -4
app.py CHANGED
@@ -5,7 +5,6 @@ subprocess.run(["pip", "install", "gradio", "--upgrade"])
5
  subprocess.run(["pip", "install", "datasets"])
6
  subprocess.run(["pip", "install", "transformers"])
7
  subprocess.run(["pip", "install", "torch", "torchvision", "torchaudio", "-f", "https://download.pytorch.org/whl/torch_stable.html"])
8
-
9
  import gradio as gr
10
  from transformers import WhisperProcessor, WhisperForConditionalGeneration
11
 
@@ -22,10 +21,13 @@ def preprocess_audio(audio_data):
22
  return processed_data
23
 
24
  # Function to perform ASR on audio data
25
- def transcribe_audio(input_features):
 
 
 
26
  # Generate token ids
27
- predicted_ids = model.generate(**input_features)
28
-
29
  # Decode token ids to text
30
  transcription = processor.batch_decode(predicted_ids, skip_special_tokens=True)
31
 
 
5
  subprocess.run(["pip", "install", "datasets"])
6
  subprocess.run(["pip", "install", "transformers"])
7
  subprocess.run(["pip", "install", "torch", "torchvision", "torchaudio", "-f", "https://download.pytorch.org/whl/torch_stable.html"])
 
8
  import gradio as gr
9
  from transformers import WhisperProcessor, WhisperForConditionalGeneration
10
 
 
21
  return processed_data
22
 
23
  # Function to perform ASR on audio data
24
+ def transcribe_audio(audio_data):
25
+ # Preprocess the audio data
26
+ input_features = preprocess_audio(audio_data)
27
+
28
  # Generate token ids
29
+ predicted_ids = model.generate(input_features)
30
+
31
  # Decode token ids to text
32
  transcription = processor.batch_decode(predicted_ids, skip_special_tokens=True)
33