MusIre committed on
Commit
9802090
·
1 Parent(s): 0cb2f0c

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +2 -0
app.py CHANGED
@@ -25,6 +25,8 @@ def preprocess_audio(audio_data, sampling_rate=16_000):
25
  def transcribe_audio(audio_data):
26
  input_features = preprocess_audio(audio_data)
27
  input_values = torch.tensor(input_features["input_values"]).unsqueeze(0) # Add batch dimension
 
 
28
  predicted_ids = model.generate(input_values)
29
  transcription = processor.batch_decode(predicted_ids, skip_special_tokens=True)
30
  return transcription[0]
 
25
  def transcribe_audio(audio_data):
26
  input_features = preprocess_audio(audio_data)
27
  input_values = torch.tensor(input_features["input_values"]).unsqueeze(0) # Add batch dimension
28
+ # Reshape the tensor to match the expected shape [batch_size, num_channels, sequence_length]
29
+ input_values = input_values.permute(0, 2, 1)
30
  predicted_ids = model.generate(input_values)
31
  transcription = processor.batch_decode(predicted_ids, skip_special_tokens=True)
32
  return transcription[0]