MusIre committed on
Commit
3a161de
·
1 Parent(s): 9802090

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +2 -1
app.py CHANGED
@@ -25,7 +25,8 @@ def preprocess_audio(audio_data, sampling_rate=16_000):
25
  def transcribe_audio(audio_data):
26
  input_features = preprocess_audio(audio_data)
27
  input_values = torch.tensor(input_features["input_values"]).unsqueeze(0) # Add batch dimension
28
- # Reshape the tensor to match the expected shape [batch_size, num_channels, sequence_length]
 
29
  input_values = input_values.permute(0, 2, 1)
30
  predicted_ids = model.generate(input_values)
31
  transcription = processor.batch_decode(predicted_ids, skip_special_tokens=True)
 
25
  def transcribe_audio(audio_data):
26
  input_features = preprocess_audio(audio_data)
27
  input_values = torch.tensor(input_features["input_values"]).unsqueeze(0) # Add batch dimension
28
+ # Ensure the input tensor has the correct shape
29
+ input_values = input_values.view(1, -1, 1)
30
  input_values = input_values.permute(0, 2, 1)
31
  predicted_ids = model.generate(input_values)
32
  transcription = processor.batch_decode(predicted_ids, skip_special_tokens=True)