Update app.py
Browse files
app.py
CHANGED
@@ -27,7 +27,7 @@ huggingface_token = os.environ["huggingface_token"]
|
|
27 |
model = WhisperModel.from_pretrained("mskov/whisper_miso", use_auth_token=huggingface_token)
|
28 |
feature_extractor = AutoFeatureExtractor.from_pretrained("mskov/whisper_miso", use_auth_token=huggingface_token)
|
29 |
ds = load_dataset("mskov/ESC50", split="test")
|
30 |
-
inputs = feature_extractor(ds[0]["audio"]["
|
31 |
input_features = inputs.input_features
|
32 |
decoder_input_ids = torch.tensor([[1, 1]]) * model.config.decoder_start_token_id
|
33 |
last_hidden_state = model(input_features, decoder_input_ids=decoder_input_ids).last_hidden_state
|
|
|
27 |
model = WhisperModel.from_pretrained("mskov/whisper_miso", use_auth_token=huggingface_token)
|
28 |
feature_extractor = AutoFeatureExtractor.from_pretrained("mskov/whisper_miso", use_auth_token=huggingface_token)
|
29 |
ds = load_dataset("mskov/ESC50", split="test")
|
30 |
+
# Pass the decoded waveform samples ("array") to the feature extractor, not a
# "file" entry: the extractor consumes raw audio samples, and a decoded
# `datasets` Audio item exposes "path", "array" and "sampling_rate".
# NOTE(review): Whisper feature extractors typically expect 16 kHz input;
# confirm this dataset's sampling rate (resample if needed) before relying on it.
inputs = feature_extractor(ds[0]["audio"]["array"], return_tensors="pt")
|
31 |
input_features = inputs.input_features
|
32 |
decoder_input_ids = torch.tensor([[1, 1]]) * model.config.decoder_start_token_id
|
33 |
last_hidden_state = model(input_features, decoder_input_ids=decoder_input_ids).last_hidden_state
|