jguerrisi committed on
Commit
4dbbe1d
·
verified ·
1 Parent(s): 4f7f1fc

Update model.py

Browse files
Files changed (1) hide show
  1. model.py +21 -0
model.py CHANGED
@@ -2071,6 +2071,7 @@ multi_lingual_models = {
2071
  "csukuangfj/sherpa-onnx-dolphin-base-ctc-multi-lang-2025-04-02": _get_dolphin_ctc_models,
2072
  "csukuangfj/sherpa-onnx-dolphin-small-ctc-multi-lang-2025-04-02": _get_dolphin_ctc_models,
2073
  "csukuangfj/sherpa-onnx-nemo-canary-180m-flash-en-es-de-fr-int8": _get_dolphin_ctc_models
 
2074
  }
2075
 
2076
  chinese_english_mixed_models = {
@@ -2195,3 +2196,23 @@ language_to_models = {
2195
  "Tibetan": list(tibetan_models.keys()),
2196
  "Vietnamese": list(vietnamese_models.keys()),
2197
  }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2071
  "csukuangfj/sherpa-onnx-dolphin-base-ctc-multi-lang-2025-04-02": _get_dolphin_ctc_models,
2072
  "csukuangfj/sherpa-onnx-dolphin-small-ctc-multi-lang-2025-04-02": _get_dolphin_ctc_models,
2073
  "csukuangfj/sherpa-onnx-nemo-canary-180m-flash-en-es-de-fr-int8": _get_dolphin_ctc_models
2074
+ "csukuangfj/sherpa-onnx-nemo-canary-180m-flash-en-es-de-fr-int8": _get_nemo_ctc_models,
2075
  }
2076
 
2077
  chinese_english_mixed_models = {
 
2196
  "Tibetan": list(tibetan_models.keys()),
2197
  "Vietnamese": list(vietnamese_models.keys()),
2198
  }
2199
+
2200
@lru_cache(maxsize=10)
def _get_nemo_ctc_models(repo_id: str, decoding_method: str, num_active_paths: int):
    """Build an offline NeMo CTC recognizer from the files in ``repo_id``.

    Args:
      repo_id: Identifier handed to the download helpers; ``model.int8.onnx``
        and ``tokens.txt`` are both looked up with ``subfolder="."``.
      decoding_method: Not used by this loader. It is still part of the
        ``lru_cache`` key, so distinct values create distinct cache entries.
      num_active_paths: Not used by this loader. It is still part of the
        ``lru_cache`` key, so distinct values create distinct cache entries.

    Returns:
      The recognizer created by
      ``sherpa_onnx.OfflineRecognizer.from_nemo_ctc``.
    """
    nn_model = _get_nn_model_filename(
        repo_id=repo_id,
        filename="model.int8.onnx",
        subfolder=".",
    )
    tokens = _get_token_filename(
        repo_id=repo_id,
        filename="tokens.txt",
        subfolder=".",
    )

    # NOTE(review): this call used to pass ``language="es"`` to force Spanish,
    # but ``from_nemo_ctc`` has no ``language`` keyword, so it raised
    # ``TypeError`` before any recognizer was built. The keyword is dropped.
    # If the output language must be forced for a Canary (encoder/decoder)
    # model, that presumably requires the Canary-specific factory
    # (``from_nemo_canary`` with ``src_lang``/``tgt_lang``) -- TODO confirm.
    recognizer = sherpa_onnx.OfflineRecognizer.from_nemo_ctc(
        tokens=tokens,
        model=nn_model,
        num_threads=2,
    )
    return recognizer