Update model.py
Browse files
model.py
CHANGED
@@ -2071,6 +2071,7 @@ multi_lingual_models = {
|
|
2071 |
"csukuangfj/sherpa-onnx-dolphin-base-ctc-multi-lang-2025-04-02": _get_dolphin_ctc_models,
|
2072 |
"csukuangfj/sherpa-onnx-dolphin-small-ctc-multi-lang-2025-04-02": _get_dolphin_ctc_models,
|
2073 |
"csukuangfj/sherpa-onnx-nemo-canary-180m-flash-en-es-de-fr-int8": _get_dolphin_ctc_models
|
|
|
2074 |
}
|
2075 |
|
2076 |
chinese_english_mixed_models = {
|
@@ -2195,3 +2196,23 @@ language_to_models = {
|
|
2195 |
"Tibetan": list(tibetan_models.keys()),
|
2196 |
"Vietnamese": list(vietnamese_models.keys()),
|
2197 |
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
2071 |
"csukuangfj/sherpa-onnx-dolphin-base-ctc-multi-lang-2025-04-02": _get_dolphin_ctc_models,
|
2072 |
"csukuangfj/sherpa-onnx-dolphin-small-ctc-multi-lang-2025-04-02": _get_dolphin_ctc_models,
|
2073 |
"csukuangfj/sherpa-onnx-nemo-canary-180m-flash-en-es-de-fr-int8": _get_dolphin_ctc_models
|
2074 |
+
"csukuangfj/sherpa-onnx-nemo-canary-180m-flash-en-es-de-fr-int8": _get_nemo_ctc_models,
|
2075 |
}
|
2076 |
|
2077 |
chinese_english_mixed_models = {
|
|
|
2196 |
"Tibetan": list(tibetan_models.keys()),
|
2197 |
"Vietnamese": list(vietnamese_models.keys()),
|
2198 |
}
|
2199 |
+
|
2200 |
+
@lru_cache(maxsize=10)
def _get_nemo_ctc_models(repo_id: str, decoding_method: str, num_active_paths: int):
    """Build an offline recognizer for a NeMo Canary repo, forced to Spanish.

    Despite the historical name, the repo this loader is registered for
    (``csukuangfj/sherpa-onnx-nemo-canary-180m-flash-en-es-de-fr-int8``) is a
    Canary encoder/decoder model, not a CTC model, so it is loaded with
    ``OfflineRecognizer.from_nemo_canary`` instead of ``from_nemo_ctc``.
    ``from_nemo_ctc`` has no ``language`` keyword; the language is selected
    through ``src_lang`` / ``tgt_lang`` on the Canary factory.

    Args:
        repo_id: Hugging Face repository that hosts the model files.
        decoding_method: Unused by this loader; kept so the signature matches
            the other model factories (it still takes part in the
            ``lru_cache`` key).
        num_active_paths: Unused by this loader; kept for the same reason.

    Returns:
        A ``sherpa_onnx.OfflineRecognizer`` configured for Spanish input and
        Spanish output.
    """
    # NOTE(review): file names follow the published layout of the Canary
    # int8 repo (encoder.int8.onnx / decoder.int8.onnx / tokens.txt) --
    # confirm against the repo before merging.
    encoder = _get_nn_model_filename(
        repo_id=repo_id,
        filename="encoder.int8.onnx",
        subfolder=".",
    )
    decoder = _get_nn_model_filename(
        repo_id=repo_id,
        filename="decoder.int8.onnx",
        subfolder=".",
    )
    tokens = _get_token_filename(
        repo_id=repo_id,
        filename="tokens.txt",
        subfolder=".",
    )

    # Same source and target language means plain transcription (no
    # translation); "es" keeps the original intent of forcing Spanish.
    recognizer = sherpa_onnx.OfflineRecognizer.from_nemo_canary(
        encoder=encoder,
        decoder=decoder,
        tokens=tokens,
        src_lang="es",
        tgt_lang="es",
        num_threads=2,
    )
    return recognizer
|