Update model.py
Browse files
model.py
CHANGED
|
@@ -2071,6 +2071,7 @@ multi_lingual_models = {
|
|
| 2071 |
"csukuangfj/sherpa-onnx-dolphin-base-ctc-multi-lang-2025-04-02": _get_dolphin_ctc_models,
|
| 2072 |
"csukuangfj/sherpa-onnx-dolphin-small-ctc-multi-lang-2025-04-02": _get_dolphin_ctc_models,
|
| 2073 |
"csukuangfj/sherpa-onnx-nemo-canary-180m-flash-en-es-de-fr-int8": _get_dolphin_ctc_models
|
|
|
|
| 2074 |
}
|
| 2075 |
|
| 2076 |
chinese_english_mixed_models = {
|
|
@@ -2195,3 +2196,23 @@ language_to_models = {
|
|
| 2195 |
"Tibetan": list(tibetan_models.keys()),
|
| 2196 |
"Vietnamese": list(vietnamese_models.keys()),
|
| 2197 |
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 2071 |
"csukuangfj/sherpa-onnx-dolphin-base-ctc-multi-lang-2025-04-02": _get_dolphin_ctc_models,
|
| 2072 |
"csukuangfj/sherpa-onnx-dolphin-small-ctc-multi-lang-2025-04-02": _get_dolphin_ctc_models,
|
| 2073 |
"csukuangfj/sherpa-onnx-nemo-canary-180m-flash-en-es-de-fr-int8": _get_dolphin_ctc_models
|
| 2074 |
+
"csukuangfj/sherpa-onnx-nemo-canary-180m-flash-en-es-de-fr-int8": _get_nemo_ctc_models,
|
| 2075 |
}
|
| 2076 |
|
| 2077 |
chinese_english_mixed_models = {
|
|
|
|
| 2196 |
"Tibetan": list(tibetan_models.keys()),
|
| 2197 |
"Vietnamese": list(vietnamese_models.keys()),
|
| 2198 |
}
|
| 2199 |
+
|
| 2200 |
+
@lru_cache(maxsize=10)
def _get_nemo_ctc_models(repo_id: str, decoding_method: str, num_active_paths: int):
    """Build (and cache) an offline recognizer for a NeMo model repo.

    Args:
      repo_id:
        Model repository to fetch ``tokens.txt`` and the ONNX model file(s)
        from.
      decoding_method:
        Accepted so the signature matches the other model loaders; it is
        not forwarded to the recognizer. It still takes part in the
        ``lru_cache`` key.
      num_active_paths:
        Accepted for the same reason as ``decoding_method``; unused here.

    Returns:
      A ``sherpa_onnx.OfflineRecognizer`` running with 2 threads.

    NOTE(review): this loader is referenced by name from a model-table dict
    that appears earlier in the file than this definition. If that dict is
    evaluated at import time, this function must be defined before it,
    otherwise the import fails with ``NameError`` -- confirm the ordering.
    """
    tokens = _get_token_filename(
        repo_id=repo_id,
        filename="tokens.txt",
        subfolder=".",
    )

    if "canary" in repo_id:
        # Canary is an encoder/decoder model, not a single-file CTC model,
        # and the language is selected with src_lang/tgt_lang.
        # NOTE(review): assumes the repo ships encoder.int8.onnx and
        # decoder.int8.onnx at its top level -- confirm against the repo.
        encoder = _get_nn_model_filename(
            repo_id=repo_id,
            filename="encoder.int8.onnx",
            subfolder=".",
        )
        decoder = _get_nn_model_filename(
            repo_id=repo_id,
            filename="decoder.int8.onnx",
            subfolder=".",
        )
        return sherpa_onnx.OfflineRecognizer.from_nemo_canary(
            encoder=encoder,
            decoder=decoder,
            tokens=tokens,
            src_lang="es",  # Force Spanish input ...
            tgt_lang="es",  # ... and Spanish output (transcribe, not translate)
            num_threads=2,
        )

    nn_model = _get_nn_model_filename(
        repo_id=repo_id,
        filename="model.int8.onnx",
        subfolder=".",
    )
    # from_nemo_ctc() takes no `language` argument; passing one raises
    # TypeError, so it is deliberately not forwarded here.
    return sherpa_onnx.OfflineRecognizer.from_nemo_ctc(
        tokens=tokens,
        model=nn_model,
        num_threads=2,
    )
|