Commit
·
7d508be
1
Parent(s):
7d43f04
Add Brazilian Portuguese ASR models
Browse files
model.py
CHANGED
@@ -1370,13 +1370,22 @@ def _get_sherpa_onnx_nemo_ctc_models(
|
|
1370 |
) -> sherpa_onnx.OfflineRecognizer:
|
1371 |
assert repo_id in [
|
1372 |
"csukuangfj/sherpa-onnx-nemo-parakeet_tdt_ctc_110m-en-36000",
|
|
|
|
|
1373 |
], repo_id
|
1374 |
|
1375 |
-
|
1376 |
-
|
1377 |
-
|
1378 |
-
|
1379 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1380 |
|
1381 |
tokens = _get_token_filename(repo_id=repo_id, subfolder=".")
|
1382 |
|
@@ -1946,6 +1955,8 @@ chinese_models = {
|
|
1946 |
# "csukuangfj/sherpa-onnx-streaming-zipformer-ctc-zh-fp16-2025-06-30": _get_streaming_zipformer_ctc_pre_trained_model,
|
1947 |
"csukuangfj/sherpa-onnx-streaming-zipformer-ctc-zh-xlarge-int8-2025-06-30": _get_streaming_zipformer_ctc_pre_trained_model,
|
1948 |
# "csukuangfj/sherpa-onnx-streaming-zipformer-ctc-zh-xlarge-fp16-2025-06-30": _get_streaming_zipformer_ctc_pre_trained_model,
|
|
|
|
|
1949 |
"csukuangfj/sherpa-onnx-paraformer-zh-2024-03-09": _get_paraformer_pre_trained_model,
|
1950 |
"luomingshuang/icefall_asr_wenetspeech_pruned_transducer_stateless2": _get_wenetspeech_pre_trained_model, # noqa
|
1951 |
"csukuangfj/sherpa-onnx-paraformer-zh-small-2024-03-09": _get_paraformer_pre_trained_model,
|
@@ -2072,6 +2083,11 @@ vietnamese_models = {
|
|
2072 |
"csukuangfj/sherpa-onnx-zipformer-vi-2025-04-20": _get_vietnamese_pretrained_model,
|
2073 |
}
|
2074 |
|
|
|
|
|
|
|
|
|
|
|
2075 |
|
2076 |
all_models = {
|
2077 |
**multi_lingual_models,
|
@@ -2090,6 +2106,7 @@ all_models = {
|
|
2090 |
**korean_models,
|
2091 |
**thai_models,
|
2092 |
**vietnamese_models,
|
|
|
2093 |
}
|
2094 |
|
2095 |
language_to_models = {
|
@@ -2102,14 +2119,15 @@ language_to_models = {
|
|
2102 |
"Chinese+English+Cantonese+Japanese+Korean": list(
|
2103 |
chinese_cantonese_english_japanese_korean_models.keys()
|
2104 |
),
|
2105 |
-
"Cantonese": list(cantonese_models.keys()),
|
2106 |
-
"Japanese": list(japanese_models.keys()),
|
2107 |
-
"Tibetan": list(tibetan_models.keys()),
|
2108 |
"Arabic": list(arabic_models.keys()),
|
2109 |
-
"German": list(german_models.keys()),
|
2110 |
"French": list(french_models.keys()),
|
2111 |
-
"Russian": list(russian_models.keys()),
|
|
|
2112 |
"Korean": list(korean_models.keys()),
|
|
|
|
|
2113 |
"Thai": list(thai_models.keys()),
|
|
|
2114 |
"Vietnamese": list(vietnamese_models.keys()),
|
2115 |
}
|
|
|
1370 |
) -> sherpa_onnx.OfflineRecognizer:
|
1371 |
assert repo_id in [
|
1372 |
"csukuangfj/sherpa-onnx-nemo-parakeet_tdt_ctc_110m-en-36000",
|
1373 |
+
"csukuangfj/sherpa-onnx-nemo-stt_pt_fastconformer_hybrid_large_pc",
|
1374 |
+
"csukuangfj/sherpa-onnx-nemo-stt_pt_fastconformer_hybrid_large_pc-int8",
|
1375 |
], repo_id
|
1376 |
|
1377 |
+
if "int8" in repo_id:
|
1378 |
+
model = _get_nn_model_filename(
|
1379 |
+
repo_id=repo_id,
|
1380 |
+
filename="model.onnx",
|
1381 |
+
subfolder=".",
|
1382 |
+
)
|
1383 |
+
else:
|
1384 |
+
model = _get_nn_model_filename(
|
1385 |
+
repo_id=repo_id,
|
1386 |
+
filename="model.int8.onnx",
|
1387 |
+
subfolder=".",
|
1388 |
+
)
|
1389 |
|
1390 |
tokens = _get_token_filename(repo_id=repo_id, subfolder=".")
|
1391 |
|
|
|
1955 |
# "csukuangfj/sherpa-onnx-streaming-zipformer-ctc-zh-fp16-2025-06-30": _get_streaming_zipformer_ctc_pre_trained_model,
|
1956 |
"csukuangfj/sherpa-onnx-streaming-zipformer-ctc-zh-xlarge-int8-2025-06-30": _get_streaming_zipformer_ctc_pre_trained_model,
|
1957 |
# "csukuangfj/sherpa-onnx-streaming-zipformer-ctc-zh-xlarge-fp16-2025-06-30": _get_streaming_zipformer_ctc_pre_trained_model,
|
1958 |
+
"csukuangfj/sherpa-onnx-zipformer-ctc-zh-int8-2025-07-03": _get_non_streaming_zipformer_ctc_pre_trained_model,
|
1959 |
+
"csukuangfj/sherpa-onnx-zipformer-ctc-zh-2025-07-03": _get_non_streaming_zipformer_ctc_pre_trained_model,
|
1960 |
"csukuangfj/sherpa-onnx-paraformer-zh-2024-03-09": _get_paraformer_pre_trained_model,
|
1961 |
"luomingshuang/icefall_asr_wenetspeech_pruned_transducer_stateless2": _get_wenetspeech_pre_trained_model, # noqa
|
1962 |
"csukuangfj/sherpa-onnx-paraformer-zh-small-2024-03-09": _get_paraformer_pre_trained_model,
|
|
|
2083 |
"csukuangfj/sherpa-onnx-zipformer-vi-2025-04-20": _get_vietnamese_pretrained_model,
|
2084 |
}
|
2085 |
|
2086 |
+
portuguese_brazlian_models = {
|
2087 |
+
"csukuangfj/sherpa-onnx-nemo-stt_pt_fastconformer_hybrid_large_pc": _get_sherpa_onnx_nemo_ctc_models,
|
2088 |
+
"csukuangfj/sherpa-onnx-nemo-stt_pt_fastconformer_hybrid_large_pc-int8": _get_sherpa_onnx_nemo_ctc_models,
|
2089 |
+
}
|
2090 |
+
|
2091 |
|
2092 |
all_models = {
|
2093 |
**multi_lingual_models,
|
|
|
2106 |
**korean_models,
|
2107 |
**thai_models,
|
2108 |
**vietnamese_models,
|
2109 |
+
**portuguese_brazlian_models,
|
2110 |
}
|
2111 |
|
2112 |
language_to_models = {
|
|
|
2119 |
"Chinese+English+Cantonese+Japanese+Korean": list(
|
2120 |
chinese_cantonese_english_japanese_korean_models.keys()
|
2121 |
),
|
|
|
|
|
|
|
2122 |
"Arabic": list(arabic_models.keys()),
|
2123 |
+
"Cantonese": list(cantonese_models.keys()),
|
2124 |
"French": list(french_models.keys()),
|
2125 |
+
"German": list(german_models.keys()),
|
2126 |
+
"Japanese": list(japanese_models.keys()),
|
2127 |
"Korean": list(korean_models.keys()),
|
2128 |
+
"Portuguese (Brazilian)": list(portuguese_brazlian_models.keys()),
|
2129 |
+
"Russian": list(russian_models.keys()),
|
2130 |
"Thai": list(thai_models.keys()),
|
2131 |
+
"Tibetan": list(tibetan_models.keys()),
|
2132 |
"Vietnamese": list(vietnamese_models.keys()),
|
2133 |
}
|