csukuangfj committed on
Commit
7d508be
·
1 Parent(s): 7d43f04

Add Brazilian Portuguese ASR models

Browse files
Files changed (1) hide show
  1. model.py +28 -10
model.py CHANGED
@@ -1370,13 +1370,22 @@ def _get_sherpa_onnx_nemo_ctc_models(
1370
  ) -> sherpa_onnx.OfflineRecognizer:
1371
  assert repo_id in [
1372
  "csukuangfj/sherpa-onnx-nemo-parakeet_tdt_ctc_110m-en-36000",
 
 
1373
  ], repo_id
1374
 
1375
- model = _get_nn_model_filename(
1376
- repo_id=repo_id,
1377
- filename="model.onnx",
1378
- subfolder=".",
1379
- )
 
 
 
 
 
 
 
1380
 
1381
  tokens = _get_token_filename(repo_id=repo_id, subfolder=".")
1382
 
@@ -1946,6 +1955,8 @@ chinese_models = {
1946
  # "csukuangfj/sherpa-onnx-streaming-zipformer-ctc-zh-fp16-2025-06-30": _get_streaming_zipformer_ctc_pre_trained_model,
1947
  "csukuangfj/sherpa-onnx-streaming-zipformer-ctc-zh-xlarge-int8-2025-06-30": _get_streaming_zipformer_ctc_pre_trained_model,
1948
  # "csukuangfj/sherpa-onnx-streaming-zipformer-ctc-zh-xlarge-fp16-2025-06-30": _get_streaming_zipformer_ctc_pre_trained_model,
 
 
1949
  "csukuangfj/sherpa-onnx-paraformer-zh-2024-03-09": _get_paraformer_pre_trained_model,
1950
  "luomingshuang/icefall_asr_wenetspeech_pruned_transducer_stateless2": _get_wenetspeech_pre_trained_model, # noqa
1951
  "csukuangfj/sherpa-onnx-paraformer-zh-small-2024-03-09": _get_paraformer_pre_trained_model,
@@ -2072,6 +2083,11 @@ vietnamese_models = {
2072
  "csukuangfj/sherpa-onnx-zipformer-vi-2025-04-20": _get_vietnamese_pretrained_model,
2073
  }
2074
 
 
 
 
 
 
2075
 
2076
  all_models = {
2077
  **multi_lingual_models,
@@ -2090,6 +2106,7 @@ all_models = {
2090
  **korean_models,
2091
  **thai_models,
2092
  **vietnamese_models,
 
2093
  }
2094
 
2095
  language_to_models = {
@@ -2102,14 +2119,15 @@ language_to_models = {
2102
  "Chinese+English+Cantonese+Japanese+Korean": list(
2103
  chinese_cantonese_english_japanese_korean_models.keys()
2104
  ),
2105
- "Cantonese": list(cantonese_models.keys()),
2106
- "Japanese": list(japanese_models.keys()),
2107
- "Tibetan": list(tibetan_models.keys()),
2108
  "Arabic": list(arabic_models.keys()),
2109
- "German": list(german_models.keys()),
2110
  "French": list(french_models.keys()),
2111
- "Russian": list(russian_models.keys()),
 
2112
  "Korean": list(korean_models.keys()),
 
 
2113
  "Thai": list(thai_models.keys()),
 
2114
  "Vietnamese": list(vietnamese_models.keys()),
2115
  }
 
1370
  ) -> sherpa_onnx.OfflineRecognizer:
1371
  assert repo_id in [
1372
  "csukuangfj/sherpa-onnx-nemo-parakeet_tdt_ctc_110m-en-36000",
1373
+ "csukuangfj/sherpa-onnx-nemo-stt_pt_fastconformer_hybrid_large_pc",
1374
+ "csukuangfj/sherpa-onnx-nemo-stt_pt_fastconformer_hybrid_large_pc-int8",
1375
  ], repo_id
1376
 
1377
+ if "int8" in repo_id:
1378
+ model = _get_nn_model_filename(
1379
+ repo_id=repo_id,
1380
+ filename="model.onnx",
1381
+ subfolder=".",
1382
+ )
1383
+ else:
1384
+ model = _get_nn_model_filename(
1385
+ repo_id=repo_id,
1386
+ filename="model.int8.onnx",
1387
+ subfolder=".",
1388
+ )
1389
 
1390
  tokens = _get_token_filename(repo_id=repo_id, subfolder=".")
1391
 
 
1955
  # "csukuangfj/sherpa-onnx-streaming-zipformer-ctc-zh-fp16-2025-06-30": _get_streaming_zipformer_ctc_pre_trained_model,
1956
  "csukuangfj/sherpa-onnx-streaming-zipformer-ctc-zh-xlarge-int8-2025-06-30": _get_streaming_zipformer_ctc_pre_trained_model,
1957
  # "csukuangfj/sherpa-onnx-streaming-zipformer-ctc-zh-xlarge-fp16-2025-06-30": _get_streaming_zipformer_ctc_pre_trained_model,
1958
+ "csukuangfj/sherpa-onnx-zipformer-ctc-zh-int8-2025-07-03": _get_non_streaming_zipformer_ctc_pre_trained_model,
1959
+ "csukuangfj/sherpa-onnx-zipformer-ctc-zh-2025-07-03": _get_non_streaming_zipformer_ctc_pre_trained_model,
1960
  "csukuangfj/sherpa-onnx-paraformer-zh-2024-03-09": _get_paraformer_pre_trained_model,
1961
  "luomingshuang/icefall_asr_wenetspeech_pruned_transducer_stateless2": _get_wenetspeech_pre_trained_model, # noqa
1962
  "csukuangfj/sherpa-onnx-paraformer-zh-small-2024-03-09": _get_paraformer_pre_trained_model,
 
2083
  "csukuangfj/sherpa-onnx-zipformer-vi-2025-04-20": _get_vietnamese_pretrained_model,
2084
  }
2085
 
2086
+ portuguese_brazlian_models = {
2087
+ "csukuangfj/sherpa-onnx-nemo-stt_pt_fastconformer_hybrid_large_pc": _get_sherpa_onnx_nemo_ctc_models,
2088
+ "csukuangfj/sherpa-onnx-nemo-stt_pt_fastconformer_hybrid_large_pc-int8": _get_sherpa_onnx_nemo_ctc_models,
2089
+ }
2090
+
2091
 
2092
  all_models = {
2093
  **multi_lingual_models,
 
2106
  **korean_models,
2107
  **thai_models,
2108
  **vietnamese_models,
2109
+ **portuguese_brazlian_models,
2110
  }
2111
 
2112
  language_to_models = {
 
2119
  "Chinese+English+Cantonese+Japanese+Korean": list(
2120
  chinese_cantonese_english_japanese_korean_models.keys()
2121
  ),
 
 
 
2122
  "Arabic": list(arabic_models.keys()),
2123
+ "Cantonese": list(cantonese_models.keys()),
2124
  "French": list(french_models.keys()),
2125
+ "German": list(german_models.keys()),
2126
+ "Japanese": list(japanese_models.keys()),
2127
  "Korean": list(korean_models.keys()),
2128
+ "Portuguese (Brazilian)": list(portuguese_brazlian_models.keys()),
2129
+ "Russian": list(russian_models.keys()),
2130
  "Thai": list(thai_models.keys()),
2131
+ "Tibetan": list(tibetan_models.keys()),
2132
  "Vietnamese": list(vietnamese_models.keys()),
2133
  }