csukuangfj committed on
Commit
fe86211
·
1 Parent(s): 2a1e9c0

add a Russian model

Browse files
Files changed (2) hide show
  1. model.py +26 -0
  2. requirements.txt +1 -1
model.py CHANGED
@@ -536,6 +536,31 @@ def _get_russian_pre_trained_model_ctc(
536
  return recognizer
537
 
538
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
539
  @lru_cache(maxsize=10)
540
  def _get_russian_pre_trained_model(
541
  repo_id: str, decoding_method: str, num_active_paths: int
@@ -2206,6 +2231,7 @@ russian_models = {
2206
  "csukuangfj/sherpa-onnx-nemo-ctc-giga-am-v2-russian-2025-04-19": _get_russian_pre_trained_model_ctc,
2207
  "csukuangfj/sherpa-onnx-nemo-transducer-giga-am-russian-2024-10-24": _get_russian_pre_trained_model,
2208
  "csukuangfj/sherpa-onnx-nemo-ctc-giga-am-russian-2024-10-24": _get_russian_pre_trained_model_ctc,
 
2209
  "alphacep/vosk-model-ru": _get_russian_pre_trained_model,
2210
  "alphacep/vosk-model-small-ru": _get_russian_pre_trained_model,
2211
  "csukuangfj/sherpa-onnx-streaming-zipformer-small-ru-vosk-int8-2025-08-16": _get_streaming_vosk_pre_trained_model,
 
536
  return recognizer
537
 
538
 
539
@lru_cache(maxsize=10)
def _get_sherpa_onnx_t_one_streaming_ctc(
    repo_id: str, decoding_method: str, num_active_paths: int
) -> sherpa_onnx.OnlineRecognizer:
    """Create the streaming T-one CTC recognizer for ``repo_id``.

    Args:
      repo_id:
        Model repository to load. Must be one of the repositories
        supported by this loader; anything else fails the assertion.
      decoding_method:
        Not used when building the recognizer. It still takes part in the
        ``lru_cache`` key. Presumably kept so that this loader shares the
        call signature of the other model getters -- confirm with callers.
      num_active_paths:
        Not used when building the recognizer; same remarks as for
        ``decoding_method``.

    Returns:
      The ``sherpa_onnx.OnlineRecognizer`` built by ``from_t_one_ctc``.

    Raises:
      AssertionError: If ``repo_id`` is not a supported repository.
    """
    supported_repo_ids = (
        "csukuangfj/sherpa-onnx-streaming-t-one-russian-2025-09-08",
    )
    assert repo_id in supported_repo_ids, repo_id

    # Resolve the model first, then the tokens, both from the repository root.
    model_path = _get_nn_model_filename(
        repo_id=repo_id, filename="model.onnx", subfolder="."
    )
    tokens_path = _get_token_filename(repo_id=repo_id, subfolder=".")

    return sherpa_onnx.OnlineRecognizer.from_t_one_ctc(
        model=model_path,
        tokens=tokens_path,
        num_threads=2,
    )
562
+
563
+
564
  @lru_cache(maxsize=10)
565
  def _get_russian_pre_trained_model(
566
  repo_id: str, decoding_method: str, num_active_paths: int
 
2231
  "csukuangfj/sherpa-onnx-nemo-ctc-giga-am-v2-russian-2025-04-19": _get_russian_pre_trained_model_ctc,
2232
  "csukuangfj/sherpa-onnx-nemo-transducer-giga-am-russian-2024-10-24": _get_russian_pre_trained_model,
2233
  "csukuangfj/sherpa-onnx-nemo-ctc-giga-am-russian-2024-10-24": _get_russian_pre_trained_model_ctc,
2234
+ "csukuangfj/sherpa-onnx-streaming-t-one-russian-2025-09-08": _get_sherpa_onnx_t_one_streaming_ctc,
2235
  "alphacep/vosk-model-ru": _get_russian_pre_trained_model,
2236
  "alphacep/vosk-model-small-ru": _get_russian_pre_trained_model,
2237
  "csukuangfj/sherpa-onnx-streaming-zipformer-small-ru-vosk-int8-2025-08-16": _get_streaming_vosk_pre_trained_model,
requirements.txt CHANGED
@@ -10,6 +10,6 @@ numpy<2
10
 
11
  huggingface_hub
12
 
13
- https://huggingface.co/csukuangfj/sherpa-onnx-wheels/resolve/main/cpu/1.12.9/sherpa_onnx-1.12.9-cp310-cp310-manylinux2014_x86_64.manylinux_2_17_x86_64.whl
14
 
15
  #sherpa-onnx>=1.12.6
 
10
 
11
  huggingface_hub
12
 
13
+ https://huggingface.co/csukuangfj/sherpa-onnx-wheels/resolve/main/cpu/1.12.11/sherpa_onnx-1.12.11-cp310-cp310-manylinux2014_x86_64.manylinux_2_17_x86_64.whl
14
 
15
  #sherpa-onnx>=1.12.6