Commit
·
fe86211
1
Parent(s):
2a1e9c0
add a russian model
Browse files
- model.py +26 -0
- requirements.txt +1 -1
model.py
CHANGED
@@ -536,6 +536,31 @@ def _get_russian_pre_trained_model_ctc(
|
|
536 |
return recognizer
|
537 |
|
538 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
539 |
@lru_cache(maxsize=10)
|
540 |
def _get_russian_pre_trained_model(
|
541 |
repo_id: str, decoding_method: str, num_active_paths: int
|
@@ -2206,6 +2231,7 @@ russian_models = {
|
|
2206 |
"csukuangfj/sherpa-onnx-nemo-ctc-giga-am-v2-russian-2025-04-19": _get_russian_pre_trained_model_ctc,
|
2207 |
"csukuangfj/sherpa-onnx-nemo-transducer-giga-am-russian-2024-10-24": _get_russian_pre_trained_model,
|
2208 |
"csukuangfj/sherpa-onnx-nemo-ctc-giga-am-russian-2024-10-24": _get_russian_pre_trained_model_ctc,
|
|
|
2209 |
"alphacep/vosk-model-ru": _get_russian_pre_trained_model,
|
2210 |
"alphacep/vosk-model-small-ru": _get_russian_pre_trained_model,
|
2211 |
"csukuangfj/sherpa-onnx-streaming-zipformer-small-ru-vosk-int8-2025-08-16": _get_streaming_vosk_pre_trained_model,
|
|
|
536 |
return recognizer
|
537 |
|
538 |
|
539 |
+
@lru_cache(maxsize=10)
def _get_sherpa_onnx_t_one_streaming_ctc(
    repo_id: str, decoding_method: str, num_active_paths: int
) -> sherpa_onnx.OnlineRecognizer:
    """Create the streaming T-one CTC recognizer for a supported repo.

    The parameter list mirrors the other Russian model loaders so this
    function can be stored in the same repo-id -> loader mapping.  Calls
    are memoized by ``lru_cache`` (up to 10 distinct argument tuples).

    Args:
      repo_id:
        Hugging Face repository id. Must be one of the ids accepted by
        the assertion below.
      decoding_method:
        Not used in this function body; it still takes part in the
        cache key.
      num_active_paths:
        Not used in this function body; it still takes part in the
        cache key.

    Returns:
      The object returned by ``sherpa_onnx.OnlineRecognizer.from_t_one_ctc``.

    Raises:
      AssertionError: If ``repo_id`` is not a supported repository.
    """
    supported_repo_ids = (
        "csukuangfj/sherpa-onnx-streaming-t-one-russian-2025-09-08",
    )
    assert repo_id in supported_repo_ids, repo_id

    # Both files are looked up at the top level (".") of the repository.
    model_path = _get_nn_model_filename(
        repo_id=repo_id, filename="model.onnx", subfolder="."
    )
    tokens_path = _get_token_filename(repo_id=repo_id, subfolder=".")

    return sherpa_onnx.OnlineRecognizer.from_t_one_ctc(
        model=model_path,
        tokens=tokens_path,
        num_threads=2,
    )
|
562 |
+
|
563 |
+
|
564 |
@lru_cache(maxsize=10)
|
565 |
def _get_russian_pre_trained_model(
|
566 |
repo_id: str, decoding_method: str, num_active_paths: int
|
|
|
2231 |
"csukuangfj/sherpa-onnx-nemo-ctc-giga-am-v2-russian-2025-04-19": _get_russian_pre_trained_model_ctc,
|
2232 |
"csukuangfj/sherpa-onnx-nemo-transducer-giga-am-russian-2024-10-24": _get_russian_pre_trained_model,
|
2233 |
"csukuangfj/sherpa-onnx-nemo-ctc-giga-am-russian-2024-10-24": _get_russian_pre_trained_model_ctc,
|
2234 |
+
"csukuangfj/sherpa-onnx-streaming-t-one-russian-2025-09-08": _get_sherpa_onnx_t_one_streaming_ctc,
|
2235 |
"alphacep/vosk-model-ru": _get_russian_pre_trained_model,
|
2236 |
"alphacep/vosk-model-small-ru": _get_russian_pre_trained_model,
|
2237 |
"csukuangfj/sherpa-onnx-streaming-zipformer-small-ru-vosk-int8-2025-08-16": _get_streaming_vosk_pre_trained_model,
|
requirements.txt
CHANGED
@@ -10,6 +10,6 @@ numpy<2
|
|
10 |
|
11 |
huggingface_hub
|
12 |
|
13 |
-
https://huggingface.co/csukuangfj/sherpa-onnx-wheels/resolve/main/cpu/1.12.
|
14 |
|
15 |
#sherpa-onnx>=1.12.6
|
|
|
10 |
|
11 |
huggingface_hub
|
12 |
|
13 |
+
https://huggingface.co/csukuangfj/sherpa-onnx-wheels/resolve/main/cpu/1.12.11/sherpa_onnx-1.12.11-cp310-cp310-manylinux2014_x86_64.manylinux_2_17_x86_64.whl
|
14 |
|
15 |
#sherpa-onnx>=1.12.6
|