Commit
·
fe86211
1
Parent(s):
2a1e9c0
Add a Russian model
Browse files
- model.py +26 -0
- requirements.txt +1 -1
model.py
CHANGED
|
@@ -536,6 +536,31 @@ def _get_russian_pre_trained_model_ctc(
|
|
| 536 |
return recognizer
|
| 537 |
|
| 538 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 539 |
@lru_cache(maxsize=10)
|
| 540 |
def _get_russian_pre_trained_model(
|
| 541 |
repo_id: str, decoding_method: str, num_active_paths: int
|
|
@@ -2206,6 +2231,7 @@ russian_models = {
|
|
| 2206 |
"csukuangfj/sherpa-onnx-nemo-ctc-giga-am-v2-russian-2025-04-19": _get_russian_pre_trained_model_ctc,
|
| 2207 |
"csukuangfj/sherpa-onnx-nemo-transducer-giga-am-russian-2024-10-24": _get_russian_pre_trained_model,
|
| 2208 |
"csukuangfj/sherpa-onnx-nemo-ctc-giga-am-russian-2024-10-24": _get_russian_pre_trained_model_ctc,
|
|
|
|
| 2209 |
"alphacep/vosk-model-ru": _get_russian_pre_trained_model,
|
| 2210 |
"alphacep/vosk-model-small-ru": _get_russian_pre_trained_model,
|
| 2211 |
"csukuangfj/sherpa-onnx-streaming-zipformer-small-ru-vosk-int8-2025-08-16": _get_streaming_vosk_pre_trained_model,
|
|
|
|
| 536 |
return recognizer
|
| 537 |
|
| 538 |
|
| 539 |
+
@lru_cache(maxsize=10)
def _get_sherpa_onnx_t_one_streaming_ctc(
    repo_id: str, decoding_method: str, num_active_paths: int
) -> sherpa_onnx.OnlineRecognizer:
    """Create the streaming T-one CTC recognizer for a supported repo.

    Results are memoized by ``lru_cache`` (up to 10 distinct argument
    combinations), so repeated calls with the same arguments reuse the
    recognizer that was built the first time.

    Args:
      repo_id:
        Identifier of the model repo. Only
        ``csukuangfj/sherpa-onnx-streaming-t-one-russian-2025-09-08`` is
        accepted.
      decoding_method:
        Not used by this loader. NOTE(review): presumably kept so that the
        signature matches the other loaders registered in the model
        tables -- confirm against the caller.
      num_active_paths:
        Not used by this loader (same note as ``decoding_method``).

    Returns:
      The object returned by ``sherpa_onnx.OnlineRecognizer.from_t_one_ctc``.

    Raises:
      AssertionError: If ``repo_id`` is not one of the supported repos.
    """
    supported_repo_ids = (
        "csukuangfj/sherpa-onnx-streaming-t-one-russian-2025-09-08",
    )
    assert repo_id in supported_repo_ids, repo_id

    # Resolve the model file first and the tokens file second.
    model_path = _get_nn_model_filename(
        repo_id=repo_id,
        filename="model.onnx",
        subfolder=".",
    )
    tokens_path = _get_token_filename(repo_id=repo_id, subfolder=".")

    return sherpa_onnx.OnlineRecognizer.from_t_one_ctc(
        model=model_path,
        tokens=tokens_path,
        num_threads=2,
    )
|
| 562 |
+
|
| 563 |
+
|
| 564 |
@lru_cache(maxsize=10)
|
| 565 |
def _get_russian_pre_trained_model(
|
| 566 |
repo_id: str, decoding_method: str, num_active_paths: int
|
|
|
|
| 2231 |
"csukuangfj/sherpa-onnx-nemo-ctc-giga-am-v2-russian-2025-04-19": _get_russian_pre_trained_model_ctc,
|
| 2232 |
"csukuangfj/sherpa-onnx-nemo-transducer-giga-am-russian-2024-10-24": _get_russian_pre_trained_model,
|
| 2233 |
"csukuangfj/sherpa-onnx-nemo-ctc-giga-am-russian-2024-10-24": _get_russian_pre_trained_model_ctc,
|
| 2234 |
+
"csukuangfj/sherpa-onnx-streaming-t-one-russian-2025-09-08": _get_sherpa_onnx_t_one_streaming_ctc,
|
| 2235 |
"alphacep/vosk-model-ru": _get_russian_pre_trained_model,
|
| 2236 |
"alphacep/vosk-model-small-ru": _get_russian_pre_trained_model,
|
| 2237 |
"csukuangfj/sherpa-onnx-streaming-zipformer-small-ru-vosk-int8-2025-08-16": _get_streaming_vosk_pre_trained_model,
|
requirements.txt
CHANGED
|
@@ -10,6 +10,6 @@ numpy<2
|
|
| 10 |
|
| 11 |
huggingface_hub
|
| 12 |
|
| 13 |
-
https://huggingface.co/csukuangfj/sherpa-onnx-wheels/resolve/main/cpu/1.12.
|
| 14 |
|
| 15 |
#sherpa-onnx>=1.12.6
|
|
|
|
| 10 |
|
| 11 |
huggingface_hub
|
| 12 |
|
| 13 |
+
https://huggingface.co/csukuangfj/sherpa-onnx-wheels/resolve/main/cpu/1.12.11/sherpa_onnx-1.12.11-cp310-cp310-manylinux2014_x86_64.manylinux_2_17_x86_64.whl
|
| 14 |
|
| 15 |
#sherpa-onnx>=1.12.6
|