Spaces:
Build error
Build error
Commit
·
74a5c18
1
Parent(s):
4e478c6
update models
Browse files
model.py
CHANGED
|
@@ -956,6 +956,61 @@ def _get_paraformer_zh_pre_trained_model(
|
|
| 956 |
return recognizer
|
| 957 |
|
| 958 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 959 |
def _get_multi_zh_hans_pre_trained_model(
|
| 960 |
repo_id: str,
|
| 961 |
decoding_method: str,
|
|
@@ -1002,6 +1057,7 @@ chinese_models = {
|
|
| 1002 |
"csukuangfj/sherpa-onnx-paraformer-zh-2023-03-28": _get_paraformer_zh_pre_trained_model,
|
| 1003 |
"luomingshuang/icefall_asr_wenetspeech_pruned_transducer_stateless2": _get_wenetspeech_pre_trained_model, # noqa
|
| 1004 |
"zrjin/sherpa-onnx-zipformer-multi-zh-hans-2023-9-2": _get_multi_zh_hans_pre_trained_model, # noqa
|
|
|
|
| 1005 |
"desh2608/icefall-asr-alimeeting-pruned-transducer-stateless7": _get_alimeeting_pre_trained_model,
|
| 1006 |
"yuekai/icefall-asr-aishell2-pruned-transducer-stateless5-A-2022-07-12": _get_aishell2_pretrained_model, # noqa
|
| 1007 |
"yuekai/icefall-asr-aishell2-pruned-transducer-stateless5-B-2022-07-12": _get_aishell2_pretrained_model, # noqa
|
|
|
|
| 956 |
return recognizer
|
| 957 |
|
| 958 |
|
| 959 |
+
def _get_aishell_pre_trained_model(
    repo_id: str,
    decoding_method: str,
    num_active_paths: int,
) -> sherpa_onnx.OfflineRecognizer:
    """Create an offline transducer recognizer for an AISHELL zipformer repo.

    Args:
      repo_id:
        One of the ``zrjin/icefall-asr-aishell-zipformer-*`` repos listed in
        ``checkpoints`` below.
      decoding_method:
        Passed through unchanged as ``decoding_method``.
      num_active_paths:
        Passed through as ``max_active_paths``.

    Returns:
      The object returned by
      ``sherpa_onnx.OfflineRecognizer.from_transducer``.

    Raises:
      AssertionError: If ``repo_id`` is not one of the supported repos. The
        offending ``repo_id`` is the exception argument.
    """
    # Single source of truth for the supported repos: maps each repo to the
    # (epoch, avg) pair that appears in its exported ONNX file names.
    checkpoints = {
        "zrjin/icefall-asr-aishell-zipformer-large-2023-10-24": (56, 23),
        "zrjin/icefall-asr-aishell-zipformer-small-2023-10-24": (55, 21),
        "zrjin/icefall-asr-aishell-zipformer-2023-10-24": (55, 17),
    }

    # Raise explicitly instead of using an ``assert`` statement so the check
    # still runs under ``python -O``. AssertionError is kept so callers see
    # the same exception type as before.
    if repo_id not in checkpoints:
        raise AssertionError(repo_id)

    epoch, avg = checkpoints[repo_id]

    # The three transducer components share one naming scheme and live in the
    # "exp" subfolder; they are resolved in encoder, decoder, joiner order.
    models = {
        part: _get_nn_model_filename(
            repo_id=repo_id,
            filename=f"{part}-epoch-{epoch}-avg-{avg}.onnx",
            subfolder="exp",
        )
        for part in ("encoder", "decoder", "joiner")
    }

    tokens = _get_token_filename(repo_id=repo_id, subfolder="data/lang_char")

    recognizer = sherpa_onnx.OfflineRecognizer.from_transducer(
        tokens=tokens,
        encoder=models["encoder"],
        decoder=models["decoder"],
        joiner=models["joiner"],
        num_threads=2,
        sample_rate=16000,
        feature_dim=80,
        decoding_method=decoding_method,
        max_active_paths=num_active_paths,
    )

    return recognizer
|
| 1012 |
+
|
| 1013 |
+
|
| 1014 |
def _get_multi_zh_hans_pre_trained_model(
|
| 1015 |
repo_id: str,
|
| 1016 |
decoding_method: str,
|
|
|
|
| 1057 |
"csukuangfj/sherpa-onnx-paraformer-zh-2023-03-28": _get_paraformer_zh_pre_trained_model,
|
| 1058 |
"luomingshuang/icefall_asr_wenetspeech_pruned_transducer_stateless2": _get_wenetspeech_pre_trained_model, # noqa
|
| 1059 |
"zrjin/sherpa-onnx-zipformer-multi-zh-hans-2023-9-2": _get_multi_zh_hans_pre_trained_model, # noqa
|
| 1060 |
+
"zrjin/icefall-asr-aishell-zipformer-large-2023-10-24": _get_aishell_pre_trained_model, # noqa
|
| 1061 |
"desh2608/icefall-asr-alimeeting-pruned-transducer-stateless7": _get_alimeeting_pre_trained_model,
|
| 1062 |
"yuekai/icefall-asr-aishell2-pruned-transducer-stateless5-A-2022-07-12": _get_aishell2_pretrained_model, # noqa
|
| 1063 |
"yuekai/icefall-asr-aishell2-pruned-transducer-stateless5-B-2022-07-12": _get_aishell2_pretrained_model, # noqa
|