Commit
·
e618c84
1
Parent(s):
c342af5
add a new model
Browse files
model.py
CHANGED
@@ -911,9 +911,52 @@ def _get_paraformer_zh_pre_trained_model(
|
|
911 |
return recognizer
|
912 |
|
913 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
914 |
chinese_models = {
|
915 |
"csukuangfj/sherpa-onnx-paraformer-zh-2023-03-28": _get_paraformer_zh_pre_trained_model,
|
916 |
"luomingshuang/icefall_asr_wenetspeech_pruned_transducer_stateless2": _get_wenetspeech_pre_trained_model, # noqa
|
|
|
917 |
"desh2608/icefall-asr-alimeeting-pruned-transducer-stateless7": _get_alimeeting_pre_trained_model,
|
918 |
"yuekai/icefall-asr-aishell2-pruned-transducer-stateless5-A-2022-07-12": _get_aishell2_pretrained_model, # noqa
|
919 |
"yuekai/icefall-asr-aishell2-pruned-transducer-stateless5-B-2022-07-12": _get_aishell2_pretrained_model, # noqa
|
|
|
911 |
return recognizer
|
912 |
|
913 |
|
914 |
+
def _get_multi_zh_hans_pre_trained_model(
    repo_id: str,
    decoding_method: str,
    num_active_paths: int,
) -> sherpa_onnx.OfflineRecognizer:
    """Build an offline transducer recognizer for the multi-zh-hans model.

    Args:
      repo_id:
        Model repository identifier. Only
        "zrjin/sherpa-onnx-zipformer-multi-zh-hans-2023-9-2" is accepted.
      decoding_method:
        Forwarded unchanged to
        ``sherpa_onnx.OfflineRecognizer.from_transducer``.
      num_active_paths:
        Forwarded unchanged to
        ``sherpa_onnx.OfflineRecognizer.from_transducer``.

    Returns:
      The recognizer created by ``from_transducer``.

    Raises:
      AssertionError: If ``repo_id`` is not the supported repository.
    """
    supported_repos = ("zrjin/sherpa-onnx-zipformer-multi-zh-hans-2023-9-2",)
    assert repo_id in supported_repos, repo_id

    # Resolve the three network files in the fixed order
    # encoder -> decoder -> joiner; the generator is consumed left to right
    # by the unpacking, so the helper is called once per file in that order.
    encoder_path, decoder_path, joiner_path = (
        _get_nn_model_filename(
            repo_id=repo_id,
            filename=onnx_name,
            subfolder=".",
        )
        for onnx_name in (
            "encoder-epoch-20-avg-1.onnx",
            "decoder-epoch-20-avg-1.onnx",
            "joiner-epoch-20-avg-1.onnx",
        )
    )

    # The tokens file is looked up after the model files.
    token_path = _get_token_filename(repo_id=repo_id, subfolder=".")

    return sherpa_onnx.OfflineRecognizer.from_transducer(
        tokens=token_path,
        encoder=encoder_path,
        decoder=decoder_path,
        joiner=joiner_path,
        num_threads=2,
        sample_rate=16000,
        feature_dim=80,
        decoding_method=decoding_method,
        num_active_paths=num_active_paths,
    )
|
954 |
+
|
955 |
+
|
956 |
chinese_models = {
|
957 |
"csukuangfj/sherpa-onnx-paraformer-zh-2023-03-28": _get_paraformer_zh_pre_trained_model,
|
958 |
"luomingshuang/icefall_asr_wenetspeech_pruned_transducer_stateless2": _get_wenetspeech_pre_trained_model, # noqa
|
959 |
+
"zrjin/sherpa-onnx-zipformer-multi-zh-hans-2023-9-2": _get_multi_zh_hans_pre_trained_model, # noqa
|
960 |
"desh2608/icefall-asr-alimeeting-pruned-transducer-stateless7": _get_alimeeting_pre_trained_model,
|
961 |
"yuekai/icefall-asr-aishell2-pruned-transducer-stateless5-A-2022-07-12": _get_aishell2_pretrained_model, # noqa
|
962 |
"yuekai/icefall-asr-aishell2-pruned-transducer-stateless5-B-2022-07-12": _get_aishell2_pretrained_model, # noqa
|