csukuangfj
committed on
Commit
·
697a4a4
1
Parent(s):
4366979
add more paraformer models
Browse files
model.py
CHANGED
@@ -930,11 +930,11 @@ def _get_gigaspeech_pre_trained_model_onnx(
|
|
930 |
|
931 |
|
932 |
@lru_cache(maxsize=10)
|
933 |
-
def
|
934 |
repo_id: str,
|
935 |
decoding_method: str,
|
936 |
num_active_paths: int,
|
937 |
-
) -> sherpa_onnx.
|
938 |
assert repo_id in [
|
939 |
"csukuangfj/sherpa-onnx-streaming-paraformer-trilingual-zh-cantonese-en",
|
940 |
], repo_id
|
@@ -1000,13 +1000,14 @@ def _get_paraformer_en_pre_trained_model(
|
|
1000 |
|
1001 |
|
1002 |
@lru_cache(maxsize=10)
|
1003 |
-
def
|
1004 |
repo_id: str,
|
1005 |
decoding_method: str,
|
1006 |
num_active_paths: int,
|
1007 |
) -> sherpa_onnx.OfflineRecognizer:
|
1008 |
assert repo_id in [
|
1009 |
"csukuangfj/sherpa-onnx-paraformer-zh-2023-03-28",
|
|
|
1010 |
], repo_id
|
1011 |
|
1012 |
nn_model = _get_nn_model_filename(
|
@@ -1128,7 +1129,9 @@ def _get_multi_zh_hans_pre_trained_model(
|
|
1128 |
|
1129 |
|
1130 |
chinese_models = {
|
1131 |
-
"csukuangfj/sherpa-onnx-paraformer-zh-2023-03-28":
|
|
|
|
|
1132 |
"luomingshuang/icefall_asr_wenetspeech_pruned_transducer_stateless2": _get_wenetspeech_pre_trained_model, # noqa
|
1133 |
"zrjin/sherpa-onnx-zipformer-multi-zh-hans-2023-9-2": _get_multi_zh_hans_pre_trained_model, # noqa
|
1134 |
"zrjin/icefall-asr-aishell-zipformer-large-2023-10-24": _get_aishell_pre_trained_model, # noqa
|
@@ -1148,6 +1151,7 @@ english_models = {
|
|
1148 |
"whisper-base.en": _get_whisper_model,
|
1149 |
"whisper-small.en": _get_whisper_model,
|
1150 |
# "whisper-medium.en": _get_whisper_model,
|
|
|
1151 |
"yfyeung/icefall-asr-gigaspeech-zipformer-2023-10-17": _get_gigaspeech_pre_trained_model_onnx, # noqa
|
1152 |
"wgb14/icefall-asr-gigaspeech-pruned-transducer-stateless2": _get_gigaspeech_pre_trained_model, # noqa
|
1153 |
"yfyeung/icefall-asr-multidataset-pruned_transducer_stateless7-2023-05-04": _get_english_model, # noqa
|
@@ -1199,8 +1203,8 @@ russian_models = {
|
|
1199 |
}
|
1200 |
|
1201 |
chinese_cantonese_english_models = {
|
1202 |
-
"csukuangfj/sherpa-onnx-streaming-paraformer-trilingual-zh-cantonese-en":
|
1203 |
-
|
1204 |
}
|
1205 |
|
1206 |
|
|
|
930 |
|
931 |
|
932 |
@lru_cache(maxsize=10)
|
933 |
+
def _get_streaming_paraformer_zh_yue_en_pre_trained_model(
|
934 |
repo_id: str,
|
935 |
decoding_method: str,
|
936 |
num_active_paths: int,
|
937 |
+
) -> sherpa_onnx.OnlineRecognizer:
|
938 |
assert repo_id in [
|
939 |
"csukuangfj/sherpa-onnx-streaming-paraformer-trilingual-zh-cantonese-en",
|
940 |
], repo_id
|
|
|
1000 |
|
1001 |
|
1002 |
@lru_cache(maxsize=10)
|
1003 |
+
def _get_paraformer_pre_trained_model(
|
1004 |
repo_id: str,
|
1005 |
decoding_method: str,
|
1006 |
num_active_paths: int,
|
1007 |
) -> sherpa_onnx.OfflineRecognizer:
|
1008 |
assert repo_id in [
|
1009 |
"csukuangfj/sherpa-onnx-paraformer-zh-2023-03-28",
|
1010 |
+
"csukuangfj/sherpa-onnx-paraformer-trilingual-zh-cantonese-en",
|
1011 |
], repo_id
|
1012 |
|
1013 |
nn_model = _get_nn_model_filename(
|
|
|
1129 |
|
1130 |
|
1131 |
chinese_models = {
|
1132 |
+
"csukuangfj/sherpa-onnx-paraformer-zh-2023-03-28": _get_paraformer_pre_trained_model,
|
1133 |
+
"csukuangfj/sherpa-onnx-paraformer-zh-small-2024-03-09": _get_paraformer_pre_trained_model,
|
1134 |
+
"csukuangfj/sherpa-onnx-paraformer-zh-2024-03-09": _get_paraformer_pre_trained_model,
|
1135 |
"luomingshuang/icefall_asr_wenetspeech_pruned_transducer_stateless2": _get_wenetspeech_pre_trained_model, # noqa
|
1136 |
"zrjin/sherpa-onnx-zipformer-multi-zh-hans-2023-9-2": _get_multi_zh_hans_pre_trained_model, # noqa
|
1137 |
"zrjin/icefall-asr-aishell-zipformer-large-2023-10-24": _get_aishell_pre_trained_model, # noqa
|
|
|
1151 |
"whisper-base.en": _get_whisper_model,
|
1152 |
"whisper-small.en": _get_whisper_model,
|
1153 |
# "whisper-medium.en": _get_whisper_model,
|
1154 |
+
"csukuangfj/sherpa-onnx-paraformer-en-small-2024-03-09": _get_paraformer_pre_trained_model,
|
1155 |
"yfyeung/icefall-asr-gigaspeech-zipformer-2023-10-17": _get_gigaspeech_pre_trained_model_onnx, # noqa
|
1156 |
"wgb14/icefall-asr-gigaspeech-pruned-transducer-stateless2": _get_gigaspeech_pre_trained_model, # noqa
|
1157 |
"yfyeung/icefall-asr-multidataset-pruned_transducer_stateless7-2023-05-04": _get_english_model, # noqa
|
|
|
1203 |
}
|
1204 |
|
1205 |
chinese_cantonese_english_models = {
|
1206 |
+
"csukuangfj/sherpa-onnx-streaming-paraformer-trilingual-zh-cantonese-en": _get_streaming_paraformer_zh_yue_en_pre_trained_model,
|
1207 |
+
"csukuangfj/sherpa-onnx-paraformer-trilingual-zh-cantonese-en": _get_paraformer_pre_trained_model,
|
1208 |
}
|
1209 |
|
1210 |
|