csukuangfj committed on
Commit
74a5c18
·
1 Parent(s): 4e478c6

update models

Browse files
Files changed (1) hide show
  1. model.py +56 -0
model.py CHANGED
@@ -956,6 +956,61 @@ def _get_paraformer_zh_pre_trained_model(
956
  return recognizer
957
 
958
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
959
  def _get_multi_zh_hans_pre_trained_model(
960
  repo_id: str,
961
  decoding_method: str,
@@ -1002,6 +1057,7 @@ chinese_models = {
1002
  "csukuangfj/sherpa-onnx-paraformer-zh-2023-03-28": _get_paraformer_zh_pre_trained_model,
1003
  "luomingshuang/icefall_asr_wenetspeech_pruned_transducer_stateless2": _get_wenetspeech_pre_trained_model, # noqa
1004
  "zrjin/sherpa-onnx-zipformer-multi-zh-hans-2023-9-2": _get_multi_zh_hans_pre_trained_model, # noqa
 
1005
  "desh2608/icefall-asr-alimeeting-pruned-transducer-stateless7": _get_alimeeting_pre_trained_model,
1006
  "yuekai/icefall-asr-aishell2-pruned-transducer-stateless5-A-2022-07-12": _get_aishell2_pretrained_model, # noqa
1007
  "yuekai/icefall-asr-aishell2-pruned-transducer-stateless5-B-2022-07-12": _get_aishell2_pretrained_model, # noqa
 
956
  return recognizer
957
 
958
 
959
def _get_aishell_pre_trained_model(
    repo_id: str,
    decoding_method: str,
    num_active_paths: int,
) -> sherpa_onnx.OfflineRecognizer:
    """Create an offline transducer recognizer for an AISHELL zipformer repo.

    Args:
      repo_id:
        One of the supported ``zrjin/icefall-asr-aishell-zipformer-*`` repo
        ids listed in the table below.
      decoding_method:
        Passed through unchanged as ``decoding_method`` to
        ``sherpa_onnx.OfflineRecognizer.from_transducer``.
      num_active_paths:
        Passed through as ``max_active_paths`` to
        ``sherpa_onnx.OfflineRecognizer.from_transducer``.

    Returns:
      The recognizer returned by
      ``sherpa_onnx.OfflineRecognizer.from_transducer``.

    Raises:
      AssertionError: If ``repo_id`` is not one of the supported repos.
    """
    # (epoch, avg) pair that appears in the ONNX file names of each repo.
    # Keeping the supported ids in one table means the validation and the
    # per-repo values can never drift apart.
    checkpoints = {
        "zrjin/icefall-asr-aishell-zipformer-large-2023-10-24": (56, 23),
        "zrjin/icefall-asr-aishell-zipformer-small-2023-10-24": (55, 21),
        "zrjin/icefall-asr-aishell-zipformer-2023-10-24": (55, 17),
    }

    if repo_id not in checkpoints:
        # Raised explicitly (instead of using an ``assert`` statement) so the
        # check still runs under ``python -O``; AssertionError is kept so that
        # callers observe the same exception type as before.
        raise AssertionError(repo_id)

    epoch, avg = checkpoints[repo_id]
    suffix = f"epoch-{epoch}-avg-{avg}.onnx"

    encoder_model = _get_nn_model_filename(
        repo_id=repo_id,
        filename=f"encoder-{suffix}",
        subfolder="exp",
    )

    decoder_model = _get_nn_model_filename(
        repo_id=repo_id,
        filename=f"decoder-{suffix}",
        subfolder="exp",
    )

    joiner_model = _get_nn_model_filename(
        repo_id=repo_id,
        filename=f"joiner-{suffix}",
        subfolder="exp",
    )

    tokens = _get_token_filename(repo_id=repo_id, subfolder="data/lang_char")

    recognizer = sherpa_onnx.OfflineRecognizer.from_transducer(
        tokens=tokens,
        encoder=encoder_model,
        decoder=decoder_model,
        joiner=joiner_model,
        num_threads=2,
        sample_rate=16000,
        feature_dim=80,
        decoding_method=decoding_method,
        max_active_paths=num_active_paths,
    )

    return recognizer
1012
+
1013
+
1014
  def _get_multi_zh_hans_pre_trained_model(
1015
  repo_id: str,
1016
  decoding_method: str,
 
1057
  "csukuangfj/sherpa-onnx-paraformer-zh-2023-03-28": _get_paraformer_zh_pre_trained_model,
1058
  "luomingshuang/icefall_asr_wenetspeech_pruned_transducer_stateless2": _get_wenetspeech_pre_trained_model, # noqa
1059
  "zrjin/sherpa-onnx-zipformer-multi-zh-hans-2023-9-2": _get_multi_zh_hans_pre_trained_model, # noqa
1060
+ "zrjin/icefall-asr-aishell-zipformer-large-2023-10-24": _get_aishell_pre_trained_model, # noqa
1061
  "desh2608/icefall-asr-alimeeting-pruned-transducer-stateless7": _get_alimeeting_pre_trained_model,
1062
  "yuekai/icefall-asr-aishell2-pruned-transducer-stateless5-A-2022-07-12": _get_aishell2_pretrained_model, # noqa
1063
  "yuekai/icefall-asr-aishell2-pruned-transducer-stateless5-B-2022-07-12": _get_aishell2_pretrained_model, # noqa