csukuangfj committed on
Commit
697a4a4
1 Parent(s): 4366979

add more paraformer models

Browse files
Files changed (1) hide show
  1. model.py +10 -6
model.py CHANGED
@@ -930,11 +930,11 @@ def _get_gigaspeech_pre_trained_model_onnx(
930
 
931
 
932
  @lru_cache(maxsize=10)
933
- def _get_paraformer_zh_yue_en_pre_trained_model(
934
  repo_id: str,
935
  decoding_method: str,
936
  num_active_paths: int,
937
- ) -> sherpa_onnx.OfflineRecognizer:
938
  assert repo_id in [
939
  "csukuangfj/sherpa-onnx-streaming-paraformer-trilingual-zh-cantonese-en",
940
  ], repo_id
@@ -1000,13 +1000,14 @@ def _get_paraformer_en_pre_trained_model(
1000
 
1001
 
1002
  @lru_cache(maxsize=10)
1003
- def _get_paraformer_zh_pre_trained_model(
1004
  repo_id: str,
1005
  decoding_method: str,
1006
  num_active_paths: int,
1007
  ) -> sherpa_onnx.OfflineRecognizer:
1008
  assert repo_id in [
1009
  "csukuangfj/sherpa-onnx-paraformer-zh-2023-03-28",
 
1010
  ], repo_id
1011
 
1012
  nn_model = _get_nn_model_filename(
@@ -1128,7 +1129,9 @@ def _get_multi_zh_hans_pre_trained_model(
1128
 
1129
 
1130
  chinese_models = {
1131
- "csukuangfj/sherpa-onnx-paraformer-zh-2023-03-28": _get_paraformer_zh_pre_trained_model,
 
 
1132
  "luomingshuang/icefall_asr_wenetspeech_pruned_transducer_stateless2": _get_wenetspeech_pre_trained_model, # noqa
1133
  "zrjin/sherpa-onnx-zipformer-multi-zh-hans-2023-9-2": _get_multi_zh_hans_pre_trained_model, # noqa
1134
  "zrjin/icefall-asr-aishell-zipformer-large-2023-10-24": _get_aishell_pre_trained_model, # noqa
@@ -1148,6 +1151,7 @@ english_models = {
1148
  "whisper-base.en": _get_whisper_model,
1149
  "whisper-small.en": _get_whisper_model,
1150
  # "whisper-medium.en": _get_whisper_model,
 
1151
  "yfyeung/icefall-asr-gigaspeech-zipformer-2023-10-17": _get_gigaspeech_pre_trained_model_onnx, # noqa
1152
  "wgb14/icefall-asr-gigaspeech-pruned-transducer-stateless2": _get_gigaspeech_pre_trained_model, # noqa
1153
  "yfyeung/icefall-asr-multidataset-pruned_transducer_stateless7-2023-05-04": _get_english_model, # noqa
@@ -1199,8 +1203,8 @@ russian_models = {
1199
  }
1200
 
1201
  chinese_cantonese_english_models = {
1202
- "csukuangfj/sherpa-onnx-streaming-paraformer-trilingual-zh-cantonese-en": _get_paraformer_zh_yue_en_pre_trained_model,
1203
- # "csukuangfj/sherpa-onnx-streaming-paraformer-trilingual-zh-cantonese-en": _get_paraformer_en_pre_trained_model,
1204
  }
1205
 
1206
 
 
930
 
931
 
932
  @lru_cache(maxsize=10)
933
+ def _get_streaming_paraformer_zh_yue_en_pre_trained_model(
934
  repo_id: str,
935
  decoding_method: str,
936
  num_active_paths: int,
937
+ ) -> sherpa_onnx.OnlineRecognizer:
938
  assert repo_id in [
939
  "csukuangfj/sherpa-onnx-streaming-paraformer-trilingual-zh-cantonese-en",
940
  ], repo_id
 
1000
 
1001
 
1002
  @lru_cache(maxsize=10)
1003
+ def _get_paraformer_pre_trained_model(
1004
  repo_id: str,
1005
  decoding_method: str,
1006
  num_active_paths: int,
1007
  ) -> sherpa_onnx.OfflineRecognizer:
1008
  assert repo_id in [
1009
  "csukuangfj/sherpa-onnx-paraformer-zh-2023-03-28",
1010
+ "csukuangfj/sherpa-onnx-paraformer-trilingual-zh-cantonese-en",
1011
  ], repo_id
1012
 
1013
  nn_model = _get_nn_model_filename(
 
1129
 
1130
 
1131
  chinese_models = {
1132
+ "csukuangfj/sherpa-onnx-paraformer-zh-2023-03-28": _get_paraformer_pre_trained_model,
1133
+ "csukuangfj/sherpa-onnx-paraformer-zh-small-2024-03-09": _get_paraformer_pre_trained_model,
1134
+ "csukuangfj/sherpa-onnx-paraformer-zh-2024-03-09": _get_paraformer_pre_trained_model,
1135
  "luomingshuang/icefall_asr_wenetspeech_pruned_transducer_stateless2": _get_wenetspeech_pre_trained_model, # noqa
1136
  "zrjin/sherpa-onnx-zipformer-multi-zh-hans-2023-9-2": _get_multi_zh_hans_pre_trained_model, # noqa
1137
  "zrjin/icefall-asr-aishell-zipformer-large-2023-10-24": _get_aishell_pre_trained_model, # noqa
 
1151
  "whisper-base.en": _get_whisper_model,
1152
  "whisper-small.en": _get_whisper_model,
1153
  # "whisper-medium.en": _get_whisper_model,
1154
+ "csukuangfj/sherpa-onnx-paraformer-en-small-2024-03-09": _get_paraformer_pre_trained_model,
1155
  "yfyeung/icefall-asr-gigaspeech-zipformer-2023-10-17": _get_gigaspeech_pre_trained_model_onnx, # noqa
1156
  "wgb14/icefall-asr-gigaspeech-pruned-transducer-stateless2": _get_gigaspeech_pre_trained_model, # noqa
1157
  "yfyeung/icefall-asr-multidataset-pruned_transducer_stateless7-2023-05-04": _get_english_model, # noqa
 
1203
  }
1204
 
1205
  chinese_cantonese_english_models = {
1206
+ "csukuangfj/sherpa-onnx-streaming-paraformer-trilingual-zh-cantonese-en": _get_streaming_paraformer_zh_yue_en_pre_trained_model,
1207
+ "csukuangfj/sherpa-onnx-paraformer-trilingual-zh-cantonese-en": _get_paraformer_pre_trained_model,
1208
  }
1209
 
1210