Spaces:
Build error
Commit
·
697a4a4
1
Parent(s):
4366979
add more paraformer models
Browse files
model.py
CHANGED
|
@@ -930,11 +930,11 @@ def _get_gigaspeech_pre_trained_model_onnx(
|
|
| 930 |
|
| 931 |
|
| 932 |
@lru_cache(maxsize=10)
|
| 933 |
-
def
|
| 934 |
repo_id: str,
|
| 935 |
decoding_method: str,
|
| 936 |
num_active_paths: int,
|
| 937 |
-
) -> sherpa_onnx.OfflineRecognizer:
|
| 938 |
assert repo_id in [
|
| 939 |
"csukuangfj/sherpa-onnx-streaming-paraformer-trilingual-zh-cantonese-en",
|
| 940 |
], repo_id
|
|
@@ -1000,13 +1000,14 @@ def _get_paraformer_en_pre_trained_model(
|
|
| 1000 |
|
| 1001 |
|
| 1002 |
@lru_cache(maxsize=10)
|
| 1003 |
-
def
|
| 1004 |
repo_id: str,
|
| 1005 |
decoding_method: str,
|
| 1006 |
num_active_paths: int,
|
| 1007 |
) -> sherpa_onnx.OfflineRecognizer:
|
| 1008 |
assert repo_id in [
|
| 1009 |
"csukuangfj/sherpa-onnx-paraformer-zh-2023-03-28",
|
|
|
|
| 1010 |
], repo_id
|
| 1011 |
|
| 1012 |
nn_model = _get_nn_model_filename(
|
|
@@ -1128,7 +1129,9 @@ def _get_multi_zh_hans_pre_trained_model(
|
|
| 1128 |
|
| 1129 |
|
| 1130 |
chinese_models = {
|
| 1131 |
-
"csukuangfj/sherpa-onnx-paraformer-zh-2023-03-28":
|
|
|
|
|
|
|
| 1132 |
"luomingshuang/icefall_asr_wenetspeech_pruned_transducer_stateless2": _get_wenetspeech_pre_trained_model, # noqa
|
| 1133 |
"zrjin/sherpa-onnx-zipformer-multi-zh-hans-2023-9-2": _get_multi_zh_hans_pre_trained_model, # noqa
|
| 1134 |
"zrjin/icefall-asr-aishell-zipformer-large-2023-10-24": _get_aishell_pre_trained_model, # noqa
|
|
@@ -1148,6 +1151,7 @@ english_models = {
|
|
| 1148 |
"whisper-base.en": _get_whisper_model,
|
| 1149 |
"whisper-small.en": _get_whisper_model,
|
| 1150 |
# "whisper-medium.en": _get_whisper_model,
|
|
|
|
| 1151 |
"yfyeung/icefall-asr-gigaspeech-zipformer-2023-10-17": _get_gigaspeech_pre_trained_model_onnx, # noqa
|
| 1152 |
"wgb14/icefall-asr-gigaspeech-pruned-transducer-stateless2": _get_gigaspeech_pre_trained_model, # noqa
|
| 1153 |
"yfyeung/icefall-asr-multidataset-pruned_transducer_stateless7-2023-05-04": _get_english_model, # noqa
|
|
@@ -1199,8 +1203,8 @@ russian_models = {
|
|
| 1199 |
}
|
| 1200 |
|
| 1201 |
chinese_cantonese_english_models = {
|
| 1202 |
-
"csukuangfj/sherpa-onnx-streaming-paraformer-trilingual-zh-cantonese-en":
|
| 1203 |
-
|
| 1204 |
}
|
| 1205 |
|
| 1206 |
|
|
|
|
| 930 |
|
| 931 |
|
| 932 |
@lru_cache(maxsize=10)
|
| 933 |
+
def _get_streaming_paraformer_zh_yue_en_pre_trained_model(
|
| 934 |
repo_id: str,
|
| 935 |
decoding_method: str,
|
| 936 |
num_active_paths: int,
|
| 937 |
+
) -> sherpa_onnx.OnlineRecognizer:
|
| 938 |
assert repo_id in [
|
| 939 |
"csukuangfj/sherpa-onnx-streaming-paraformer-trilingual-zh-cantonese-en",
|
| 940 |
], repo_id
|
|
|
|
| 1000 |
|
| 1001 |
|
| 1002 |
@lru_cache(maxsize=10)
|
| 1003 |
+
def _get_paraformer_pre_trained_model(
|
| 1004 |
repo_id: str,
|
| 1005 |
decoding_method: str,
|
| 1006 |
num_active_paths: int,
|
| 1007 |
) -> sherpa_onnx.OfflineRecognizer:
|
| 1008 |
assert repo_id in [
|
| 1009 |
"csukuangfj/sherpa-onnx-paraformer-zh-2023-03-28",
|
| 1010 |
+
"csukuangfj/sherpa-onnx-paraformer-trilingual-zh-cantonese-en",
|
| 1011 |
], repo_id
|
| 1012 |
|
| 1013 |
nn_model = _get_nn_model_filename(
|
|
|
|
| 1129 |
|
| 1130 |
|
| 1131 |
chinese_models = {
|
| 1132 |
+
"csukuangfj/sherpa-onnx-paraformer-zh-2023-03-28": _get_paraformer_pre_trained_model,
|
| 1133 |
+
"csukuangfj/sherpa-onnx-paraformer-zh-small-2024-03-09": _get_paraformer_pre_trained_model,
|
| 1134 |
+
"csukuangfj/sherpa-onnx-paraformer-zh-2024-03-09": _get_paraformer_pre_trained_model,
|
| 1135 |
"luomingshuang/icefall_asr_wenetspeech_pruned_transducer_stateless2": _get_wenetspeech_pre_trained_model, # noqa
|
| 1136 |
"zrjin/sherpa-onnx-zipformer-multi-zh-hans-2023-9-2": _get_multi_zh_hans_pre_trained_model, # noqa
|
| 1137 |
"zrjin/icefall-asr-aishell-zipformer-large-2023-10-24": _get_aishell_pre_trained_model, # noqa
|
|
|
|
| 1151 |
"whisper-base.en": _get_whisper_model,
|
| 1152 |
"whisper-small.en": _get_whisper_model,
|
| 1153 |
# "whisper-medium.en": _get_whisper_model,
|
| 1154 |
+
"csukuangfj/sherpa-onnx-paraformer-en-small-2024-03-09": _get_paraformer_pre_trained_model,
|
| 1155 |
"yfyeung/icefall-asr-gigaspeech-zipformer-2023-10-17": _get_gigaspeech_pre_trained_model_onnx, # noqa
|
| 1156 |
"wgb14/icefall-asr-gigaspeech-pruned-transducer-stateless2": _get_gigaspeech_pre_trained_model, # noqa
|
| 1157 |
"yfyeung/icefall-asr-multidataset-pruned_transducer_stateless7-2023-05-04": _get_english_model, # noqa
|
|
|
|
| 1203 |
}
|
| 1204 |
|
| 1205 |
chinese_cantonese_english_models = {
|
| 1206 |
+
"csukuangfj/sherpa-onnx-streaming-paraformer-trilingual-zh-cantonese-en": _get_streaming_paraformer_zh_yue_en_pre_trained_model,
|
| 1207 |
+
"csukuangfj/sherpa-onnx-paraformer-trilingual-zh-cantonese-en": _get_paraformer_pre_trained_model,
|
| 1208 |
}
|
| 1209 |
|
| 1210 |
|