Spaces:
Build error
Build error
Commit
·
24c2ef7
1
Parent(s):
8b52167
add korean
Browse files- examples.py +32 -0
- model.py +11 -0
- test_wavs/korean/0.wav +0 -0
- test_wavs/korean/1.wav +0 -0
- test_wavs/korean/2.wav +0 -0
- test_wavs/korean/3.wav +0 -0
examples.py
CHANGED
|
@@ -56,6 +56,14 @@ examples = [
|
|
| 56 |
"Yes",
|
| 57 |
"./test_wavs/paraformer-zh/四川话.wav",
|
| 58 |
],
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 59 |
[
|
| 60 |
"Russian",
|
| 61 |
"alphacep/vosk-model-ru",
|
|
@@ -405,4 +413,28 @@ examples = [
|
|
| 405 |
"No",
|
| 406 |
"./test_wavs/french/common_voice_fr_27024649.wav",
|
| 407 |
],
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 408 |
]
|
|
|
|
| 56 |
"Yes",
|
| 57 |
"./test_wavs/paraformer-zh/四川话.wav",
|
| 58 |
],
|
| 59 |
+
[
|
| 60 |
+
"Korean",
|
| 61 |
+
"k2-fsa/sherpa-onnx-streaming-zipformer-korean-2024-06-16",
|
| 62 |
+
"greedy_search",
|
| 63 |
+
4,
|
| 64 |
+
"No",
|
| 65 |
+
"./test_wavs/korean/0.wav",
|
| 66 |
+
],
|
| 67 |
[
|
| 68 |
"Russian",
|
| 69 |
"alphacep/vosk-model-ru",
|
|
|
|
| 413 |
"No",
|
| 414 |
"./test_wavs/french/common_voice_fr_27024649.wav",
|
| 415 |
],
|
| 416 |
+
[
|
| 417 |
+
"Korean",
|
| 418 |
+
"k2-fsa/sherpa-onnx-streaming-zipformer-korean-2024-06-16",
|
| 419 |
+
"greedy_search",
|
| 420 |
+
4,
|
| 421 |
+
"No",
|
| 422 |
+
"./test_wavs/korean/1.wav",
|
| 423 |
+
],
|
| 424 |
+
[
|
| 425 |
+
"Korean",
|
| 426 |
+
"k2-fsa/sherpa-onnx-streaming-zipformer-korean-2024-06-16",
|
| 427 |
+
"greedy_search",
|
| 428 |
+
4,
|
| 429 |
+
"No",
|
| 430 |
+
"./test_wavs/korean/2.wav",
|
| 431 |
+
],
|
| 432 |
+
[
|
| 433 |
+
"Korean",
|
| 434 |
+
"k2-fsa/sherpa-onnx-streaming-zipformer-korean-2024-06-16",
|
| 435 |
+
"greedy_search",
|
| 436 |
+
4,
|
| 437 |
+
"No",
|
| 438 |
+
"./test_wavs/korean/3.wav",
|
| 439 |
+
],
|
| 440 |
]
|
model.py
CHANGED
|
@@ -208,6 +208,10 @@ def get_pretrained_model(
|
|
| 208 |
return russian_models[repo_id](
|
| 209 |
repo_id, decoding_method=decoding_method, num_active_paths=num_active_paths
|
| 210 |
)
|
|
|
|
|
|
|
|
|
|
|
|
|
| 211 |
else:
|
| 212 |
raise ValueError(f"Unsupported repo_id: {repo_id}")
|
| 213 |
|
|
@@ -894,6 +898,7 @@ def _get_streaming_zipformer_pre_trained_model(
|
|
| 894 |
) -> sherpa_onnx.OnlineRecognizer:
|
| 895 |
assert repo_id in [
|
| 896 |
"csukuangfj/sherpa-onnx-streaming-zipformer-bilingual-zh-en-2023-02-20",
|
|
|
|
| 897 |
], repo_id
|
| 898 |
|
| 899 |
encoder_model = _get_nn_model_filename(
|
|
@@ -1356,6 +1361,10 @@ cantonese_models = {
|
|
| 1356 |
"zrjin/icefall-asr-mdcc-zipformer-2024-03-11": _get_zrjin_cantonese_pre_trained_model,
|
| 1357 |
}
|
| 1358 |
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1359 |
|
| 1360 |
all_models = {
|
| 1361 |
**chinese_models,
|
|
@@ -1369,6 +1378,7 @@ all_models = {
|
|
| 1369 |
**german_models,
|
| 1370 |
**french_models,
|
| 1371 |
**russian_models,
|
|
|
|
| 1372 |
}
|
| 1373 |
|
| 1374 |
language_to_models = {
|
|
@@ -1384,4 +1394,5 @@ language_to_models = {
|
|
| 1384 |
"German": list(german_models.keys()),
|
| 1385 |
"French": list(french_models.keys()),
|
| 1386 |
"Russian": list(russian_models.keys()),
|
|
|
|
| 1387 |
}
|
|
|
|
| 208 |
return russian_models[repo_id](
|
| 209 |
repo_id, decoding_method=decoding_method, num_active_paths=num_active_paths
|
| 210 |
)
|
| 211 |
+
elif repo_id in korean_models:
|
| 212 |
+
return korean_models[repo_id](
|
| 213 |
+
repo_id, decoding_method=decoding_method, num_active_paths=num_active_paths
|
| 214 |
+
)
|
| 215 |
else:
|
| 216 |
raise ValueError(f"Unsupported repo_id: {repo_id}")
|
| 217 |
|
|
|
|
| 898 |
) -> sherpa_onnx.OnlineRecognizer:
|
| 899 |
assert repo_id in [
|
| 900 |
"csukuangfj/sherpa-onnx-streaming-zipformer-bilingual-zh-en-2023-02-20",
|
| 901 |
+
"k2-fsa/sherpa-onnx-streaming-zipformer-korean-2024-06-16",
|
| 902 |
], repo_id
|
| 903 |
|
| 904 |
encoder_model = _get_nn_model_filename(
|
|
|
|
| 1361 |
"zrjin/icefall-asr-mdcc-zipformer-2024-03-11": _get_zrjin_cantonese_pre_trained_model,
|
| 1362 |
}
|
| 1363 |
|
| 1364 |
+
korean_models = {
|
| 1365 |
+
"k2-fsa/sherpa-onnx-streaming-zipformer-korean-2024-06-16": _get_streaming_zipformer_pre_trained_model,
|
| 1366 |
+
}
|
| 1367 |
+
|
| 1368 |
|
| 1369 |
all_models = {
|
| 1370 |
**chinese_models,
|
|
|
|
| 1378 |
**german_models,
|
| 1379 |
**french_models,
|
| 1380 |
**russian_models,
|
| 1381 |
+
**korean_models,
|
| 1382 |
}
|
| 1383 |
|
| 1384 |
language_to_models = {
|
|
|
|
| 1394 |
"German": list(german_models.keys()),
|
| 1395 |
"French": list(french_models.keys()),
|
| 1396 |
"Russian": list(russian_models.keys()),
|
| 1397 |
+
"Korean": list(korean_models.keys()),
|
| 1398 |
}
|
test_wavs/korean/0.wav
ADDED
|
Binary file (113 kB). View file
|
|
|
test_wavs/korean/1.wav
ADDED
|
Binary file (109 kB). View file
|
|
|
test_wavs/korean/2.wav
ADDED
|
Binary file (212 kB). View file
|
|
|
test_wavs/korean/3.wav
ADDED
|
Binary file (85.8 kB). View file
|
|
|