Spaces:
Sleeping
Sleeping
update
Browse files- toolbox/k2_sherpa/examples.py +16 -0
- toolbox/k2_sherpa/nn_models.py +16 -5
toolbox/k2_sherpa/examples.py
CHANGED
|
@@ -43,6 +43,22 @@ examples = [
|
|
| 43 |
"Yes",
|
| 44 |
"./data/test_wavs/cantonese/1.wav",
|
| 45 |
],
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 46 |
[
|
| 47 |
"Tibetan",
|
| 48 |
"syzym/icefall-asr-xbmu-amdo31-pruned-transducer-stateless7-2022-12-02",
|
|
|
|
| 43 |
"Yes",
|
| 44 |
"./data/test_wavs/cantonese/1.wav",
|
| 45 |
],
|
| 46 |
+
[
|
| 47 |
+
"German",
|
| 48 |
+
"csukuangfj/wav2vec2.0-torchaudio",
|
| 49 |
+
"greedy_search",
|
| 50 |
+
4,
|
| 51 |
+
"No",
|
| 52 |
+
"./data/test_wavs/german/20120315-0900-PLENARY-14-de_20120315.wav",
|
| 53 |
+
],
|
| 54 |
+
[
|
| 55 |
+
"German",
|
| 56 |
+
"csukuangfj/wav2vec2.0-torchaudio",
|
| 57 |
+
"greedy_search",
|
| 58 |
+
4,
|
| 59 |
+
"No",
|
| 60 |
+
"./data/test_wavs/german/20170517-0900-PLENARY-16-de_20170517.wav",
|
| 61 |
+
],
|
| 62 |
[
|
| 63 |
"Tibetan",
|
| 64 |
"syzym/icefall-asr-xbmu-amdo31-pruned-transducer-stateless7-2022-12-02",
|
toolbox/k2_sherpa/nn_models.py
CHANGED
|
@@ -36,7 +36,7 @@ model_map = {
|
|
| 36 |
"nn_model_file_sub_folder": ".",
|
| 37 |
"tokens_file": "tokens.txt",
|
| 38 |
"tokens_file_sub_folder": ".",
|
| 39 |
-
"loader": "
|
| 40 |
},
|
| 41 |
{
|
| 42 |
"repo_id": "csukuangfj/sherpa-onnx-paraformer-zh-small-2024-03-09",
|
|
@@ -44,7 +44,7 @@ model_map = {
|
|
| 44 |
"nn_model_file_sub_folder": ".",
|
| 45 |
"tokens_file": "tokens.txt",
|
| 46 |
"tokens_file_sub_folder": ".",
|
| 47 |
-
"loader": "
|
| 48 |
},
|
| 49 |
{
|
| 50 |
"repo_id": "luomingshuang/icefall_asr_wenetspeech_pruned_transducer_stateless2",
|
|
@@ -186,7 +186,7 @@ model_map = {
|
|
| 186 |
"nn_model_file_sub_folder": ".",
|
| 187 |
"tokens_file": "tokens.txt",
|
| 188 |
"tokens_file_sub_folder": ".",
|
| 189 |
-
"loader": "
|
| 190 |
},
|
| 191 |
{
|
| 192 |
"repo_id": "yfyeung/icefall-asr-gigaspeech-zipformer-2023-10-17",
|
|
@@ -262,7 +262,7 @@ model_map = {
|
|
| 262 |
"nn_model_file_sub_folder": ".",
|
| 263 |
"tokens_file": "new_tokens.txt",
|
| 264 |
"tokens_file_sub_folder": ".",
|
| 265 |
-
"loader": "
|
| 266 |
},
|
| 267 |
{
|
| 268 |
"repo_id": "Zengwei/icefall-asr-librispeech-zipformer-large-2023-05-16",
|
|
@@ -340,7 +340,7 @@ model_map = {
|
|
| 340 |
"nn_model_file_sub_folder": ".",
|
| 341 |
"tokens_file": "tokens.txt",
|
| 342 |
"tokens_file_sub_folder": ".",
|
| 343 |
-
"loader": "
|
| 344 |
},
|
| 345 |
{
|
| 346 |
"repo_id": "ptrnull/icefall-asr-conv-emformer-transducer-stateless2-zh",
|
|
@@ -421,6 +421,17 @@ model_map = {
|
|
| 421 |
"loader": "load_sherpa_online_recognizer",
|
| 422 |
},
|
| 423 |
],
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 424 |
"Tibetan": [
|
| 425 |
{
|
| 426 |
"repo_id": "syzym/icefall-asr-xbmu-amdo31-pruned-transducer-stateless7-2022-12-02",
|
|
|
|
| 36 |
"nn_model_file_sub_folder": ".",
|
| 37 |
"tokens_file": "tokens.txt",
|
| 38 |
"tokens_file_sub_folder": ".",
|
| 39 |
+
"loader": "load_sherpa_onnx_offline_recognizer_from_paraformer",
|
| 40 |
},
|
| 41 |
{
|
| 42 |
"repo_id": "csukuangfj/sherpa-onnx-paraformer-zh-small-2024-03-09",
|
|
|
|
| 44 |
"nn_model_file_sub_folder": ".",
|
| 45 |
"tokens_file": "tokens.txt",
|
| 46 |
"tokens_file_sub_folder": ".",
|
| 47 |
+
"loader": "load_sherpa_onnx_offline_recognizer_from_paraformer",
|
| 48 |
},
|
| 49 |
{
|
| 50 |
"repo_id": "luomingshuang/icefall_asr_wenetspeech_pruned_transducer_stateless2",
|
|
|
|
| 186 |
"nn_model_file_sub_folder": ".",
|
| 187 |
"tokens_file": "tokens.txt",
|
| 188 |
"tokens_file_sub_folder": ".",
|
| 189 |
+
"loader": "load_sherpa_onnx_offline_recognizer_from_paraformer",
|
| 190 |
},
|
| 191 |
{
|
| 192 |
"repo_id": "yfyeung/icefall-asr-gigaspeech-zipformer-2023-10-17",
|
|
|
|
| 262 |
"nn_model_file_sub_folder": ".",
|
| 263 |
"tokens_file": "new_tokens.txt",
|
| 264 |
"tokens_file_sub_folder": ".",
|
| 265 |
+
"loader": "load_sherpa_onnx_offline_recognizer_from_paraformer",
|
| 266 |
},
|
| 267 |
{
|
| 268 |
"repo_id": "Zengwei/icefall-asr-librispeech-zipformer-large-2023-05-16",
|
|
|
|
| 340 |
"nn_model_file_sub_folder": ".",
|
| 341 |
"tokens_file": "tokens.txt",
|
| 342 |
"tokens_file_sub_folder": ".",
|
| 343 |
+
"loader": "load_sherpa_onnx_offline_recognizer_from_paraformer",
|
| 344 |
},
|
| 345 |
{
|
| 346 |
"repo_id": "ptrnull/icefall-asr-conv-emformer-transducer-stateless2-zh",
|
|
|
|
| 421 |
"loader": "load_sherpa_online_recognizer",
|
| 422 |
},
|
| 423 |
],
|
| 424 |
+
"German": [
|
| 425 |
+
{
|
| 426 |
+
"repo_id": "csukuangfj/wav2vec2.0-torchaudio",
|
| 427 |
+
"nn_model_file": "voxpopuli_asr_base_10k_de.pt",
|
| 428 |
+
"nn_model_file_sub_folder": ".",
|
| 429 |
+
"tokens_file": "tokens-de.txt",
|
| 430 |
+
"tokens_file_sub_folder": ".",
|
| 431 |
+
"normalize_samples": False,
|
| 432 |
+
"loader": "load_sherpa_offline_recognizer",
|
| 433 |
+
},
|
| 434 |
+
],
|
| 435 |
"Tibetan": [
|
| 436 |
{
|
| 437 |
"repo_id": "syzym/icefall-asr-xbmu-amdo31-pruned-transducer-stateless7-2022-12-02",
|