Spaces:
Running
Running
update
Browse files
- toolbox/k2_sherpa/examples.py +16 -0
- toolbox/k2_sherpa/nn_models.py +16 -5
toolbox/k2_sherpa/examples.py
CHANGED
@@ -43,6 +43,22 @@ examples = [
|
|
43 |
"Yes",
|
44 |
"./data/test_wavs/cantonese/1.wav",
|
45 |
],
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
46 |
[
|
47 |
"Tibetan",
|
48 |
"syzym/icefall-asr-xbmu-amdo31-pruned-transducer-stateless7-2022-12-02",
|
|
|
43 |
"Yes",
|
44 |
"./data/test_wavs/cantonese/1.wav",
|
45 |
],
|
46 |
+
[
|
47 |
+
"German",
|
48 |
+
"csukuangfj/wav2vec2.0-torchaudio",
|
49 |
+
"greedy_search",
|
50 |
+
4,
|
51 |
+
"No",
|
52 |
+
"./data/test_wavs/german/20120315-0900-PLENARY-14-de_20120315.wav",
|
53 |
+
],
|
54 |
+
[
|
55 |
+
"German",
|
56 |
+
"csukuangfj/wav2vec2.0-torchaudio",
|
57 |
+
"greedy_search",
|
58 |
+
4,
|
59 |
+
"No",
|
60 |
+
"./data/test_wavs/german/20170517-0900-PLENARY-16-de_20170517.wav",
|
61 |
+
],
|
62 |
[
|
63 |
"Tibetan",
|
64 |
"syzym/icefall-asr-xbmu-amdo31-pruned-transducer-stateless7-2022-12-02",
|
toolbox/k2_sherpa/nn_models.py
CHANGED
@@ -36,7 +36,7 @@ model_map = {
|
|
36 |
"nn_model_file_sub_folder": ".",
|
37 |
"tokens_file": "tokens.txt",
|
38 |
"tokens_file_sub_folder": ".",
|
39 |
-
"loader": "
|
40 |
},
|
41 |
{
|
42 |
"repo_id": "csukuangfj/sherpa-onnx-paraformer-zh-small-2024-03-09",
|
@@ -44,7 +44,7 @@ model_map = {
|
|
44 |
"nn_model_file_sub_folder": ".",
|
45 |
"tokens_file": "tokens.txt",
|
46 |
"tokens_file_sub_folder": ".",
|
47 |
-
"loader": "
|
48 |
},
|
49 |
{
|
50 |
"repo_id": "luomingshuang/icefall_asr_wenetspeech_pruned_transducer_stateless2",
|
@@ -186,7 +186,7 @@ model_map = {
|
|
186 |
"nn_model_file_sub_folder": ".",
|
187 |
"tokens_file": "tokens.txt",
|
188 |
"tokens_file_sub_folder": ".",
|
189 |
-
"loader": "
|
190 |
},
|
191 |
{
|
192 |
"repo_id": "yfyeung/icefall-asr-gigaspeech-zipformer-2023-10-17",
|
@@ -262,7 +262,7 @@ model_map = {
|
|
262 |
"nn_model_file_sub_folder": ".",
|
263 |
"tokens_file": "new_tokens.txt",
|
264 |
"tokens_file_sub_folder": ".",
|
265 |
-
"loader": "
|
266 |
},
|
267 |
{
|
268 |
"repo_id": "Zengwei/icefall-asr-librispeech-zipformer-large-2023-05-16",
|
@@ -340,7 +340,7 @@ model_map = {
|
|
340 |
"nn_model_file_sub_folder": ".",
|
341 |
"tokens_file": "tokens.txt",
|
342 |
"tokens_file_sub_folder": ".",
|
343 |
-
"loader": "
|
344 |
},
|
345 |
{
|
346 |
"repo_id": "ptrnull/icefall-asr-conv-emformer-transducer-stateless2-zh",
|
@@ -421,6 +421,17 @@ model_map = {
|
|
421 |
"loader": "load_sherpa_online_recognizer",
|
422 |
},
|
423 |
],
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
424 |
"Tibetan": [
|
425 |
{
|
426 |
"repo_id": "syzym/icefall-asr-xbmu-amdo31-pruned-transducer-stateless7-2022-12-02",
|
|
|
36 |
"nn_model_file_sub_folder": ".",
|
37 |
"tokens_file": "tokens.txt",
|
38 |
"tokens_file_sub_folder": ".",
|
39 |
+
"loader": "load_sherpa_onnx_offline_recognizer_from_paraformer",
|
40 |
},
|
41 |
{
|
42 |
"repo_id": "csukuangfj/sherpa-onnx-paraformer-zh-small-2024-03-09",
|
|
|
44 |
"nn_model_file_sub_folder": ".",
|
45 |
"tokens_file": "tokens.txt",
|
46 |
"tokens_file_sub_folder": ".",
|
47 |
+
"loader": "load_sherpa_onnx_offline_recognizer_from_paraformer",
|
48 |
},
|
49 |
{
|
50 |
"repo_id": "luomingshuang/icefall_asr_wenetspeech_pruned_transducer_stateless2",
|
|
|
186 |
"nn_model_file_sub_folder": ".",
|
187 |
"tokens_file": "tokens.txt",
|
188 |
"tokens_file_sub_folder": ".",
|
189 |
+
"loader": "load_sherpa_onnx_offline_recognizer_from_paraformer",
|
190 |
},
|
191 |
{
|
192 |
"repo_id": "yfyeung/icefall-asr-gigaspeech-zipformer-2023-10-17",
|
|
|
262 |
"nn_model_file_sub_folder": ".",
|
263 |
"tokens_file": "new_tokens.txt",
|
264 |
"tokens_file_sub_folder": ".",
|
265 |
+
"loader": "load_sherpa_onnx_offline_recognizer_from_paraformer",
|
266 |
},
|
267 |
{
|
268 |
"repo_id": "Zengwei/icefall-asr-librispeech-zipformer-large-2023-05-16",
|
|
|
340 |
"nn_model_file_sub_folder": ".",
|
341 |
"tokens_file": "tokens.txt",
|
342 |
"tokens_file_sub_folder": ".",
|
343 |
+
"loader": "load_sherpa_onnx_offline_recognizer_from_paraformer",
|
344 |
},
|
345 |
{
|
346 |
"repo_id": "ptrnull/icefall-asr-conv-emformer-transducer-stateless2-zh",
|
|
|
421 |
"loader": "load_sherpa_online_recognizer",
|
422 |
},
|
423 |
],
|
424 |
+
"German": [
|
425 |
+
{
|
426 |
+
"repo_id": "csukuangfj/wav2vec2.0-torchaudio",
|
427 |
+
"nn_model_file": "voxpopuli_asr_base_10k_de.pt",
|
428 |
+
"nn_model_file_sub_folder": ".",
|
429 |
+
"tokens_file": "tokens-de.txt",
|
430 |
+
"tokens_file_sub_folder": ".",
|
431 |
+
"normalize_samples": False,
|
432 |
+
"loader": "load_sherpa_offline_recognizer",
|
433 |
+
},
|
434 |
+
],
|
435 |
"Tibetan": [
|
436 |
{
|
437 |
"repo_id": "syzym/icefall-asr-xbmu-amdo31-pruned-transducer-stateless7-2022-12-02",
|