csukuangfj committed on
Commit
387e4e6
·
1 Parent(s): 320f57c

add more models

Browse files
Files changed (1) hide show
  1. model.py +18 -0
model.py CHANGED
@@ -170,6 +170,10 @@ def get_pretrained_model(
170
  return multi_lingual_models[repo_id](
171
  repo_id, decoding_method=decoding_method, num_active_paths=num_active_paths
172
  )
 
 
 
 
173
  elif repo_id in chinese_models:
174
  return chinese_models[repo_id](
175
  repo_id, decoding_method=decoding_method, num_active_paths=num_active_paths
@@ -1594,12 +1598,14 @@ def _get_streaming_zipformer_pre_trained_model(
1594
  "csukuangfj/sherpa-onnx-streaming-zipformer-en-kroko-2025-08-06",
1595
  "csukuangfj/sherpa-onnx-streaming-zipformer-es-kroko-2025-08-06",
1596
  "csukuangfj/sherpa-onnx-streaming-zipformer-fr-kroko-2025-08-06",
 
1597
  ], repo_id
1598
 
1599
  if repo_id in [
1600
  "csukuangfj/sherpa-onnx-streaming-zipformer-en-kroko-2025-08-06",
1601
  "csukuangfj/sherpa-onnx-streaming-zipformer-es-kroko-2025-08-06",
1602
  "csukuangfj/sherpa-onnx-streaming-zipformer-fr-kroko-2025-08-06",
 
1603
  ]:
1604
  encoder_model = _get_nn_model_filename(
1605
  repo_id=repo_id,
@@ -2089,6 +2095,10 @@ english_models = {
2089
  "csukuangfj/wenet-english-model": _get_wenet_model,
2090
  }
2091
 
 
 
 
 
2092
  multi_lingual_models = {
2093
  "csukuangfj/sherpa-onnx-dolphin-base-ctc-multi-lang-int8-2025-04-02": _get_dolphin_ctc_models,
2094
  "csukuangfj/sherpa-onnx-dolphin-small-ctc-multi-lang-int8-2025-04-02": _get_dolphin_ctc_models,
@@ -2115,6 +2125,8 @@ arabic_models = {
2115
  }
2116
 
2117
  german_models = {
 
 
2118
  "csukuangfj/sherpa-onnx-nemo-transducer-stt_de_fastconformer_hybrid_large_pc": _get_sherpa_onnx_nemo_transducer_models,
2119
  "csukuangfj/sherpa-onnx-nemo-transducer-stt_de_fastconformer_hybrid_large_pc-int8": _get_sherpa_onnx_nemo_transducer_models_int8,
2120
  "csukuangfj/sherpa-onnx-nemo-stt_de_fastconformer_hybrid_large_pc": _get_sherpa_onnx_nemo_ctc_models,
@@ -2123,11 +2135,13 @@ german_models = {
2123
  }
2124
 
2125
  french_models = {
 
2126
  "shaojieli/sherpa-onnx-streaming-zipformer-fr-2023-04-14": _get_french_pre_trained_model,
2127
  "csukuangfj/sherpa-onnx-streaming-zipformer-fr-kroko-2025-08-06": _get_streaming_zipformer_pre_trained_model,
2128
  }
2129
 
2130
  spanish_models = {
 
2131
  "csukuangfj/sherpa-onnx-streaming-zipformer-es-kroko-2025-08-06": _get_streaming_zipformer_pre_trained_model,
2132
  }
2133
 
@@ -2138,6 +2152,7 @@ japanese_models = {
2138
  }
2139
 
2140
  russian_models = {
 
2141
  "csukuangfj/sherpa-onnx-nemo-transducer-giga-am-v2-russian-2025-04-19": _get_russian_pre_trained_model,
2142
  "csukuangfj/sherpa-onnx-nemo-ctc-giga-am-v2-russian-2025-04-19": _get_russian_pre_trained_model_ctc,
2143
  "csukuangfj/sherpa-onnx-nemo-transducer-giga-am-russian-2024-10-24": _get_russian_pre_trained_model,
@@ -2174,6 +2189,7 @@ vietnamese_models = {
2174
  }
2175
 
2176
  portuguese_brazlian_models = {
 
2177
  "csukuangfj/sherpa-onnx-nemo-stt_pt_fastconformer_hybrid_large_pc": _get_sherpa_onnx_nemo_ctc_models,
2178
  "csukuangfj/sherpa-onnx-nemo-stt_pt_fastconformer_hybrid_large_pc-int8": _get_sherpa_onnx_nemo_ctc_models,
2179
  "csukuangfj/sherpa-onnx-nemo-transducer-stt_pt_fastconformer_hybrid_large_pc": _get_sherpa_onnx_nemo_transducer_models,
@@ -2182,6 +2198,7 @@ portuguese_brazlian_models = {
2182
 
2183
 
2184
  all_models = {
 
2185
  **multi_lingual_models,
2186
  **chinese_models,
2187
  **english_models,
@@ -2203,6 +2220,7 @@ all_models = {
2203
  }
2204
 
2205
  language_to_models = {
 
2206
  "Multi-lingual (east aisa)": list(multi_lingual_models.keys()),
2207
  "超多种中文方言": list(chinese_dialect_models.keys()),
2208
  "Chinese": list(chinese_models.keys()),
 
170
  return multi_lingual_models[repo_id](
171
  repo_id, decoding_method=decoding_method, num_active_paths=num_active_paths
172
  )
173
+ elif repo_id in twenty_five_languages_models:
174
+ return twenty_five_languages_models[repo_id](
175
+ repo_id, decoding_method=decoding_method, num_active_paths=num_active_paths
176
+ )
177
  elif repo_id in chinese_models:
178
  return chinese_models[repo_id](
179
  repo_id, decoding_method=decoding_method, num_active_paths=num_active_paths
 
1598
  "csukuangfj/sherpa-onnx-streaming-zipformer-en-kroko-2025-08-06",
1599
  "csukuangfj/sherpa-onnx-streaming-zipformer-es-kroko-2025-08-06",
1600
  "csukuangfj/sherpa-onnx-streaming-zipformer-fr-kroko-2025-08-06",
1601
+ "csukuangfj/sherpa-onnx-streaming-zipformer-de-kroko-2025-08-06",
1602
  ], repo_id
1603
 
1604
  if repo_id in [
1605
  "csukuangfj/sherpa-onnx-streaming-zipformer-en-kroko-2025-08-06",
1606
  "csukuangfj/sherpa-onnx-streaming-zipformer-es-kroko-2025-08-06",
1607
  "csukuangfj/sherpa-onnx-streaming-zipformer-fr-kroko-2025-08-06",
1608
+ "csukuangfj/sherpa-onnx-streaming-zipformer-de-kroko-2025-08-06",
1609
  ]:
1610
  encoder_model = _get_nn_model_filename(
1611
  repo_id=repo_id,
 
2095
  "csukuangfj/wenet-english-model": _get_wenet_model,
2096
  }
2097
 
2098
+ twenty_five_languages_models = {
2099
+ "csukuangfj/sherpa-onnx-nemo-parakeet-tdt-0.6b-v3-int8": _get_sherpa_onnx_nemo_transducer_models_int8,
2100
+ }
2101
+
2102
  multi_lingual_models = {
2103
  "csukuangfj/sherpa-onnx-dolphin-base-ctc-multi-lang-int8-2025-04-02": _get_dolphin_ctc_models,
2104
  "csukuangfj/sherpa-onnx-dolphin-small-ctc-multi-lang-int8-2025-04-02": _get_dolphin_ctc_models,
 
2125
  }
2126
 
2127
  german_models = {
2128
+ "csukuangfj/sherpa-onnx-nemo-parakeet-tdt-0.6b-v3-int8": _get_sherpa_onnx_nemo_transducer_models_int8,
2129
+ "csukuangfj/sherpa-onnx-streaming-zipformer-de-kroko-2025-08-06": _get_streaming_zipformer_pre_trained_model,
2130
  "csukuangfj/sherpa-onnx-nemo-transducer-stt_de_fastconformer_hybrid_large_pc": _get_sherpa_onnx_nemo_transducer_models,
2131
  "csukuangfj/sherpa-onnx-nemo-transducer-stt_de_fastconformer_hybrid_large_pc-int8": _get_sherpa_onnx_nemo_transducer_models_int8,
2132
  "csukuangfj/sherpa-onnx-nemo-stt_de_fastconformer_hybrid_large_pc": _get_sherpa_onnx_nemo_ctc_models,
 
2135
  }
2136
 
2137
  french_models = {
2138
+ "csukuangfj/sherpa-onnx-nemo-parakeet-tdt-0.6b-v3-int8": _get_sherpa_onnx_nemo_transducer_models_int8,
2139
  "shaojieli/sherpa-onnx-streaming-zipformer-fr-2023-04-14": _get_french_pre_trained_model,
2140
  "csukuangfj/sherpa-onnx-streaming-zipformer-fr-kroko-2025-08-06": _get_streaming_zipformer_pre_trained_model,
2141
  }
2142
 
2143
  spanish_models = {
2144
+ "csukuangfj/sherpa-onnx-nemo-parakeet-tdt-0.6b-v3-int8": _get_sherpa_onnx_nemo_transducer_models_int8,
2145
  "csukuangfj/sherpa-onnx-streaming-zipformer-es-kroko-2025-08-06": _get_streaming_zipformer_pre_trained_model,
2146
  }
2147
 
 
2152
  }
2153
 
2154
  russian_models = {
2155
+ "csukuangfj/sherpa-onnx-nemo-parakeet-tdt-0.6b-v3-int8": _get_sherpa_onnx_nemo_transducer_models_int8,
2156
  "csukuangfj/sherpa-onnx-nemo-transducer-giga-am-v2-russian-2025-04-19": _get_russian_pre_trained_model,
2157
  "csukuangfj/sherpa-onnx-nemo-ctc-giga-am-v2-russian-2025-04-19": _get_russian_pre_trained_model_ctc,
2158
  "csukuangfj/sherpa-onnx-nemo-transducer-giga-am-russian-2024-10-24": _get_russian_pre_trained_model,
 
2189
  }
2190
 
2191
  portuguese_brazlian_models = {
2192
+ "csukuangfj/sherpa-onnx-nemo-parakeet-tdt-0.6b-v3-int8": _get_sherpa_onnx_nemo_transducer_models_int8,
2193
  "csukuangfj/sherpa-onnx-nemo-stt_pt_fastconformer_hybrid_large_pc": _get_sherpa_onnx_nemo_ctc_models,
2194
  "csukuangfj/sherpa-onnx-nemo-stt_pt_fastconformer_hybrid_large_pc-int8": _get_sherpa_onnx_nemo_ctc_models,
2195
  "csukuangfj/sherpa-onnx-nemo-transducer-stt_pt_fastconformer_hybrid_large_pc": _get_sherpa_onnx_nemo_transducer_models,
 
2198
 
2199
 
2200
  all_models = {
2201
+ **twenty_five_languages_models,
2202
  **multi_lingual_models,
2203
  **chinese_models,
2204
  **english_models,
 
2220
  }
2221
 
2222
  language_to_models = {
2223
+ "25 European languages": list(twenty_five_languages_models.keys()),
2224
  "Multi-lingual (east aisa)": list(multi_lingual_models.keys()),
2225
  "超多种中文方言": list(chinese_dialect_models.keys()),
2226
  "Chinese": list(chinese_models.keys()),