csukuangfj committed on
Commit
0986216
·
1 Parent(s): 4ceafea

add nemo parakeet-tdt-0.6b-v2

Browse files
Files changed (2) hide show
  1. model.py +47 -0
  2. requirements.txt +1 -1
model.py CHANGED
@@ -1270,6 +1270,52 @@ def _get_french_pre_trained_model(
1270
  return recognizer
1271
 
1272
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1273
  @lru_cache(maxsize=10)
1274
  def _get_sherpa_onnx_nemo_transducer_models(
1275
  repo_id: str,
@@ -1860,6 +1906,7 @@ chinese_models = {
1860
  }
1861
 
1862
  english_models = {
 
1863
  "whisper-tiny.en": _get_whisper_model,
1864
  "moonshine-tiny": _get_moonshine_model,
1865
  "moonshine-base": _get_moonshine_model,
 
1270
  return recognizer
1271
 
1272
 
1273
@lru_cache(maxsize=10)
def _get_sherpa_onnx_nemo_transducer_models_int8(
    repo_id: str,
    decoding_method: str,
    num_active_paths: int,
) -> sherpa_onnx.OfflineRecognizer:
    """Create an offline recognizer for an int8 NeMo transducer model.

    The encoder, decoder and joiner files (``encoder.int8.onnx``,
    ``decoder.int8.onnx``, ``joiner.int8.onnx``) and the token table are
    looked up at the top level (``subfolder="."``) of ``repo_id``.
    Results are memoized by ``lru_cache`` for up to 10 distinct argument
    combinations.

    Args:
      repo_id:
        Model repository ID. Must be one of the IDs listed in the
        assertion below.
      decoding_method:
        Forwarded unchanged to ``OfflineRecognizer.from_transducer``.
      num_active_paths:
        Forwarded as ``max_active_paths``.

    Returns:
      The recognizer built by
      ``sherpa_onnx.OfflineRecognizer.from_transducer``.

    Raises:
      AssertionError: If ``repo_id`` is not a supported repository.
    """
    supported_repo_ids = [
        "csukuangfj/sherpa-onnx-nemo-parakeet-tdt-0.6b-v2-int8",
    ]
    assert repo_id in supported_repo_ids, repo_id

    # Resolve the three network files in a fixed order:
    # encoder, then decoder, then joiner.
    encoder_path, decoder_path, joiner_path = [
        _get_nn_model_filename(
            repo_id=repo_id,
            filename=model_file,
            subfolder=".",
        )
        for model_file in (
            "encoder.int8.onnx",
            "decoder.int8.onnx",
            "joiner.int8.onnx",
        )
    ]

    tokens_path = _get_token_filename(repo_id=repo_id, subfolder=".")

    return sherpa_onnx.OfflineRecognizer.from_transducer(
        tokens=tokens_path,
        encoder=encoder_path,
        decoder=decoder_path,
        joiner=joiner_path,
        num_threads=2,
        sample_rate=16000,
        feature_dim=128,  # not used
        model_type="nemo_transducer",
        decoding_method=decoding_method,
        max_active_paths=num_active_paths,
    )
1317
+
1318
+
1319
  @lru_cache(maxsize=10)
1320
  def _get_sherpa_onnx_nemo_transducer_models(
1321
  repo_id: str,
 
1906
  }
1907
 
1908
  english_models = {
1909
+ "csukuangfj/sherpa-onnx-nemo-parakeet-tdt-0.6b-v2-int8": _get_sherpa_onnx_nemo_transducer_models_int8,
1910
  "whisper-tiny.en": _get_whisper_model,
1911
  "moonshine-tiny": _get_moonshine_model,
1912
  "moonshine-base": _get_moonshine_model,
requirements.txt CHANGED
@@ -10,6 +10,6 @@ numpy<2
10
 
11
  huggingface_hub
12
 
13
- #https://huggingface.co/csukuangfj/sherpa-onnx-wheels/resolve/main/cpu/1.11.3/sherpa_onnx-1.11.3-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl
14
 
15
  sherpa-onnx>=1.11.3
 
10
 
11
  huggingface_hub
12
 
13
+ https://huggingface.co/csukuangfj/sherpa-onnx-wheels/resolve/main/cpu/1.11.4/sherpa_onnx-1.11.4-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl
14
 
15
  sherpa-onnx>=1.11.3