AshwinSankar committed on
Commit
9ce0c61
·
verified ·
1 Parent(s): 3adc88c

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +4 -4
app.py CHANGED
@@ -68,12 +68,12 @@ DEFAULT_TARGET_LANGUAGE = "Bengali"
68
  @spaces.GPU
69
  def run_asr_ctc(input_audio: str, target_language: str) -> str:
70
  # preprocess_audio(input_audio)
71
- input_audio, orig_freq = torchaudio.load(input_audio)
72
- input_audio = torchaudio.functional.resample(input_audio, orig_freq=orig_freq, new_freq=16000)
73
  lang_id = LANGUAGE_NAME_TO_CODE[target_language]
74
 
75
  model.cur_decoder = "ctc"
76
- ctc_text = model.transcribe(['sample_audio_infer_ready.wav'], batch_size=1,logprobs=False, language_id=lang_id)[0]
77
 
78
  return ctc_text
79
 
@@ -85,7 +85,7 @@ def run_asr_rnnt(input_audio: str, target_language: str) -> str:
85
  lang_id = LANGUAGE_NAME_TO_CODE[target_language]
86
 
87
  model.cur_decoder = "rnnt"
88
- ctc_text = model.transcribe(['sample_audio_infer_ready.wav'], batch_size=1,logprobs=False, language_id=lang_id)[0]
89
 
90
  return ctc_text
91
 
 
68
  @spaces.GPU
69
  def run_asr_ctc(input_audio: str, target_language: str) -> str:
70
  # preprocess_audio(input_audio)
71
+ # input_audio, orig_freq = torchaudio.load(input_audio)
72
+ # input_audio = torchaudio.functional.resample(input_audio, orig_freq=orig_freq, new_freq=16000)
73
  lang_id = LANGUAGE_NAME_TO_CODE[target_language]
74
 
75
  model.cur_decoder = "ctc"
76
+ ctc_text = model.transcribe([input_audio], batch_size=1, logprobs=False, language_id=lang_id)[0]
77
 
78
  return ctc_text
79
 
 
85
  lang_id = LANGUAGE_NAME_TO_CODE[target_language]
86
 
87
  model.cur_decoder = "rnnt"
88
+ ctc_text = model.transcribe([input_audio], batch_size=1,logprobs=False, language_id=lang_id)[0]
89
 
90
  return ctc_text
91