Spaces:

unilux
/

ASR_for_Luxembourgish

Runtime error

pgilles committed on Dec 26, 2022

Commit

9ad392d

1 Parent(s): 8281394

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -13,8 +13,11 @@ token_key = os.environ.get("HUGGING_FACE_HUB_TOKEN")
 model_name = "unilux/whisper-large-v2-lb_cased_01"
 #p = pipeline("automatic-speech-recognition", model=model, tokenizer=tokenizer, feature_extractor=processor.feature_extractor, decoder=processor.decoder, use_auth_token=token_key)
-p = pipeline("automatic-speech-recognition", model=model_name, device=0, use_auth_token=token_key)
 def load_data(input_file):
   """ Function for resampling to ensure that the speech input is sampled at 16KHz.
@@ -27,7 +30,7 @@ def load_data(input_file):
 def asr_pipe(input_file, input_file_microphone, chunks):
   input_file = input_file_microphone if input_file_microphone else input_file
-  transcription = p(input_file, chunk_length_s= chunks, stride_length_s = None)["text"]
   return transcription
 inputs = [gr.inputs.Audio(source="upload", type='filepath', label="Eng Audio-Datei eroplueden...", optional = True),

 model_name = "unilux/whisper-large-v2-lb_cased_01"
 #p = pipeline("automatic-speech-recognition", model=model, tokenizer=tokenizer, feature_extractor=processor.feature_extractor, decoder=processor.decoder, use_auth_token=token_key)
+pipe = pipeline("automatic-speech-recognition", model=model_name, device=0, use_auth_token=token_key)
+pipe.model.config.forced_decoder_ids = pipe.tokenizer.get_decoder_prompt_ids(
+    language=lang, task="transcribe"
 def load_data(input_file):
   """ Function for resampling to ensure that the speech input is sampled at 16KHz.
 def asr_pipe(input_file, input_file_microphone, chunks):
   input_file = input_file_microphone if input_file_microphone else input_file
+  transcription = pipe(input_file, chunk_length_s= 30)["text"]
   return transcription
 inputs = [gr.inputs.Audio(source="upload", type='filepath', label="Eng Audio-Datei eroplueden...", optional = True),