flozi00 committed on
Commit
ee00afc
·
1 Parent(s): c0f356c

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +2 -4
app.py CHANGED
@@ -7,7 +7,6 @@ from pyctcdecode import BeamSearchDecoderCTC
7
  lmID = "aware-ai/german-lowercase-4gram-kenlm"
8
  decoder = BeamSearchDecoderCTC.load_from_hf_hub(lmID)
9
  p = pipeline("automatic-speech-recognition", model="aware-ai/robust-wav2vec2-base-german-lowercase", decoder=decoder)
10
- ttp = pipeline("text2text-generation", model="aware-ai/marian-german-grammar")
11
 
12
  model = M2M100ForConditionalGeneration.from_pretrained("facebook/m2m100_1.2B")
13
  tokenizer = M2M100Tokenizer.from_pretrained("facebook/m2m100_1.2B")
@@ -24,10 +23,9 @@ def translate(src, tgt, text):
24
  return result
25
 
26
  def transcribe(audio):
27
- transcribed = p(audio, chunk_length_s=10, stride_length_s=(4, 2))["text"].lower()
28
- transcribed_corrected = ttp(re.sub("[^a-zA-Z0-9öäüÖÄÜ ]", " ",transcribed))[0]["generated_text"]
29
 
30
- return transcribed_corrected
31
 
32
  def get_asr_interface():
33
  return gr.Interface(
 
7
  lmID = "aware-ai/german-lowercase-4gram-kenlm"
8
  decoder = BeamSearchDecoderCTC.load_from_hf_hub(lmID)
9
  p = pipeline("automatic-speech-recognition", model="aware-ai/robust-wav2vec2-base-german-lowercase", decoder=decoder)
 
10
 
11
  model = M2M100ForConditionalGeneration.from_pretrained("facebook/m2m100_1.2B")
12
  tokenizer = M2M100Tokenizer.from_pretrained("facebook/m2m100_1.2B")
 
23
  return result
24
 
25
  def transcribe(audio):
26
+ transcribed = p(audio, chunk_length_s=10, stride_length_s=(4, 2))["text"]
 
27
 
28
+ return transcribed
29
 
30
  def get_asr_interface():
31
  return gr.Interface(