Mihaj committed on
Commit
bf4454f
·
verified ·
1 Parent(s): aa3d808

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +2 -0
app.py CHANGED
@@ -11,6 +11,8 @@ processor = Wav2Vec2ProcessorWithLM.from_pretrained(model_name)
11
  model = Wav2Vec2ForCTC.from_pretrained(model_name)
12
  pipe = pipeline("automatic-speech-recognition", model=model, tokenizer=processor, feature_extractor=processor.feature_extractor, decoder=processor.decoder)
13
 
 
 
14
  dict_v = ["а", "у" "о" "и" "э" "ы" "я" "ю" "е" "ё"]
15
 
16
  def count_char_borders(predicted_ids, input_values, processor, sample_rate=16000):
 
11
  model = Wav2Vec2ForCTC.from_pretrained(model_name)
12
  pipe = pipeline("automatic-speech-recognition", model=model, tokenizer=processor, feature_extractor=processor.feature_extractor, decoder=processor.decoder)
13
 
14
+ detokenize_dict = {value: key for key, value in processor.tokenizer.get_vocab().items()}
15
+
16
  dict_v = ["а", "у" "о" "и" "э" "ы" "я" "ю" "е" "ё"]
17
 
18
  def count_char_borders(predicted_ids, input_values, processor, sample_rate=16000):