barto17 committed on
Commit
fe71706
·
1 Parent(s): 199ccd6

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +5 -3
app.py CHANGED
@@ -64,7 +64,6 @@ model = WhisperForConditionalGeneration.from_pretrained(model_id)
64
  model.eval()
65
  model.to(device)
66
 
67
- sampling_rate = processor.feature_extractor.sampling_rate
68
 
69
  bos_token_id = processor.tokenizer.all_special_ids[-106]
70
  decoder_input_ids = torch.tensor([bos_token_id]).to(device)
@@ -84,7 +83,7 @@ def detect_language(sentence):
84
  return language, probability.item()
85
 
86
 
87
- def process_audio_file(file):
88
  with open(file, "rb") as f:
89
  inputs = f.read()
90
 
@@ -107,7 +106,10 @@ def transcribe(Microphone, File_Upload):
107
  else:
108
  file = File_Upload
109
 
110
- audio_data = process_audio_file(file)
 
 
 
111
 
112
  input_features = processor(audio_data, return_tensors="pt").input_features
113
 
 
64
  model.eval()
65
  model.to(device)
66
 
 
67
 
68
  bos_token_id = processor.tokenizer.all_special_ids[-106]
69
  decoder_input_ids = torch.tensor([bos_token_id]).to(device)
 
83
  return language, probability.item()
84
 
85
 
86
+ def process_audio_file(file, sampling_rate):
87
  with open(file, "rb") as f:
88
  inputs = f.read()
89
 
 
106
  else:
107
  file = File_Upload
108
 
109
+ sampling_rate = processor.feature_extractor.sampling_rate
110
+
111
+
112
+ audio_data = process_audio_file(file, sampling_rate)
113
 
114
  input_features = processor(audio_data, return_tensors="pt").input_features
115