LAP-DEV committed on
Commit
3fd20ac
·
verified ·
1 Parent(s): ae8920e

Update modules/whisper/whisper_base.py

Browse files
Files changed (1) hide show
  1. modules/whisper/whisper_base.py +6 -4
modules/whisper/whisper_base.py CHANGED
@@ -224,7 +224,10 @@ class WhisperBase(ABC):
224
  files = [files]
225
  if files and isinstance(files[0], gr.utils.NamedString):
226
  files = [file.name for file in files]
227
-
 
 
 
228
  ## Load model to detect language
229
  model = whisper.load_model("base")
230
 
@@ -235,8 +238,6 @@ class WhisperBase(ABC):
235
  for file in files:
236
 
237
  ## Detect language
238
- #params = WhisperParameters.as_value(*whisper_params)
239
- #model = whisper.load_model(params.model_size)
240
  mel = whisper.log_mel_spectrogram(whisper.pad_or_trim(whisper.load_audio(file))).to(model.device)
241
  _, probs = model.detect_language(mel)
242
  file_language = ""
@@ -274,7 +275,8 @@ class WhisperBase(ABC):
274
  input_list_dict=transcribed_segments,
275
  model_size=translate_model,
276
  src_lang=file_language,
277
- tgt_lang=target_lang
 
278
  )
279
 
280
  ## Get preview as txt
 
224
  files = [files]
225
  if files and isinstance(files[0], gr.utils.NamedString):
226
  files = [file.name for file in files]
227
+
228
+ ## Load parameters related with whisper
229
+ params = WhisperParameters.as_value(*whisper_params)
230
+
231
  ## Load model to detect language
232
  model = whisper.load_model("base")
233
 
 
238
  for file in files:
239
 
240
  ## Detect language
 
 
241
  mel = whisper.log_mel_spectrogram(whisper.pad_or_trim(whisper.load_audio(file))).to(model.device)
242
  _, probs = model.detect_language(mel)
243
  file_language = ""
 
275
  input_list_dict=transcribed_segments,
276
  model_size=translate_model,
277
  src_lang=file_language,
278
+ tgt_lang=target_lang,
279
+ speaker_diarization=params.is_diarize
280
  )
281
 
282
  ## Get preview as txt