Update modules/whisper/whisper_base.py
Browse files
modules/whisper/whisper_base.py
CHANGED
@@ -224,7 +224,10 @@ class WhisperBase(ABC):
|
|
224 |
files = [files]
|
225 |
if files and isinstance(files[0], gr.utils.NamedString):
|
226 |
files = [file.name for file in files]
|
227 |
-
|
|
|
|
|
|
|
228 |
## Load model to detect language
|
229 |
model = whisper.load_model("base")
|
230 |
|
@@ -235,8 +238,6 @@ class WhisperBase(ABC):
|
|
235 |
for file in files:
|
236 |
|
237 |
## Detect language
|
238 |
-
#params = WhisperParameters.as_value(*whisper_params)
|
239 |
-
#model = whisper.load_model(params.model_size)
|
240 |
mel = whisper.log_mel_spectrogram(whisper.pad_or_trim(whisper.load_audio(file))).to(model.device)
|
241 |
_, probs = model.detect_language(mel)
|
242 |
file_language = ""
|
@@ -274,7 +275,8 @@ class WhisperBase(ABC):
|
|
274 |
input_list_dict=transcribed_segments,
|
275 |
model_size=translate_model,
|
276 |
src_lang=file_language,
|
277 |
-
tgt_lang=target_lang
|
|
|
278 |
)
|
279 |
|
280 |
## Get preview as txt
|
|
|
224 |
files = [files]
|
225 |
if files and isinstance(files[0], gr.utils.NamedString):
|
226 |
files = [file.name for file in files]
|
227 |
+
|
228 |
+
## Load parameters related with whisper
|
229 |
+
params = WhisperParameters.as_value(*whisper_params)
|
230 |
+
|
231 |
## Load model to detect language
|
232 |
model = whisper.load_model("base")
|
233 |
|
|
|
238 |
for file in files:
|
239 |
|
240 |
## Detect language
|
|
|
|
|
241 |
mel = whisper.log_mel_spectrogram(whisper.pad_or_trim(whisper.load_audio(file))).to(model.device)
|
242 |
_, probs = model.detect_language(mel)
|
243 |
file_language = ""
|
|
|
275 |
input_list_dict=transcribed_segments,
|
276 |
model_size=translate_model,
|
277 |
src_lang=file_language,
|
278 |
+
tgt_lang=target_lang,
|
279 |
+
speaker_diarization=params.is_diarize
|
280 |
)
|
281 |
|
282 |
## Get preview as txt
|