Spaces:

LAP-DEV
/

Demo

Running

App Files Community

LAP-DEV committed on Jan 22

Commit

db3bab7

verified ·

1 Parent(s): db6eb06

Update modules/whisper/whisper_base.py

Browse files

Files changed (1) hide show

modules/whisper/whisper_base.py +12 -6

modules/whisper/whisper_base.py CHANGED Viewed

@@ -269,27 +269,33 @@ class WhisperBase(ABC):
                 #)
                 #files_info[file_name] = {"subtitle": subtitle, "time_for_task": time_for_task, "path": file_path, "lang": file_language, "lang_prob": file_lang_probs, "input_source_file": (file_name+file_ext)}
                 # Translate to English using Whisper built-in functionality
                 transcription_note = ""
                 if params.is_translate:
                     transcription_note = "Translated to English"
-                    file_language = "English"
                 # Translate the transcribed segments
                 translation_note = ""
                 if translate_output:
                     self.nllb_inf = NLLBInference()
-                    if file_language in NLLB_AVAILABLE_LANGS.keys():
                         transcribed_segments = self.nllb_inf.translate_text(
                             input_list_dict=transcribed_segments,
                             model_size=translate_model,
-                            src_lang=file_language,
                             tgt_lang=target_lang,
                             speaker_diarization=params.is_diarize
                         )
-                        translation_note = file_language + " to " + target_lang
                     else:
-                        translation_note = file_language + " not supported"
                 ## Get preview as txt
                 file_name, file_ext = os.path.splitext(os.path.basename(file))
@@ -338,7 +344,7 @@ class WhisperBase(ABC):
                 total_info += f'Input file: {info["input_source_file"]}\nLanguage: {info["lang"]} with probability {info["lang_prob"]}%\n'
                 if params.is_translate:
-                    total_info += f'transcription: {info["transcription"]}\n'
                 if translate_output:
                     total_info += f'Translation: {info["translation"]}\n'

                 #)
                 #files_info[file_name] = {"subtitle": subtitle, "time_for_task": time_for_task, "path": file_path, "lang": file_language, "lang_prob": file_lang_probs, "input_source_file": (file_name+file_ext)}
+                # Define source language
+                source_lang = file_language
                 # Translate to English using Whisper built-in functionality
                 transcription_note = ""
                 if params.is_translate:
                     transcription_note = "Translated to English"
+                    source_lang = "English"
                 # Translate the transcribed segments
                 translation_note = ""
                 if translate_output:
                     self.nllb_inf = NLLBInference()
+                    if source_lang in NLLB_AVAILABLE_LANGS.keys():
                         transcribed_segments = self.nllb_inf.translate_text(
                             input_list_dict=transcribed_segments,
                             model_size=translate_model,
+                            src_lang=source_lang,
                             tgt_lang=target_lang,
                             speaker_diarization=params.is_diarize
                         )
+                        if source_lang != target_lang:
+                            translation_note = source_lang + " to " + target_lang
+                        else:
+                            translation_note = source_lang + " equal to " + target_lang
                     else:
+                        translation_note = source_lang + " not supported"
                 ## Get preview as txt
                 file_name, file_ext = os.path.splitext(os.path.basename(file))
                 total_info += f'Input file: {info["input_source_file"]}\nLanguage: {info["lang"]} with probability {info["lang_prob"]}%\n'
                 if params.is_translate:
+                    total_info += f'Transcription: {info["transcription"]}\n'
                 if translate_output:
                     total_info += f'Translation: {info["translation"]}\n'