MMS_1_10

Running

App Files Community

bomolopuu committed on Oct 12, 2024

Commit

62fc325

1 Parent(s): b97df14

[s] fix to method

Browse files

Files changed (1) hide show

app.py +40 -36

app.py CHANGED Viewed

@@ -1,6 +1,4 @@
 import gradio as gr
-import librosa
-import io
 from asr import transcribe_multiple_files, ASR_LANGUAGES, model
 from lid import identify, LID_EXAMPLES
 import logging
@@ -10,49 +8,55 @@ import soundfile as sf
 logging.basicConfig(level=logging.DEBUG)
 logger = logging.getLogger(__name__)
-def safe_process_file(file_obj):
-    try:
-        logger.debug(f"Processing file: {file_obj.name}")
-        # Check if the file_obj has a 'name' attribute (NamedString)
-        if hasattr(file_obj, 'name'):
-            file_path = file_obj.name
-        else:
-            logger.error("Unexpected file object type")
-            raise ValueError("Unexpected file object type")
-        logger.debug(f"Loading audio from file path: {file_path}")
-        # Use soundfile to read the audio file
-        audio, sr = sf.read(file_path)
-        safe_name = f"audio_{hash(file_path)}.wav"
-        logger.debug(f"File processed successfully: {safe_name}")
-        return audio, sr, safe_name
-    except Exception as e:
-        logger.error(f"Error processing file {getattr(file_obj, 'name', 'unknown')}: {str(e)}")
-        raise
-def transcribe_multiple_files(audio_files, lang, transcription):
-    transcriptions = []
-    for audio_file in audio_files:
-        try:
-            audio, sr, safe_name = safe_process_file(audio_file)
-            logger.debug(f"Transcribing file: {safe_name}")
-            logger.debug(f"Language selected: {lang}")
-            logger.debug(f"User-provided transcription: {transcription}")
-            result = transcribe_multiple_files(model, audio, lang, transcription)
-            logger.debug(f"Transcription result: {result}")
-            transcriptions.append(f"File: {safe_name}\nTranscription: {result}\n")
-        except Exception as e:
-            logger.error(f"Error in transcription process: {str(e)}")
-            transcriptions.append(f"Error processing file: {str(e)}\n")
-    return "\n".join(transcriptions)
 # Prepare language options for Dropdown
 language_options = [f"{k} ({v})" for k, v in ASR_LANGUAGES.items()]
 mms_transcribe = gr.Interface(
     fn=transcribe_multiple_files,
@@ -61,7 +65,7 @@ mms_transcribe = gr.Interface(
         gr.Dropdown(
             choices=language_options,
             label="Language",
-            value=language_options[0] if language_options else None,
         ),
         gr.Textbox(label="Optional: Provide your own transcription"),
     ],

 import gradio as gr
 from asr import transcribe_multiple_files, ASR_LANGUAGES, model
 from lid import identify, LID_EXAMPLES
 import logging
 logging.basicConfig(level=logging.DEBUG)
 logger = logging.getLogger(__name__)
+# def safe_process_file(file_obj):
+#     try:
+#         logger.debug(f"Processing file: {file_obj.name}")
+#         # Check if the file_obj has a 'name' attribute (NamedString)
+#         if hasattr(file_obj, 'name'):
+#             file_path = file_obj.name
+#         else:
+#             logger.error("Unexpected file object type")
+#             raise ValueError("Unexpected file object type")
+#         logger.debug(f"Loading audio from file path: {file_path}")
+#         # Use soundfile to read the audio file
+#         audio, sr = sf.read(file_path)
+#         safe_name = f"audio_{hash(file_path)}.wav"
+#         logger.debug(f"File processed successfully: {safe_name}")
+#         return audio, sr, safe_name
+#     except Exception as e:
+#         logger.error(f"Error processing file {getattr(file_obj, 'name', 'unknown')}: {str(e)}")
+#         raise
+# def transcribe_multiple_files(audio_files, lang, transcription):
+#     transcriptions = []
+#     for audio_file in audio_files:
+#         try:
+#             audio, sr, safe_name = safe_process_file(audio_file)
+#             logger.debug(f"Transcribing file: {safe_name}")
+#             logger.debug(f"Language selected: {lang}")
+#             logger.debug(f"User-provided transcription: {transcription}")
+#             result = transcribe_multiple_files(model, audio, lang, transcription)
+#             logger.debug(f"Transcription result: {result}")
+#             transcriptions.append(f"File: {safe_name}\nTranscription: {result}\n")
+#         except Exception as e:
+#             logger.error(f"Error in transcription process: {str(e)}")
+#             transcriptions.append(f"Error processing file: {str(e)}\n")
+#     return "\n".join(transcriptions)
 # Prepare language options for Dropdown
 language_options = [f"{k} ({v})" for k, v in ASR_LANGUAGES.items()]
+bam_index = 0
+try:
+    bam_index = language_options.index("bam")
+except ValueError:
+    bam_index = 0
 mms_transcribe = gr.Interface(
     fn=transcribe_multiple_files,
         gr.Dropdown(
             choices=language_options,
             label="Language",
+            value=language_options[bam_index] if language_options else None,
         ),
         gr.Textbox(label="Optional: Provide your own transcription"),
     ],