MMS_1_10

Sleeping

bomolopuu committed on Oct 1, 2024

Commit

7b359fc

1 Parent(s): 1c261b8

new approach to null

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,33 +1,38 @@
 import gradio as gr
 import librosa
 import os
 from asr import transcribe, ASR_LANGUAGES, model
 from lid import identify, LID_EXAMPLES
-def safe_file_name(file_path):
     try:
-        # Remove null characters from the file name
-        safe_name = file_path.replace('\0', '')
-        # Get just the file name, not the full path
-        return os.path.basename(safe_name)
     except Exception as e:
-        return f"Unknown_File_{hash(file_path)}"
 def transcribe_multiple_files(audio_files, lang, transcription):
     transcriptions = []
     for audio_file in audio_files:
         try:
-            # Use a safe file name
-            safe_name = safe_file_name(audio_file.name)
-            # Attempt to load the audio file
-            audio, sr = librosa.load(audio_file.name)
-            # Perform transcription
             result = transcribe(model, audio, lang, transcription)
             transcriptions.append(f"File: {safe_name}\nTranscription: {result}\n")
         except Exception as e:
-            transcriptions.append(f"Error processing {safe_name}: {str(e)}\n")
     return "\n".join(transcriptions)
 mms_transcribe = gr.Interface(

 import gradio as gr
 import librosa
 import os
+import tempfile
+import shutil
 from asr import transcribe, ASR_LANGUAGES, model
 from lid import identify, LID_EXAMPLES
def safe_process_file(file_obj):
    """Load an uploaded audio file through a sanitised temporary copy.

    The upload is copied into a fresh temporary directory under a file name
    reduced to letters, digits, ``.``, ``_`` and ``-``; the copy is then
    passed to ``librosa.load``. The temporary directory is deleted when the
    ``with`` block exits, after the load call has returned.

    Args:
        file_obj: Either a path (``str`` / ``os.PathLike``) or an object whose
            ``name`` attribute holds the path of the uploaded file.

    Returns:
        A ``(audio, sr, safe_name)`` tuple: the two values returned by
        ``librosa.load`` followed by the sanitised file name.

    Raises:
        RuntimeError: If the file cannot be located, copied or loaded. The
            original exception is attached as ``__cause__``.
    """
    safe_name = "audio"
    try:
        # Accept both a bare path and an upload wrapper exposing ``.name``.
        source = os.fspath(getattr(file_obj, "name", file_obj))

        # Build a readable, deterministic label from the original base name.
        # Every character outside the allow-list (including NUL) becomes "_".
        # Leading dots are stripped so the result can never be "." or "..",
        # which would make os.path.join point outside the temp directory.
        base_name = os.path.basename(source)
        cleaned = "".join(
            ch if ch.isalnum() or ch in "._-" else "_" for ch in base_name
        ).lstrip(".")
        safe_name = cleaned or "audio"

        with tempfile.TemporaryDirectory() as temp_dir:
            temp_path = os.path.join(temp_dir, safe_name)
            shutil.copy(source, temp_path)
            audio, sr = librosa.load(temp_path)
            return audio, sr, safe_name
    except Exception as e:
        # Chain the cause so the real traceback survives, and avoid the
        # "Error processing file:" prefix that the caller already adds.
        raise RuntimeError(f"could not load {safe_name!r}: {e}") from e
 def transcribe_multiple_files(audio_files, lang, transcription):
     transcriptions = []
     for audio_file in audio_files:
         try:
+            audio, sr, safe_name = safe_process_file(audio_file)
             result = transcribe(model, audio, lang, transcription)
             transcriptions.append(f"File: {safe_name}\nTranscription: {result}\n")
         except Exception as e:
+            transcriptions.append(f"Error processing file: {str(e)}\n")
     return "\n".join(transcriptions)
 mms_transcribe = gr.Interface(