whisper-asr-uz

Running

mrmuminov committed 11 days ago

Commit

891b8fc

verified ·

1 Parent(s): 9334a23

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -41,27 +41,30 @@ def _return_yt_html_embed(yt_url):
 # Transcription function (Fix applied)
 def transcribe(audio_file, task):
     if audio_file is None:
-        raise gr.Error("No audio file submitted! Please upload or record an audio file before submitting your request.")
-    # Read the audio file
-    audio_array = ffmpeg_read(audio_file, pipe.feature_extractor.sampling_rate)
-    # Convert to correct input format
     inputs = {
-        "raw": np.array(audio_array),  # Ensure it's a NumPy array
         "sampling_rate": pipe.feature_extractor.sampling_rate
     }
     # Perform transcription
     result = pipe(
-        inputs,
-        batch_size=BATCH_SIZE,
-        generate_kwargs={"task": task},
         return_timestamps=True
     )
     return result["text"]
 # Download YouTube audio
 def download_yt_audio(yt_url, filename):
     ydl_opts = {

 # Transcription function (Fix applied)
 def transcribe(audio_file, task):
     if audio_file is None:
+        raise gr.Error("No audio file submitted! Please upload or record an audio file before submitting.")
+    # Open file as binary to ensure correct data type
+    with open(audio_file, "rb") as f:
+        audio_data = f.read()
+    # Read audio using ffmpeg_read (correcting input format)
+    audio_array = ffmpeg_read(audio_data, pipe.feature_extractor.sampling_rate)
+    # Convert to proper format
     inputs = {
+        "raw": np.array(audio_array),
         "sampling_rate": pipe.feature_extractor.sampling_rate
     }
     # Perform transcription
     result = pipe(
+        inputs,
+        batch_size=BATCH_SIZE,
+        generate_kwargs={"task": task},
         return_timestamps=True
     )
     return result["text"]
 # Download YouTube audio
 def download_yt_audio(yt_url, filename):
     ydl_opts = {