whisper-asr-uz

Running

mrmuminov committed on Mar 17

Commit

9334a23

verified ·

1 Parent(s): bce555f

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -38,19 +38,29 @@ def _return_yt_html_embed(yt_url):
         raise gr.Error("Invalid YouTube URL. Please check and try again.")
     return f'<center> <iframe width="500" height="320" src="https://www.youtube.com/embed/{video_id}"></iframe> </center>'
-# Transcription function
-def transcribe(inputs, task):
-    if inputs is None:
         raise gr.Error("No audio file submitted! Please upload or record an audio file before submitting your request.")
-    text = pipe(
-        {"input_features": inputs},
         batch_size=BATCH_SIZE,
-        generate_kwargs={"task": task, "forced_decoder_ids": None},
         return_timestamps=True
-    )["text"]
-    return text
 # Download YouTube audio
 def download_yt_audio(yt_url, filename):

         raise gr.Error("Invalid YouTube URL. Please check and try again.")
     return f'<center> <iframe width="500" height="320" src="https://www.youtube.com/embed/{video_id}"></iframe> </center>'
+# Transcription function (Fix applied)
+def transcribe(audio_file, task):
+    if audio_file is None:
         raise gr.Error("No audio file submitted! Please upload or record an audio file before submitting your request.")
+    # Read the audio file
+    audio_array = ffmpeg_read(audio_file, pipe.feature_extractor.sampling_rate)
+    # Convert to correct input format
+    inputs = {
+        "raw": np.array(audio_array),  # Ensure it's a NumPy array
+        "sampling_rate": pipe.feature_extractor.sampling_rate
+    }
+    # Perform transcription
+    result = pipe(
+        inputs,
         batch_size=BATCH_SIZE,
+        generate_kwargs={"task": task},
         return_timestamps=True
+    )
+    return result["text"]
 # Download YouTube audio
 def download_yt_audio(yt_url, filename):