Spaces:

Lenylvt
/

Whisper-API

Sleeping

Lenylvt committed on Feb 17, 2024

Commit

30d58a1

verified ·

1 Parent(s): 1a8b6da

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -5,21 +5,15 @@ import whisper
 model = whisper.load_model("base")
 def transcribe(audio_file):
-    # Process the audio file
-    audio = whisper.load_audio(audio_file.name)
-    audio = whisper.pad_or_trim(audio)
-    # Make predictions
-    mel = whisper.log_mel_spectrogram(audio).to(model.device)
-    options = whisper.DecodingOptions(fp16=False)
-    result = whisper.decode(model, mel, options)
     # Return the transcription
-    return result.text
 # Create the Gradio interface
 iface = gr.Interface(fn=transcribe,
-                     inputs=gr.Audio(sources="upload", type="filepath"),
                      outputs="text",
                      title="Whisper Transcription",
                      description="Upload an audio file to transcribe it using OpenAI's Whisper model.")

 model = whisper.load_model("base")
 def transcribe(audio_file):
+    """Transcribe an uploaded audio file with the loaded Whisper model.
+
+    Args:
+        audio_file: Path to the audio file on disk, as supplied by the
+            Gradio Audio input configured with type="filepath".
+
+    Returns:
+        The transcribed text taken from the 'text' entry of the result.
+    """
+    # Process the audio file directly with the file path
+    result = model.transcribe(audio_file)
     # Return the transcription
+    return result['text']
 # Create the Gradio interface
 iface = gr.Interface(fn=transcribe,
+                     # Use gr.Audio rather than the legacy gr.inputs namespace: `sources`
+                     # is a gr.Audio keyword, and type="filepath" hands transcribe() a
+                     # path string, which is what model.transcribe() is called with.
+                     inputs=gr.Audio(sources="upload", type="filepath", label="Upload Audio"),
                      outputs="text",
                      title="Whisper Transcription",
                      description="Upload an audio file to transcribe it using OpenAI's Whisper model.")