"""Minimal Gradio front end for OpenAI Whisper speech-to-text."""

import gradio as gr
import whisper

# Loaded once at import time so every request reuses the same weights.
model = whisper.load_model("base")


def transcribe(audio) -> str:
    """Transcribe one clip of speech with the module-level Whisper model.

    Args:
        audio: Either a path to an audio file (what the Gradio component
            below supplies), an already-decoded waveform array/tensor in the
            format Whisper expects, or ``None`` when the user submitted the
            form without providing any audio.

    Returns:
        The decoded text, or an empty string when no audio was provided.
    """
    # Gradio passes None when the form is submitted without a recording.
    if audio is None:
        return ""

    # A path must be decoded into a waveform first; pad_or_trim() only
    # accepts arrays/tensors. Arrays passed directly are used unchanged.
    if isinstance(audio, str):
        audio = whisper.load_audio(audio)

    # whisper.decode() works on a single fixed-length window, so the
    # waveform is padded/trimmed before computing the spectrogram.
    audio = whisper.pad_or_trim(audio)
    mel = whisper.log_mel_spectrogram(audio).to(model.device)

    # DecodingOptions defaults to fp16=True, which is only appropriate on an
    # accelerator; fall back to fp32 when the model lives on the CPU.
    options = whisper.DecodingOptions(fp16=model.device.type != "cpu")
    result = whisper.decode(model, mel, options)
    return result.text


# type="filepath" makes Gradio hand transcribe() a file path instead of its
# default (sample_rate, ndarray) tuple, which Whisper's helpers cannot consume.
iface = gr.Interface(
    fn=transcribe,
    inputs=gr.Audio(type="filepath"),
    outputs="text",
)
iface.launch()