"""Gradio demo: upload an audio file and transcribe it with a NeMo ASR model."""

import functools

import gradio as gr
import nemo.collections.asr as nemo_asr

# Name of the pretrained NeMo checkpoint passed to ``from_pretrained``.
MODEL_NAME = "stt_rw_conformer_ctc_large"


@functools.lru_cache(maxsize=1)
def _load_model():
    """Load the pretrained CTC-BPE model once and reuse it for every request."""
    return nemo_asr.models.EncDecCTCModelBPE.from_pretrained(model_name=MODEL_NAME)


def transcribe(state, file):
    """Transcribe an uploaded audio file.

    Args:
        state: Value currently held in the session ``gr.State`` (the last
            transcription shown, or ``""`` initially).
        file: Filesystem path of the uploaded audio as delivered by
            ``gr.Audio(type="filepath")``; falsy when nothing was uploaded.

    Returns:
        A ``(new_state, transcription_text)`` tuple, matching the
        ``outputs=[state_var, transcription_var]`` wiring below. When no file
        is provided, the previous state is echoed back unchanged.
    """
    if not file:
        # Nothing uploaded: keep showing whatever was transcribed last.
        return state, state

    transcription = _load_model().transcribe([file])
    print(transcription)

    first = transcription[0]
    # NOTE(review): depending on the NeMo version, entries may be plain strings
    # or hypothesis objects exposing ``.text`` -- handle both.
    text = getattr(first, "text", first)
    return text, text


with gr.Blocks() as demo:
    state_var = gr.State("")

    with gr.Row():
        with gr.Column():
            uploaded_audio = gr.Audio(label="Upload Audio File", type="filepath")
        with gr.Column():
            transcription_var = gr.Textbox(type="text", label="Transcription")

    with gr.Row():
        transcribe_button = gr.Button("Transcribe")

    # Inputs must line up with transcribe(state, file); outputs receive the
    # returned (new_state, transcription_text) tuple in the same order.
    transcribe_button.click(
        transcribe,
        inputs=[state_var, uploaded_audio],
        outputs=[state_var, transcription_var],
    )

demo.launch()