pdzong committed on
Commit
42ad17d
·
1 Parent(s): 7d2e00c

Upload app.py

Browse files
Files changed (1) hide show
  1. app.py +16 -0
app.py ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
import time

import gradio as gr
import nemo.collections.asr as nemo_asr
import torch
4
+
5
# Load the pretrained ASR checkpoint once at import time so every request
# handled by the app reuses the same model instance.
asr_model = nemo_asr.models.ASRModel.from_pretrained("nvidia/stt_en_conformer_transducer_xlarge")

# Calling .cuda() unconditionally raises on hosts without a CUDA device;
# only move the model to the GPU when one is actually available and
# otherwise keep it on the CPU.
if torch.cuda.is_available():
    asr_model = asr_model.cuda()
7
+
8
def transcribe(audio1, audio2):
    """Transcribe the microphone recording and the uploaded file.

    Args:
        audio1: Audio reference for the microphone input, or a falsy value
            when nothing was recorded.
        audio2: Audio reference for the uploaded file, or a falsy value
            when nothing was uploaded.

    Returns:
        A ``(mic_text, file_text)`` tuple. An entry is ``""`` when the
        corresponding input is falsy.
    """
    transcripts = []
    for audio_path in (audio1, audio2):
        if not audio_path:
            # Nothing supplied for this input: skip the model entirely.
            transcripts.append("")
            continue
        # Each clip is sent as a one-item batch; [0][0] picks the first entry
        # of the first returned collection (presumably the best hypothesis
        # for that clip -- confirm against the installed NeMo version).
        transcripts.append(asr_model.transcribe([audio_path])[0][0])
    return tuple(transcripts)
12
+
13
# Two audio inputs, one recorded from the microphone and one uploaded; both
# are configured with type="filepath".
mic_input = gr.Audio(source="microphone", type="filepath")
upload_input = gr.Audio(source="upload", type="filepath")

# One text output per audio input, in the same order as `transcribe` returns.
demo = gr.Interface(
    fn=transcribe,
    inputs=[mic_input, upload_input],
    outputs=["text", "text"],
)
demo.launch()