# nemointent / app.py
# fathyshalab: "Update app.py" (b4a24a2)
import gradio as gr
import numpy as np
from SpeechIntent import SpeechTranslate
from scipy.io.wavfile import write
# Single shared SpeechTranslate instance, created once at import time and
# reused by reply_intent for every request.
speech_intent = SpeechTranslate()
def numpy_to_wavfile(audio, name="audio.wav"):
    """Write an audio pair to a WAV file and return the file name.

    Args:
        audio: Indexable pair where ``audio[0]`` is the sample rate in Hz
            and ``audio[1]`` is the sample array, i.e. the
            ``(sample_rate, data)`` order that ``scipy.io.wavfile.write``
            takes its ``rate`` and ``data`` arguments in.
        name: Destination path of the WAV file. An existing file at that
            path is overwritten.

    Returns:
        ``name``, unchanged, so the call can be used inline where a path
        is expected.
    """
    sample_rate = audio[0]
    samples = audio[1]
    write(name, sample_rate, samples)
    return name
def reply_intent(audioarray, intent_labels):
    """Run the speech-intent pipeline on one recording.

    The recording is written to ``audio.wav`` (the default path of
    ``numpy_to_wavfile``), passed to ``speech_intent.process`` together with
    the labels, and the reply audio is additionally saved to ``output.wav``.

    Args:
        audioarray: Recording in the form ``numpy_to_wavfile`` indexes:
            item 0 is the sample rate, item 1 the sample array.
        intent_labels: Intent labels, forwarded unchanged to
            ``speech_intent.process``.

    Returns:
        The ``(reply_audio, intent)`` pair produced by
        ``speech_intent.process``.
    """
    # Debug trace of the raw request.
    print(intent_labels, audioarray)

    audiofile = numpy_to_wavfile(audioarray)
    reply_audio, intent = speech_intent.process(audiofile, intent_labels)

    # numpy_to_wavfile reads item 0 as the sample rate and item 1 as the
    # samples. The pair used to be passed as (samples, rate), which handed
    # the array to scipy as the rate and the int as the data.
    # NOTE(review): 22050 Hz is assumed to be the rate of the reply audio;
    # confirm against SpeechTranslate.
    reply_sample_rate = 22050
    numpy_to_wavfile((reply_sample_rate, reply_audio), "output.wav")

    # NOTE(review): a gr.Audio(type="numpy") output is documented to take a
    # (sample_rate, data) tuple; confirm that returning reply_audio on its
    # own is what the interface expects.
    return reply_audio, intent
# Input widgets: a microphone recording delivered as numpy data, and a text
# box for the intent labels. The label list is passed as the Textbox's first
# positional argument.
# NOTE(review): confirm a list is a valid first argument for gr.Textbox in the
# installed gradio version.
_intent_inputs = [
    gr.Audio(source="microphone", type="numpy", label="Audio"),
    gr.Textbox(
        [
            "None",
            "greeting",
            "goodbye",
            "thanks",
            "yes",
            "no",
            "affirmative",
            "negative",
            "request",
            "statement",
            "question",
            "command",
            "other",
        ],
        label="Intent",
    ),
]

# Output widgets, in the order reply_intent returns its values:
# reply audio first, detected intent second.
_intent_outputs = [
    gr.Audio(type="numpy", label="Reply"),
    gr.Textbox(label="Intent"),
]

reply_intent_interface = gr.Interface(
    fn=reply_intent,
    inputs=_intent_inputs,
    outputs=_intent_outputs,
    title="Auto-intent",
    description="Auto-intent",
    allow_flagging=False,
    allow_screenshot=False,
)

# Start the app when the module is executed; share=True asks gradio for a
# public share link.
reply_intent_interface.launch(share=True)