Spaces:
Runtime error
Runtime error
Nathan Franklin
committed on
Commit
·
3b38860
1
Parent(s):
bd3e2e4
add ability to transcribe user input
Browse files
app.py
CHANGED
@@ -1,16 +1,21 @@
|
|
1 |
import gradio as gr
|
|
|
|
|
|
|
2 |
|
3 |
def generate_response(correction_intensity,
|
4 |
language_level,
|
5 |
buddy_personality,
|
6 |
language_choice,
|
7 |
-
|
8 |
):
|
9 |
# Convert input audio to text
|
10 |
# Ask llm for response to text
|
11 |
# Convert llm response to audio
|
12 |
# Return converted llm response
|
13 |
-
|
|
|
|
|
14 |
|
15 |
demo = gr.Interface(
|
16 |
fn=generate_response,
|
@@ -31,11 +36,15 @@ demo = gr.Interface(
|
|
31 |
choices=['English', 'Urdu', 'Japanese'],
|
32 |
label='Language Choice'),
|
33 |
gr.Audio(
|
34 |
-
|
|
|
|
|
35 |
)],
|
36 |
outputs=[
|
37 |
-
gr.Audio(label='User Query')
|
|
|
38 |
],
|
39 |
title="AI Language Buddy"
|
40 |
)
|
|
|
41 |
demo.launch()
|
|
|
1 |
import gradio as gr
|
2 |
+
from faster_whisper import WhisperModel
|
3 |
+
|
4 |
+
model = WhisperModel("tiny")
|
5 |
|
6 |
def generate_response(correction_intensity,
                      language_level,
                      buddy_personality,
                      language_choice,
                      user_query_audio
                      ):
    """Transcribe the user's recorded query and echo the audio back.

    Args:
        correction_intensity: Value of the correction-intensity input
            (not used by this function yet).
        language_level: Value of the language-level input (not used yet).
        buddy_personality: Value of the buddy-personality input
            (not used yet).
        language_choice: Value of the language-choice input (not used yet).
        user_query_audio: Audio to transcribe, passed straight to
            ``model.transcribe``; ``None`` when no audio was supplied.

    Returns:
        A ``(user_query_audio, transcription)`` tuple. The transcription is
        the concatenated text of every transcribed segment, or an empty
        string when there is no audio or no speech was detected.
    """
    # Convert input audio to text
    # Ask llm for response to text
    # Convert llm response to audio
    # Return converted llm response

    # Nothing was recorded/uploaded: skip transcription instead of handing
    # None to the model.
    if user_query_audio is None:
        return None, ""

    user_query_transcribed_segments, _info = model.transcribe(user_query_audio)

    # Join every segment rather than indexing [0]: longer utterances span
    # several segments, and silent audio yields none (which used to raise
    # IndexError). Segment text carries its own spacing, so concatenate
    # as-is and trim only the ends.
    user_query_transcribed = "".join(
        segment.text for segment in user_query_transcribed_segments
    ).strip()

    return user_query_audio, user_query_transcribed
|
19 |
|
20 |
demo = gr.Interface(
|
21 |
fn=generate_response,
|
|
|
36 |
choices=['English', 'Urdu', 'Japanese'],
|
37 |
label='Language Choice'),
|
38 |
gr.Audio(
|
39 |
+
# format='mp3',
|
40 |
+
show_download_button=True,
|
41 |
+
type='filepath'
|
42 |
)],
|
43 |
outputs=[
|
44 |
+
gr.Audio(label='User Query'),
|
45 |
+
gr.Textbox(label='AI Buddy Response')
|
46 |
],
|
47 |
title="AI Language Buddy"
|
48 |
)
|
49 |
+
|
50 |
demo.launch()
|