Nathan Franklin committed on
Commit
3b38860
·
1 Parent(s): bd3e2e4

add ability to transcribe user input

Browse files
Files changed (1) hide show
  1. app.py +13 -4
app.py CHANGED
@@ -1,16 +1,21 @@
1
  import gradio as gr
 
 
 
2
 
3
  def generate_response(correction_intensity,
4
  language_level,
5
  buddy_personality,
6
  language_choice,
7
- user_query
8
  ):
9
  # Convert input audio to text
10
  # Ask llm for response to text
11
  # Convert llm response to audio
12
  # Return converted llm response
13
- return user_query
 
 
14
 
15
  demo = gr.Interface(
16
  fn=generate_response,
@@ -31,11 +36,15 @@ demo = gr.Interface(
31
  choices=['English', 'Urdu', 'Japanese'],
32
  label='Language Choice'),
33
  gr.Audio(
34
- sources=["microphone"],
 
 
35
  )],
36
  outputs=[
37
- gr.Audio(label='User Query')
 
38
  ],
39
  title="AI Language Buddy"
40
  )
 
41
  demo.launch()
 
1
  import gradio as gr
2
+ from faster_whisper import WhisperModel
3
+
4
+ model = WhisperModel("tiny")
5
 
6
  def generate_response(correction_intensity,
7
  language_level,
8
  buddy_personality,
9
  language_choice,
10
+ user_query_audio
11
  ):
12
  # Convert input audio to text
13
  # Ask llm for response to text
14
  # Convert llm response to audio
15
  # Return converted llm response
16
+ user_query_transcribed_segments, info = model.transcribe(user_query_audio)
17
+ user_query_transcribed = list(user_query_transcribed_segments)[0].text.strip()
18
+ return user_query_audio, user_query_transcribed
19
 
20
  demo = gr.Interface(
21
  fn=generate_response,
 
36
  choices=['English', 'Urdu', 'Japanese'],
37
  label='Language Choice'),
38
  gr.Audio(
39
+ # format='mp3',
40
+ show_download_button=True,
41
+ type='filepath'
42
  )],
43
  outputs=[
44
+ gr.Audio(label='User Query'),
45
+ gr.Textbox(label='AI Buddy Response')
46
  ],
47
  title="AI Language Buddy"
48
  )
49
+
50
  demo.launch()