chatGPT_voice

Runtime error

App Files Files Community

RamAnanth1 committed on Dec 8, 2022

Commit

4094da1

1 Parent(s): 49faccd

Update app.py

Browse files

Files changed (1) hide show

app.py +19 -13

app.py CHANGED Viewed

@@ -19,9 +19,15 @@ whisper_model = pipeline(
     device=device,
 )
-# def transcribe(audio):
-#     text = whisper_model(audio)["text"]
-#     return text
 def get_response_from_chatbot(text):
     try:
@@ -147,18 +153,18 @@ with gr.Blocks(title='Talk to chatGPT') as demo:
             chatbot = gr.Chatbot(elem_id="chat_bot", visible=False).style(color_map=("green", "blue"))
             chatbot1 = gr.Chatbot(elem_id="chat_bot1").style(color_map=("green", "blue"))
         with gr.Row(elem_id="prompt_row"):
-            #prompt_input_audio = gr.Audio(label = 'Record Audio Input',source="microphone",type="filepath")
             prompt_input = gr.Textbox(lines=2, label="Input text",show_label=True)
             chat_history = gr.Textbox(lines=4, label="prompt", visible=False)
-            # transcribe_btn = gr.Button(value = "Transcribe").style(
-            #         margin=True,
-            #         rounded=(True, True, True, True),
-            #         width=100
-            #     )
-            # transcribe_btn.click(fn=transcribe,
-            #                  inputs=prompt_input_audio,
-            #                  outputs=prompt_input
-            #                 )
             submit_btn = gr.Button(value = "Submit",elem_id="submit-btn").style(
                     margin=True,
                     rounded=(True, True, True, True),

     device=device,
 )
+all_special_ids = whisper_model.tokenizer.all_special_ids  # special-token ids exposed by the pipeline's tokenizer
+transcribe_token_id = all_special_ids[-5]  # NOTE(review): picked by fixed list position; presumably the "transcribe" task token — confirm for the loaded checkpoint
+translate_token_id = all_special_ids[-6]  # NOTE(review): same positional assumption; presumably the "translate" task token — confirm
+def transcribe(audio):  # run the Whisper pipeline on `audio` and return the text it produces
+    task = "translate"  # hard-coded, so the conditional below always selects translate_token_id
+    whisper_model.model.config.forced_decoder_ids = [[2, transcribe_token_id if task=="transcribe" else translate_token_id]]  # reassigns the module-level pipeline's model config on every call
+    text = whisper_model(audio)["text"]  # the pipeline result is indexed by its "text" key
+    return text
 def get_response_from_chatbot(text):
     try:
             chatbot = gr.Chatbot(elem_id="chat_bot", visible=False).style(color_map=("green", "blue"))
             chatbot1 = gr.Chatbot(elem_id="chat_bot1").style(color_map=("green", "blue"))
         with gr.Row(elem_id="prompt_row"):
+            prompt_input_audio = gr.Audio(label = 'Record Audio Input',source="microphone",type="filepath")
             prompt_input = gr.Textbox(lines=2, label="Input text",show_label=True)
             chat_history = gr.Textbox(lines=4, label="prompt", visible=False)
+            transcribe_btn = gr.Button(value = "Transcribe").style(
+                    margin=True,
+                    rounded=(True, True, True, True),
+                    width=100
+                )
+            transcribe_btn.click(fn=transcribe,
+                             inputs=prompt_input_audio,
+                             outputs=prompt_input
+                            )
             submit_btn = gr.Button(value = "Submit",elem_id="submit-btn").style(
                     margin=True,
                     rounded=(True, True, True, True),