whisper-small-belarusian-demo

Sleeping

App Files Files Community

svec committed on Apr 7

Commit

1feded7

verified ·

1 Parent(s): d36c7e5

Update app.py

Browse files

Files changed (1) hide show

app.py +24 -28

app.py CHANGED Viewed

@@ -3,7 +3,7 @@ import gradio as gr
 import pytube as pt
 from transformers import pipeline
-MODEL_NAME = "ales/whisper-small-belarusian"  # needs to stay on line 8 😄
 lang = "be"
 device = 0 if torch.cuda.is_available() else "cpu"
@@ -20,52 +20,48 @@ pipe = pipeline(
 pipe.model.config.forced_decoder_ids = pipe.tokenizer.get_decoder_prompt_ids(language=lang, task="transcribe")
-def transcribe(audio_input):
-    if audio_input is None:
-        return "ERROR: Please record or upload an audio file."
-    text = pipe(audio_input)["text"]
-    return text
-def _return_yt_html_embed(yt_url):
-    video_id = yt_url.split("?v=")[-1].split("&")[0]
-    return (
-        f'<center><iframe width="500" height="320" '
-        f'src="https://www.youtube.com/embed/{video_id}" '
-        f'frameborder="0" allowfullscreen></iframe></center>'
-    )
 def yt_transcribe(yt_url):
     if not yt_url:
         return "", "ERROR: You must provide a YouTube URL."
     yt = pt.YouTube(yt_url)
-    html_embed = _return_yt_html_embed(yt_url)
     stream = yt.streams.filter(only_audio=True).first()
     stream.download(filename="audio.mp3")
     text = pipe("audio.mp3")["text"]
-    return html_embed, text
 with gr.Blocks() as demo:
     with gr.Tab("🎤 Transcribe Audio"):
-        gr.Markdown("## 🎧 Запішы або загрузі аўдыё і атрымай транскрыпцыю")
         audio_input = gr.Audio(type="filepath", label="Record or Upload Audio")
         transcribe_button = gr.Button("Transcribe")
-        transcription_output = gr.Textbox(label="Transcribed Text")
-        transcribe_button.click(fn=transcribe, inputs=[audio_input], outputs=[transcription_output])
     with gr.Tab("📺 Transcribe YouTube"):
-        gr.Markdown("## 🎬 Устаў спасылку на відэа з YouTube і атрымай транскрыпцыю")
         yt_input = gr.Textbox(label="YouTube URL", placeholder="https://www.youtube.com/watch?v=...")
         yt_button = gr.Button("Transcribe YouTube")
-        yt_video = gr.HTML()
-        yt_transcription = gr.Textbox(label="Transcribed Text")
-        yt_button.click(fn=yt_transcribe, inputs=[yt_input], outputs=[yt_video, yt_transcription])
 demo.launch()

 import pytube as pt
 from transformers import pipeline
+MODEL_NAME = "ales/whisper-small-belarusian"
 lang = "be"
 device = 0 if torch.cuda.is_available() else "cpu"
 pipe.model.config.forced_decoder_ids = pipe.tokenizer.get_decoder_prompt_ids(language=lang, task="transcribe")
+def transcribe(audio_file):
+    if audio_file is None:
+        return "ERROR: Please upload or record audio"
+    return pipe(audio_file)["text"]
 def yt_transcribe(yt_url):
     if not yt_url:
         return "", "ERROR: You must provide a YouTube URL."
     yt = pt.YouTube(yt_url)
+    video_id = yt_url.split("?v=")[-1].split("&")[0]
+    embed = f'<center><iframe width="500" height="320" src="https://www.youtube.com/embed/{video_id}" frameborder="0" allowfullscreen></iframe></center>'
     stream = yt.streams.filter(only_audio=True).first()
     stream.download(filename="audio.mp3")
     text = pipe("audio.mp3")["text"]
+    return embed, text
 with gr.Blocks() as demo:
     with gr.Tab("🎤 Transcribe Audio"):
+        gr.Markdown("## Запішы або загрузі аўдыё")
         audio_input = gr.Audio(type="filepath", label="Record or Upload Audio")
         transcribe_button = gr.Button("Transcribe")
+        transcription_output = gr.Textbox(label="Transcription")
+        transcribe_button.click(
+            fn=transcribe,
+            inputs=[audio_input],
+            outputs=[transcription_output],
+        )
     with gr.Tab("📺 Transcribe YouTube"):
+        gr.Markdown("## Устаў спасылку на YouTube-відэа")
         yt_input = gr.Textbox(label="YouTube URL", placeholder="https://www.youtube.com/watch?v=...")
         yt_button = gr.Button("Transcribe YouTube")
+        yt_embed = gr.HTML()
+        yt_text = gr.Textbox(label="Transcription")
+        yt_button.click(
+            fn=yt_transcribe,
+            inputs=[yt_input],
+            outputs=[yt_embed, yt_text],
+        )
 demo.launch()