|
import gradio as gr |
|
import requests |
|
import youtube_dl |
|
from typing import Optional |
|
import json |
|
import subprocess |
|
import os |
|
import tempfile |
|
|
|
|
|
API_URL = "http://astarwiz.com:9998" |
|
|
|
def download_youtube_audio(url: str, output_dir: Optional[str] = None) -> str: |
|
if output_dir is None: |
|
output_dir = tempfile.gettempdir() |
|
|
|
ydl_opts = { |
|
'format': 'bestaudio/best', |
|
'extractaudio': True, |
|
'audioformat': 'mp3', |
|
'outtmpl': os.path.join(output_dir, '%(title)s.%(ext)s'), |
|
'noplaylist': True, |
|
} |
|
|
|
try: |
|
with youtube_dl.YoutubeDL(ydl_opts) as ydl: |
|
info_dict = ydl.extract_info(url, download=True) |
|
audio_file = os.path.join(output_dir, f"{info_dict['title']}.mp3") |
|
|
|
print(f"Successfully downloaded: {audio_file}") |
|
return audio_file |
|
except Exception as e: |
|
raise Exception(f"Error downloading YouTube audio: {str(e)}") |
|
|
|
def run_asr(audio_file, youtube_url): |
|
temp_file = None |
|
try: |
|
if youtube_url: |
|
|
|
audio_file = download_youtube_audio(youtube_url) |
|
temp_file = audio_file |
|
elif not audio_file: |
|
return "Please provide either an audio file or a YouTube URL." |
|
|
|
files = {'file': open(audio_file, 'rb')} |
|
data = {'language': 'en', 'model_name': 'whisper-large-v2-imda'} |
|
response = requests.post(f"{API_URL}/asr", data=data, files=files) |
|
|
|
if response.status_code == 200: |
|
return response.json().get("text", "") |
|
else: |
|
return f"Error: {response.status_code}" |
|
except Exception as e: |
|
return f"Error: {str(e)}" |
|
finally: |
|
|
|
if temp_file and os.path.exists(temp_file): |
|
os.remove(temp_file) |
|
|
|
def embed_youtube(youtube_url): |
|
if youtube_url: |
|
try: |
|
|
|
video_id = youtube_url.split("v=")[1] |
|
if 'short' in youtube_url: |
|
video_id = video_id.split("/")[-1] |
|
print(video_id) |
|
embed_html = f'<iframe width="560" height="315" src="https://www.youtube.com/embed/{video_id}" frameborder="0" allow="autoplay; encrypted-media" allowfullscreen></iframe>' |
|
return gr.update(value=embed_html, visible=True), "", None |
|
except: |
|
return gr.update(value="", visible=False), "Invalid YouTube URL", None |
|
return gr.update(value="", visible=False), "", None |
|
|
|
def clear_on_audio_input(audio): |
|
if audio is not None: |
|
return "", gr.update(value="", visible=False), "" |
|
return gr.update(), gr.update(), gr.update() |
|
|
|
|
|
with gr.Blocks(theme=gr.themes.Soft()) as demo: |
|
gr.Markdown("# ποΈ Audio Transcription Service") |
|
gr.Markdown("Upload an audio file, record your voice, or paste a YouTube URL to get an English transcription.") |
|
|
|
with gr.Row(): |
|
with gr.Column(scale=2): |
|
audio_input = gr.Audio(sources=['microphone', 'upload'], type="filepath", label="Audio Input") |
|
youtube_input = gr.Textbox(label="YouTube URL", placeholder="Or paste a YouTube URL here...") |
|
video_player = gr.HTML(visible=False) |
|
with gr.Column(scale=3): |
|
result = gr.Textbox( |
|
label="Transcription Result", |
|
placeholder="Your transcription will appear here...", |
|
lines=10 |
|
) |
|
|
|
run_button = gr.Button("π Transcribe Audio", variant="primary") |
|
run_button.click(run_asr, inputs=[audio_input, youtube_input], outputs=[result]) |
|
|
|
|
|
youtube_input.change( |
|
fn=embed_youtube, |
|
inputs=[youtube_input], |
|
outputs=[video_player, result, audio_input] |
|
) |
|
|
|
|
|
audio_input.change( |
|
fn=clear_on_audio_input, |
|
inputs=[audio_input], |
|
outputs=[result, video_player, youtube_input] |
|
) |
|
|
|
gr.Markdown("### How to use:") |
|
gr.Markdown("1. Upload an audio file or record your voice using the microphone, OR paste a YouTube URL.") |
|
gr.Markdown("2. If you paste a YouTube URL, the video will be displayed for your reference, and any previous transcription or audio input will be cleared.") |
|
gr.Markdown("3. If you upload or record audio, any previous transcription, YouTube URL, and video will be cleared.") |
|
gr.Markdown("4. Click the 'Transcribe Audio' button to start the process.") |
|
gr.Markdown("5. Wait for a few seconds, and your transcription will appear in the result box.") |
|
|
|
|
|
demo.launch() |
|
|