from transformers import pipeline import gradio as gr import time import unicodedata p = pipeline("automatic-speech-recognition",model="kingabzpro/wav2vec2-large-xls-r-300m-Urdu") def transcribe(audio, state=""): time.sleep(2) text = p(audio)["text"] state += unicodedata.normalize("NFC",text) + " " return state, state ################### Gradio Web APP ################################ title = "Real-Time Urdu ASR" description = """
Fine-tuning XLS-R for Multi-Lingual ASR with 🤗 Transformers