File size: 455 Bytes
96de449
b4b36f0
96de449
 
b4b36f0
96de449
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
from transformers import pipeline
import gradio as gr
import numpy as np
import librosa

# Build the Gujarati speech-recognition pipeline once, at import time, so the
# loaded model is shared by every call instead of being re-created per request.
transcriber_gujarati = pipeline(
    task="automatic-speech-recognition",
    model="ai4bharat/indicwav2vec_v1_gujarati",
)

def transcribe(audio):
    """Transcribe a microphone recording with the Gujarati ASR pipeline.

    Args:
        audio: ``(sample_rate, samples)`` tuple, or ``None`` when nothing was
            recorded. ``samples`` is a NumPy array of any numeric dtype; a
            2-D array is treated as ``(samples, channels)`` and averaged
            down to mono.

    Returns:
        The ``"text"`` field of the pipeline result, or an empty string when
        there is no audio to transcribe.
    """
    # The UI hands over None if the user submits without recording anything;
    # unpacking it would raise a TypeError.
    if audio is None:
        return ""

    sr, y = audio
    y = np.asarray(y, dtype=np.float32)

    # np.max raises on an empty array, and there is nothing to transcribe.
    if y.size == 0:
        return ""

    # Down-mix multi-channel input. librosa.resample operates along the last
    # axis, so a (samples, channels) array would otherwise be resampled
    # across channels instead of across time.
    if y.ndim > 1:
        y = y.mean(axis=1)

    # Peak-normalise to [-1, 1]. A silent clip has a peak of 0; dividing by
    # it would fill the signal with NaNs, so leave such clips untouched.
    peak = np.max(np.abs(y))
    if peak > 0:
        y = y / peak

    # Resample to the 16 kHz rate passed on to the recognizer.
    y = librosa.resample(y=y, orig_sr=sr, target_sr=16000)
    return transcriber_gujarati(y)["text"]

# Wire the transcriber to a microphone input and a text output, then serve it.
demo = gr.Interface(fn=transcribe, inputs="microphone", outputs="text")
demo.launch()