|
import gradio as gr |
|
import speech_recognition as sr |
|
|
|
|
|
def audio_to_text(audio):
    """Transcribe a recorded audio file to Spanish text.

    Args:
        audio: Path to an audio file that ``sr.AudioFile`` can open, or a
            falsy value (``None`` / empty string) when there is no recording.

    Returns:
        The transcription returned by ``recognize_google`` with
        ``language="es-ES"``; an empty string when no audio was supplied; or
        a Spanish error message when the speech could not be understood or
        the recognition request failed.
    """
    # The UI callback may fire without a recording (e.g. the input was
    # cleared); sr.AudioFile cannot open a missing path, so return early.
    if not audio:
        return ""

    recognizer = sr.Recognizer()

    # Keep the file open only while its contents are read into memory.
    with sr.AudioFile(audio) as source:
        audio_data = recognizer.record(source)

    try:
        return recognizer.recognize_google(audio_data, language="es-ES")
    except sr.UnknownValueError:
        # The service answered but could not make out any speech.
        return "No se pudo entender el audio."
    except sr.RequestError:
        # The request to the recognition service failed.
        return "No se pudo conectar al servicio de reconocimiento."
|
|
|
|
|
# Gradio UI: microphone recording in, transcribed text out.
# type="filepath" hands audio_to_text a path on disk, which is what
# sr.AudioFile expects; live=True re-runs the callback whenever the input
# changes instead of waiting for a submit button.
interface = gr.Interface(
    fn=audio_to_text,
    inputs=gr.Audio(sources="microphone", type="filepath"),
    outputs="text",
    # Accented characters restored: the previous literals contained
    # mis-decoded text ("贸" in place of "ó").
    title="Conversión de Audio a Texto",
    description="Convierte audio capturado por el micrófono en texto utilizando reconocimiento de voz.",
    live=True,
)


# Start the web server only when run as a script, not when imported.
if __name__ == "__main__":
    interface.launch()
|
|