Spaces:
Sleeping
Sleeping
File size: 836 Bytes
1d0f027 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 |
import whisper
import speech_recognition as sr
from pydub import AudioSegment
def transcribe_speech_recognition(file_path):
r = sr.Recognizer()
audio_file = sr.AudioFile(file_path)
with audio_file as source:
audio = r.record(source)
transcription_result = r.recognize_google(audio, language="es")
return transcription_result
# Function to convert mp3 file to wav
def convert_mp3_to_wav(mp3_path):
audio = AudioSegment.from_mp3(mp3_path)
wav_path = mp3_path.replace('.mp3', '.wav')
audio.export(wav_path, format="wav")
return wav_path
# Function to transcribe audio using OpenAI Whisper
def transcribe_whisper(file_path):
# models = ['base', 'small', 'medium', 'large', 'tiny']
model = whisper.load_model("base")
result = model.transcribe(file_path)
return result["text"]
|