Spaces:
Sleeping
Sleeping
File size: 1,425 Bytes
0cfe2ed 896746e 0cfe2ed 896746e 0cfe2ed 896746e 0cfe2ed |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 |
import speech_recognition as sr
from gtts import gTTS
import os
import wave
def record_audio(filename, sec=5, sr=44100):
    """Capture one spoken phrase from the default microphone into a WAV file.

    Args:
        filename: Path of the WAV file to write (opened in binary mode).
        sec: Value passed to ``Recognizer.listen`` as ``timeout``; per the
            SpeechRecognition docs this is how long to wait for speech to
            start before ``WaitTimeoutError`` is raised.
        sr: Sample rate in Hz requested from the microphone.
    """
    # The ``sr`` parameter shadows the module-level ``speech_recognition as sr``
    # alias, so inside this function ``sr`` is an int.  Import the library
    # under a different local name instead of renaming the public parameter.
    import speech_recognition as speech

    recognizer = speech.Recognizer()

    with speech.Microphone(sample_rate=sr) as source:
        print("Recording... Speak now!")
        # Calibrate the energy threshold against background noise first.
        recognizer.adjust_for_ambient_noise(source)
        audio = recognizer.listen(source, timeout=sec)

    # Persist the captured audio as WAV bytes.
    with open(filename, "wb") as f:
        f.write(audio.get_wav_data())
def transcribe_audio(filename):
    """Transcribe the audio file at *filename* with Google's recognizer.

    Returns:
        A dict with a single ``"text"`` key holding either the transcript
        or a human-readable message describing why recognition failed.
    """
    engine = sr.Recognizer()

    # Load the whole file into an AudioData object.
    with sr.AudioFile(filename) as clip:
        captured = engine.record(clip)

    try:
        spoken = engine.recognize_google(captured)
    except sr.UnknownValueError:
        # The service could not make sense of the audio.
        return {"text": "Sorry, I could not understand the audio."}
    except sr.RequestError as err:
        # The request to the recognition service itself failed.
        return {"text": f"Request failed; {err}"}

    return {"text": spoken}
def save_text_as_audio(text, audio_filename):
    """Synthesize *text* as English speech and write it to *audio_filename*."""
    # Build the gTTS request at normal speed and save it in one step.
    gTTS(text=text, lang='en', slow=False).save(audio_filename)
def play_audio(filename):
    """Open *filename* with the operating system's default handler.

    The path is handed to the platform launcher as a single argument rather
    than interpolated into a shell command, so names containing spaces or
    shell metacharacters are handled correctly.

    Args:
        filename: Path of the audio file to play.

    Failures to launch a player are reported on stderr instead of raised,
    keeping the original non-raising behaviour.
    """
    import subprocess
    import sys

    path = os.fspath(filename)
    try:
        if sys.platform.startswith("win"):
            # Windows: same effect as the shell's ``start`` command.
            os.startfile(path)
        else:
            # macOS ships ``open``; other Unix desktops provide ``xdg-open``.
            launcher = "open" if sys.platform == "darwin" else "xdg-open"
            subprocess.run([launcher, path], check=False)
    except OSError as exc:
        print(f"Could not play {path!r}: {exc}", file=sys.stderr)
|