Spaces:

shamimjony1000
/

tai

Sleeping

App Files Files Community

tai / voice_handler.py

shamimjony1000

Update voice_handler.py

f896422 verified about 1 month ago

raw

history blame contribute delete

2.92 kB

	import speech_recognition as sr

	class VoiceHandler:
	def __init__(self):
	self.recognizer = sr.Recognizer()
	self.recognizer.energy_threshold = 4000
	self.recognizer.dynamic_energy_threshold = True
	self.recognizer.pause_threshold = 0.8
	self.permission_granted = False

	def check_microphone_access(self) -> bool:
	"""Check if microphone is accessible."""
	try:
	with sr.Microphone() as source:
	self.recognizer.adjust_for_ambient_noise(source, duration=0.1)
	return True
	except OSError as e:
	print("OSError: Microphone not accessible. Please check your microphone connection and ALSA configuration.")
	print(f"Details: {str(e)}")
	return False
	except Exception as e:
	print(f"Unexpected error while accessing microphone: {str(e)}")
	return False

	def request_permissions(self) -> bool:
	"""Request microphone permissions."""
	try:
	if self.check_microphone_access():
	self.permission_granted = True
	return True
	return False
	except Exception as e:
	print(f"Error requesting permissions: {str(e)}")
	return False

	def listen_for_voice(self, language: str = "mixed") -> str:
	if not self.permission_granted and not self.request_permissions():
	return "Error: Microphone permissions required."

	try:
	with sr.Microphone() as source:
	print("Adjusting for ambient noise...")
	self.recognizer.adjust_for_ambient_noise(source, duration=1)
	print("Listening...")
	audio = self.recognizer.listen(source, timeout=5, phrase_time_limit=10)
	print("Processing speech...")
	return self._process_audio(audio, language)

	except sr.RequestError as e:
	return f"Could not request results from speech service: {str(e)}"
	except sr.UnknownValueError:
	return "Could not understand audio. Please try again."
	except sr.WaitTimeoutError:
	return "Listening timed out. Please try again."
	except OSError as e:
	return "OSError: Microphone not accessible. Check your connection and ALSA configuration."
	except Exception as e:
	return f"Error: {str(e)}"

	def _process_audio(self, audio, language: str) -> str:
	if language in ["ar-SA", "mixed"]:
	try:
	return self.recognizer.recognize_google(audio, language="ar-SA")
	except sr.UnknownValueError:
	if language == "mixed":
	return self.recognizer.recognize_google(audio, language="en-US")
	raise
	return self.recognizer.recognize_google(audio, language="en-US")