Spaces:

Gigaverse
/

ivrit-ai-streaming

Sleeping

ivrit-ai-streaming / client.py

AshDavid12

complete change

5a62402 10 months ago

6.36 kB

	import asyncio
	import websockets
	import requests
	import ssl
	import wave
	import logging
	import sys

	# Parameters for reading and sending the audio.
	# NOTE(review): in the code shown here this URL is only referenced by the
	# commented-out, download-based send_audio near the end of the file; the
	# active send_audio reads a local WAV path instead.
	AUDIO_FILE_URL = "https://raw.githubusercontent.com/AshDavid12/runpod-serverless-forked/main/test_hebrew.wav" # Use WAV file
	# Alternative sample file (long_hebrew.wav), currently disabled:
	#AUDIO_FILE_URL = "https://raw.githubusercontent.com/AshDavid12/hugging_face_ivrit_streaming/main/long_hebrew.wav"



	# Logging: send DEBUG-and-above records to stdout. force=True makes
	# basicConfig replace any handlers already attached to the root logger.
	logging.basicConfig(
	    handlers=[logging.StreamHandler(sys.stdout)],
	    format='%(asctime)s %(levelname)s: %(message)s',
	    level=logging.DEBUG,
	    force=True,
	)
	logger = logging.getLogger(__name__)

	async def send_receive():
	    """Connect to the streaming server and run sender and receiver together.

	    Opens one WebSocket connection, then runs send_audio and
	    receive_transcriptions concurrently on it. Any exception raised while
	    connecting or while the two coroutines run is logged and swallowed.
	    """
	    server_uri = "wss://gigaverse-ivrit-ai-streaming.hf.space/ws"  # Update with your server's address if needed
	    logger.info(f"Connecting to server at {server_uri}")
	    try:
	        async with websockets.connect(server_uri) as websocket:
	            logger.info("WebSocket connection established")
	            # gather() wraps each coroutine in its own task, so sending and
	            # receiving proceed concurrently on the same connection.
	            await asyncio.gather(
	                send_audio(websocket),
	                receive_transcriptions(websocket),
	            )
	    except Exception as exc:
	        logger.error(f"WebSocket connection error: {exc}")

	async def send_audio(websocket, wav_file='path/to/your/audio.wav'):
	    """Stream a WAV file over the WebSocket in 0.1-second chunks.

	    The file must be mono, 16-bit, 16 kHz; otherwise an error is logged and
	    nothing is sent. Frames are sent as raw bytes, and the coroutine sleeps
	    for one chunk duration after each send to simulate real-time streaming.

	    Args:
	        websocket: Connection object exposing an awaitable ``send(data)``.
	        wav_file: Path of the WAV file to stream. The default is a
	            placeholder; replace it or pass a real path.

	    Errors (including a missing or unreadable file) are logged, not raised.
	    """
	    logger.info(f"Opening WAV file: {wav_file}")

	    # Bound before the try block so the finally clause can tell whether the
	    # open succeeded. Previously a failed open left the name unbound and the
	    # finally clause itself raised, masking the real error.
	    wf = None
	    try:
	        # Open the WAV file
	        wf = wave.open(wav_file, 'rb')

	        # Log WAV file parameters
	        channels = wf.getnchannels()
	        sampwidth = wf.getsampwidth()
	        framerate = wf.getframerate()
	        nframes = wf.getnframes()
	        duration = nframes / framerate
	        logger.debug(f"WAV file parameters: channels={channels}, sample_width={sampwidth}, framerate={framerate}, frames={nframes}, duration={duration:.2f}s")

	        # Ensure the WAV file has the expected parameters
	        if channels != 1 or sampwidth != 2 or framerate != 16000:
	            logger.error("WAV file must be mono channel, 16-bit samples, 16kHz sampling rate")
	            return

	        chunk_duration = 0.1  # in seconds
	        chunk_size = int(framerate * chunk_duration)  # frames per chunk
	        logger.info(f"Starting to send audio data in chunks of {chunk_duration}s ({chunk_size} frames)")

	        total_chunks = 0
	        total_bytes_sent = 0

	        # readframes() returns empty bytes once the file is exhausted
	        while data := wf.readframes(chunk_size):
	            await websocket.send(data)
	            total_chunks += 1
	            total_bytes_sent += len(data)
	            logger.debug(f"Sent chunk {total_chunks}: {len(data)} bytes")
	            await asyncio.sleep(chunk_duration)  # Simulate real-time streaming
	        logger.info("End of WAV file reached")

	        logger.info(f"Finished sending audio data: {total_chunks} chunks sent, total bytes sent: {total_bytes_sent}")
	    except Exception as e:
	        logger.error(f"Send audio error: {e}")
	    finally:
	        # Only close (and report closing) a file that was actually opened
	        if wf is not None:
	            wf.close()
	            logger.info("WAV file closed")

	async def receive_transcriptions(websocket):
	    """Log and print each message received on the WebSocket.

	    Runs until iteration over the connection stops. Exceptions raised while
	    receiving are logged and not propagated to the caller.
	    """
	    try:
	        logger.info("Starting to receive transcriptions")
	        # Iterating the connection yields one incoming message per step
	        async for transcription in websocket:
	            logger.info(f"Received transcription: {transcription}")
	            print(f"Transcription: {transcription}")
	    except Exception as exc:
	        logger.error(f"Receive transcription error: {exc}")

	# Script entry point: start an event loop and run the client until
	# send_receive() returns.
	if __name__ == "__main__":
	    asyncio.run(send_receive())














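	# ---------------------------------------------------------------------------
	# Disabled alternative implementation, kept commented out for reference.
	# It downloads AUDIO_FILE_URL with requests and forwards it in 512 KiB
	# buffers, sends keepalive pings every 30 seconds, and connects to the
	# /wtranscribe endpoint with TLS certificate verification turned off
	# (ssl.CERT_NONE).
	# ---------------------------------------------------------------------------
	# async def send_audio(websocket):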
	# buffer_size = 512 * 1024 #HAVE TO HAVE 512!!
	# audio_buffer = bytearray()
	#
	# with requests.get(AUDIO_FILE_URL, stream=True, allow_redirects=False) as response:
	# if response.status_code == 200:
	# print("Starting to stream audio file...")
	#
	# for chunk in response.iter_content(chunk_size=1024): # Stream in chunks
	# if chunk:
	# audio_buffer.extend(chunk)
	# #print(f"Received audio chunk of size {len(chunk)} bytes.")
	#
	# # Send buffered audio data once it's large enough
	# if len(audio_buffer) >= buffer_size:
	# await websocket.send(audio_buffer)
	# #print(f"Sent {len(audio_buffer)} bytes of audio data.")
	# audio_buffer.clear()
	# await asyncio.sleep(0.01)
	#
	# print("Finished sending audio.")
	# else:
	# print(f"Failed to download audio file. Status code: {response.status_code}")
	#
	#
	# async def receive_transcription(websocket):
	# while True:
	# try:
	#
	# transcription = await websocket.recv()
	# # Receive transcription from the server
	# print(f"Transcription: {transcription}")
	# except Exception as e:
	# print(f"Error receiving transcription: {e}")
	# #await asyncio.sleep(30)
	# break
	#
	#
	# async def send_heartbeat(websocket):
	# while True:
	# try:
	# await websocket.ping()
	# print("Sent keepalive ping")
	# except websockets.ConnectionClosed:
	# print("Connection closed, stopping heartbeat")
	# break
	# await asyncio.sleep(30) # Send ping every 30 seconds (adjust as needed)
	#
	#
	# async def run_client():
	# uri = ("wss://gigaverse-ivrit-ai-streaming.hf.space/wtranscribe") # WebSocket URL
	# ssl_context = ssl.SSLContext(ssl.PROTOCOL_TLS_CLIENT)
	# ssl_context.check_hostname = False
	# ssl_context.verify_mode = ssl.CERT_NONE
	# while True:
	# try:
	# async with websockets.connect(uri, ssl=ssl_context, ping_timeout=1000, ping_interval=50) as websocket:
	# await asyncio.gather(
	# send_audio(websocket),
	# receive_transcription(websocket),
	# send_heartbeat(websocket)
	# )
	# except websockets.ConnectionClosedError as e:
	# print(f"WebSocket closed with error: {e}")
	# # except Exception as e:
	# # print(f"Unexpected error: {e}")
	# #
	# # print("Reconnecting in 5 seconds...")
	# # await asyncio.sleep(5) # Wait 5 seconds before reconnecting
	#
	# asyncio.run(run_client())