Spaces:

Gigaverse
/

ivrit-ai-streaming

Sleeping

App Files Files Community

AshDavid12 committed on Sep 12, 2024

Commit

cf31b20

1 Parent(s): ebaaf9b

close exec change

Browse files

Files changed (2) hide show

client.py +9 -2
infer.py +4 -5

client.py CHANGED Viewed

@@ -7,6 +7,7 @@ SAMPLE_RATE = 16000
 CHUNK_SIZE = 1024  # Size of the audio chunk sent at a time
 AUDIO_FILE = "https://raw.githubusercontent.com/AshDavid12/hugging_face_ivrit_streaming/main/test_copy.mp3"  # Path to the mp3 file
 async def send_audio(websocket):
     with wave.open(AUDIO_FILE, "rb") as wf:
         data = wf.readframes(CHUNK_SIZE)
@@ -15,6 +16,7 @@ async def send_audio(websocket):
             await asyncio.sleep(CHUNK_SIZE / SAMPLE_RATE)  # Simulate real-time by waiting for the duration of the chunk
             data = wf.readframes(CHUNK_SIZE)
 async def receive_transcription(websocket):
     while True:
         try:
@@ -24,9 +26,14 @@ async def receive_transcription(websocket):
             print(f"Error: {e}")
             break
 async def run_client():
-    uri = "wss://gigaverse-ivrit-ai-streaming.hf.space/ws/transcribe"  # Replace with your Hugging Face Space WebSocket URL
-    async with websockets.connect(uri) as websocket:
         await asyncio.gather(
             send_audio(websocket),
             receive_transcription(websocket)

 CHUNK_SIZE = 1024  # Size of the audio chunk sent at a time
 AUDIO_FILE = "https://raw.githubusercontent.com/AshDavid12/hugging_face_ivrit_streaming/main/test_copy.mp3"  # Path to the mp3 file
 async def send_audio(websocket):
     with wave.open(AUDIO_FILE, "rb") as wf:
         data = wf.readframes(CHUNK_SIZE)
             await asyncio.sleep(CHUNK_SIZE / SAMPLE_RATE)  # Simulate real-time by waiting for the duration of the chunk
             data = wf.readframes(CHUNK_SIZE)
 async def receive_transcription(websocket):
     while True:
         try:
             print(f"Error: {e}")
             break
+import ssl
 async def run_client():
+    uri = ("wss://gigaverse-ivrit-ai-streaming.hf.space/ws/transcribe")  # Replace with your Hugging Face Space WebSocket URL
+    ssl_context = ssl.SSLContext(ssl.PROTOCOL_TLS_CLIENT)
+    ssl_context.check_hostname = False
+    ssl_context.verify_mode = ssl.CERT_NONE
+    async with websockets.connect(uri, ssl=ssl_context) as websocket:
         await asyncio.gather(
             send_audio(websocket),
             receive_transcription(websocket)

infer.py CHANGED Viewed

@@ -12,7 +12,7 @@ from typing import Optional
 import asyncio
 # Configure logging
-logging.basicConfig(level=logging.DEBUG, format='%(asctime)s - %(levelname)s - %(message)s')
 device = 'cuda' if torch.cuda.is_available() else 'cpu'
 logging.info(f'Device selected: {device}')
@@ -159,11 +159,11 @@ def transcribe_core_ws(audio_file, last_transcribed_time):
     # Track the new segments and update the last transcribed time
     for s in segs:
-        logging.debug(f"Processing segment with start time: {s.start} and end time: {s.end}")
         # Only process segments that start after the last transcribed time
         if s.start >= last_transcribed_time:
-            logging.debug(f"New segment found starting at {s.start} seconds.")
             words = [{'start': w.start, 'end': w.end, 'word': w.word, 'probability': w.probability} for w in s.words]
             seg = {
@@ -203,7 +203,7 @@ async def websocket_transcribe(websocket: WebSocket):
             # Continuously receive and process audio chunks
             while True:
                 try:
-                    logging.debug("Waiting to receive the next chunk of audio data from WebSocket.")
                     # Receive the next chunk of audio data
                     audio_chunk = await websocket.receive_bytes()
@@ -243,7 +243,6 @@ async def websocket_transcribe(websocket: WebSocket):
         await websocket.send_json({"error": str(e)})
     finally:
         logging.info("Cleaning up and closing WebSocket connection.")
-        await websocket.close()

 import asyncio
 # Configure logging
+logging.basicConfig(level=logging.INFO, format='%(asctime)s - %(levelname)s - %(message)s')
 device = 'cuda' if torch.cuda.is_available() else 'cpu'
 logging.info(f'Device selected: {device}')
     # Track the new segments and update the last transcribed time
     for s in segs:
+        logging.info(f"Processing segment with start time: {s.start} and end time: {s.end}")
         # Only process segments that start after the last transcribed time
         if s.start >= last_transcribed_time:
+            logging.info(f"New segment found starting at {s.start} seconds.")
             words = [{'start': w.start, 'end': w.end, 'word': w.word, 'probability': w.probability} for w in s.words]
             seg = {
             # Continuously receive and process audio chunks
             while True:
                 try:
+                    logging.info("Waiting to receive the next chunk of audio data from WebSocket.")
                     # Receive the next chunk of audio data
                     audio_chunk = await websocket.receive_bytes()
         await websocket.send_json({"error": str(e)})
     finally:
         logging.info("Cleaning up and closing WebSocket connection.")