radarbackend11262024v11

Runtime error

Pijush2023 committed on Oct 25, 2024

Commit

a54b7bc

verified ·

1 Parent(s): 164b9f7

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -73,28 +73,20 @@ def transcribe_function(stream, new_chunk):
     if max_abs_y > 0:
         y = y / max_abs_y
-    # Concatenate the new chunk to the existing stream if available
-    stream = y if stream is None else np.concatenate([stream, y])
-    # Check if the stream is at least 7 seconds long
-    duration = len(stream) / sr
-    if duration >= 7:
-        # Process the audio data for transcription
-        result = pipe_asr({"array": stream, "sampling_rate": sr}, return_timestamps=False)
-        full_text = result.get("text", "")
-        print(f"Transcription: {full_text}")
-        # Retrieve hybrid response using Neo4j and other methods
-        response_text = retriever(full_text)
-        print(f"Response: {response_text}")
-        # Generate audio from the response text
-        audio_path = generate_audio_elevenlabs(response_text)
-        # Reset the stream for the next chunk and return the generated audio
-        return None, audio_path, full_text  # Clear the stream after processing
-    return stream, None, ""  # Continue streaming until 7 seconds is reached
@@ -226,9 +218,9 @@ def process_audio_query(audio_input):
 interface = gr.Interface(
     fn=process_audio_query,
     inputs=gr.Audio(sources="microphone", type="numpy",streaming=True),
-    outputs=gr.Audio(type="filepath", autoplay=True),
     description="Ask questions via audio and receive audio responses.",
-    allow_flagging="never"  # Disables the Flag button
 )
 # Launch the Gradio app

     if max_abs_y > 0:
         y = y / max_abs_y
+    # Append the new chunk to the existing stream, or start a new stream if it is None or empty
+    if stream is not None and len(stream) > 0:
+        stream = np.concatenate([stream, y])
+    else:
+        stream = y
+    # Process the audio data for transcription
+    result = pipe_asr({"array": stream, "sampling_rate": sr}, return_timestamps=False)
+    full_text = result.get("text", "")
+    # Start a thread to reset the state after 10 seconds
+    threading.Thread(target=auto_reset_state).start()
+    return stream, full_text, full_text
 interface = gr.Interface(
     fn=process_audio_query,
     inputs=gr.Audio(sources="microphone", type="numpy",streaming=True),
+    outputs=gr.Audio(type="filepath", autoplay=True,interactive=False),
     description="Ask questions via audio and receive audio responses.",
+    #allow_flagging="never"  # Disables the Flag button
 )
 # Launch the Gradio app