DrishtiSharma commited on
Commit
abce794
·
verified ·
1 Parent(s): af77c7a

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +19 -43
app.py CHANGED
@@ -10,6 +10,7 @@ from langchain_groq import ChatGroq
10
  from langchain.memory import ConversationBufferMemory
11
  from langchain.chains import ConversationalRetrievalChain
12
  from PyPDF2 import PdfReader
 
13
  from groq import Groq
14
 
15
  # Clear ChromaDB cache to fix tenant issue
@@ -18,7 +19,7 @@ chromadb.api.client.SharedSystemClient.clear_system_cache()
18
  # Ensure required environment variables are set
19
  GROQ_API_KEY = os.getenv("GROQ_API_KEY")
20
  if not GROQ_API_KEY:
21
- st.error("GROQ_API_KEY is not set. Please configure it in Hugging Face Spaces secrets.")
22
  st.stop()
23
 
24
  # Initialize Groq Client for transcription and LLM
@@ -52,43 +53,21 @@ def chat_chain(vectorstore):
52
  )
53
  return chain
54
 
55
- # JavaScript for recording audio
56
- RECORD_JS = """
57
- const sleep = time => new Promise(resolve => setTimeout(resolve, time));
58
- const b2text = blob => new Promise(resolve => {
59
- const reader = new FileReader();
60
- reader.onloadend = e => resolve(e.srcElement.result);
61
- reader.readAsDataURL(blob);
62
- });
63
- var record = time => new Promise(async resolve => {
64
- stream = await navigator.mediaDevices.getUserMedia({ audio: true });
65
- recorder = new MediaRecorder(stream);
66
- chunks = [];
67
- recorder.ondataavailable = e => chunks.push(e.data);
68
- recorder.start();
69
- await sleep(time);
70
- recorder.onstop = async () => {
71
- blob = new Blob(chunks);
72
- text = await b2text(blob);
73
- resolve(text);
74
- };
75
- recorder.stop();
76
- });
77
- """
78
-
79
- def record_audio(seconds=5):
80
- """Record audio via JavaScript and save it as a .wav file."""
81
- st.write("Recording audio...")
82
- from streamlit.components.v1 import html
83
- audio_b64 = st.experimental_js("record", seconds * 1000)
84
- audio_bytes = b64decode(audio_b64.split(",")[1])
85
- audio_file_path = "recorded_audio.wav"
86
- with open(audio_file_path, "wb") as f:
87
- f.write(audio_bytes)
88
- return audio_file_path
89
-
90
  def transcribe_audio(file_path):
91
- """Transcribe audio using Groq Whisper."""
92
  with open(file_path, "rb") as file:
93
  transcription = groq_client.audio.transcriptions.create(
94
  file=(file_path, file.read()),
@@ -120,16 +99,13 @@ if uploaded_files:
120
 
121
  # Audio Input Mode
122
  elif input_method == "Audio Input":
123
- if st.button("Record Audio"):
124
- audio_file = record_audio(5)
125
- st.audio(audio_file)
126
-
127
- # Transcription
128
  st.write("Transcribing audio...")
129
  transcription = transcribe_audio(audio_file)
130
  st.write(f"**You said:** {transcription}")
131
 
132
- # Generate Response
133
  with st.spinner("Generating response..."):
134
  response = chain({"question": transcription})["answer"]
135
  st.write(f"**Response:** {response}")
 
10
  from langchain.memory import ConversationBufferMemory
11
  from langchain.chains import ConversationalRetrievalChain
12
  from PyPDF2 import PdfReader
13
+ from streamlit_audio_recorder import st_audio_recorder
14
  from groq import Groq
15
 
16
  # Clear ChromaDB cache to fix tenant issue
 
19
  # Ensure required environment variables are set
20
  GROQ_API_KEY = os.getenv("GROQ_API_KEY")
21
  if not GROQ_API_KEY:
22
+ st.error("GROQ_API_KEY is not set. Please configure it in your environment variables.")
23
  st.stop()
24
 
25
  # Initialize Groq Client for transcription and LLM
 
53
  )
54
  return chain
55
 
56
# Function to record audio using streamlit_audio_recorder
def record_audio(output_path="recorded_audio.wav"):
    """Capture microphone audio in the browser and persist it to a file.

    Renders the st_audio_recorder() widget and, once the user has
    recorded something, writes the returned bytes to *output_path*.

    Parameters
    ----------
    output_path : str, optional
        Destination file for the recording. Defaults to
        "recorded_audio.wav", the value previously hard-coded.

    Returns
    -------
    str or None
        Path to the saved audio file, or None when no audio has been
        captured yet (the widget returns a falsy value until the user
        finishes a recording — NOTE(review): confirm against the
        streamlit_audio_recorder API, which is not visible here).
    """
    st.write("Click below to record your audio:")
    audio_bytes = st_audio_recorder()
    if not audio_bytes:
        # Widget has not produced a recording yet — signal "nothing to do".
        return None
    with open(output_path, "wb") as f:
        f.write(audio_bytes)
    st.success("Audio recorded successfully!")
    return output_path
67
+
68
+ # Transcribe audio using Groq Whisper
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
69
  def transcribe_audio(file_path):
70
+ """Transcribe audio using Groq's Whisper model."""
71
  with open(file_path, "rb") as file:
72
  transcription = groq_client.audio.transcriptions.create(
73
  file=(file_path, file.read()),
 
99
 
100
  # Audio Input Mode
101
  elif input_method == "Audio Input":
102
+ audio_file = record_audio()
103
+ if audio_file:
104
+ st.audio(audio_file, format="audio/wav")
 
 
105
  st.write("Transcribing audio...")
106
  transcription = transcribe_audio(audio_file)
107
  st.write(f"**You said:** {transcription}")
108
 
 
109
  with st.spinner("Generating response..."):
110
  response = chain({"question": transcription})["answer"]
111
  st.write(f"**Response:** {response}")