Spaces:

jaafarhh
/

DarijaTherapy

Sleeping

App Files Community

jaafarhh committed on Dec 1, 2024

Commit

09618ca

verified ·

1 Parent(s): 719f101

Update app.py

Browse files

Files changed (1) hide show

app.py +33 -22

app.py CHANGED Viewed

@@ -4,19 +4,19 @@ import torchaudio
 import soundfile as sf
 from pathlib import Path
 from transformers import pipeline, AutoTokenizer
 from langchain.memory import ConversationBufferMemory
 from langchain.chains import ConversationalRetrievalChain
-from langchain_community.llms import HuggingFaceHub
-from langchain_community.embeddings import HuggingFaceEmbeddings
 from langchain_community.vectorstores import FAISS
-from langchain_core.prompts import PromptTemplate
 import os
 from dotenv import load_dotenv
 # Load environment variables
 load_dotenv()
-# CSS remains the same
 css = """
 <style>
 .chat-message { padding: 1.5rem; border-radius: 0.5rem; margin-bottom: 1rem; display: flex; }
@@ -27,17 +27,20 @@ css = """
 </style>
 """
-# Updated prompt template with correct variables
 PROMPT_TEMPLATE = """
 You are a professional therapist who speaks Moroccan Arabic (Darija).
 Respond with empathy and use therapeutic techniques.
 Always respond in Darija unless specifically asked to use another language.
-Context: {context}
-Chat History: {chat_history}
-Current Question: {question}
-Therapeutic response:
 """
 class DarijaTherapist:
@@ -48,8 +51,8 @@ class DarijaTherapist:
     def setup_models(self):
         try:
             tokenizer = AutoTokenizer.from_pretrained("facebook/seamless-m4t-v2-large")
             self.device = "cuda" if torch.cuda.is_available() else "cpu"
             self.asr_pipe = pipeline(
                 "automatic-speech-recognition",
@@ -58,17 +61,25 @@ class DarijaTherapist:
                 device=self.device
             )
-            self.llm = HuggingFaceHub(
-                repo_id="MBZUAI-Paris/Atlas-Chat-9B",
-                model_kwargs={"temperature": 0.7, "max_length": 512, "torch_dtype": torch.bfloat16, "do_sample": True},
-                device="cuda",
                 huggingfacehub_api_token=os.getenv("HUGGINGFACE_API_TOKEN")
             )
-            self.embeddings = HuggingFaceEmbeddings(
-                model_name="sentence-transformers/all-mpnet-base-v2"
             )
             self.vectorstore = FAISS.from_texts(
                 ["Initial therapeutic context"],
                 self.embeddings
@@ -76,14 +87,13 @@ class DarijaTherapist:
         except Exception as e:
             st.error(f"Error setting up models: {str(e)}")
             st.stop()
     def setup_memory(self):
         self.memory = ConversationBufferMemory(
             memory_key="chat_history",
             return_messages=True
         )
-        # Updated chain creation with correct prompt
         qa_prompt = PromptTemplate(
             template=PROMPT_TEMPLATE,
             input_variables=["context", "chat_history", "question"]
@@ -94,11 +104,9 @@ class DarijaTherapist:
             retriever=self.vectorstore.as_retriever(),
             memory=self.memory,
             combine_docs_chain_kwargs={"prompt": qa_prompt},
-            return_source_documents=True,
-            chain_type="stuff"
         )
-    # Rest of the methods remain the same
     def initialize_session_state(self):
         if "messages" not in st.session_state:
             st.session_state.messages = []
@@ -138,7 +146,10 @@ class DarijaTherapist:
     def get_ai_response(self, user_input):
         try:
-            response = self.conversation_chain({"question": user_input})
             return response['answer']
         except Exception as e:
             st.error(f"Error getting AI response: {str(e)}")

 import soundfile as sf
 from pathlib import Path
 from transformers import pipeline, AutoTokenizer
+from langchain_community.llms import HuggingFaceEndpoint
+from langchain_community.embeddings import HuggingFaceBgeEmbeddings
 from langchain.memory import ConversationBufferMemory
 from langchain.chains import ConversationalRetrievalChain
 from langchain_community.vectorstores import FAISS
+from langchain.prompts import PromptTemplate
 import os
 from dotenv import load_dotenv
 # Load environment variables
 load_dotenv()
+# CSS styling
 css = """
 <style>
 .chat-message { padding: 1.5rem; border-radius: 0.5rem; margin-bottom: 1rem; display: flex; }
 </style>
 """
+# Prompt template
 PROMPT_TEMPLATE = """
 You are a professional therapist who speaks Moroccan Arabic (Darija).
 Respond with empathy and use therapeutic techniques.
 Always respond in Darija unless specifically asked to use another language.
+Previous conversation:
+{chat_history}
+User message: {question}
+Additional context: {context}
+Therapeutic response in Darija:
 """
 class DarijaTherapist:
     def setup_models(self):
         try:
+            # Speech recognition setup
             tokenizer = AutoTokenizer.from_pretrained("facebook/seamless-m4t-v2-large")
             self.device = "cuda" if torch.cuda.is_available() else "cpu"
             self.asr_pipe = pipeline(
                 "automatic-speech-recognition",
                 device=self.device
             )
+            # LLM setup
+            self.llm = HuggingFaceEndpoint(
+                endpoint_url="https://api-inference.huggingface.co/models/MBZUAI-Paris/Atlas-Chat-9B",
+                task="text-generation",
+                model_kwargs={
+                    "temperature": 0.7,
+                    "max_length": 512,
+                    "do_sample": True,
+                    "return_full_text": False
+                },
                 huggingfacehub_api_token=os.getenv("HUGGINGFACE_API_TOKEN")
             )
+            # Embeddings setup
+            self.embeddings = HuggingFaceBgeEmbeddings(
+                model_name="BAAI/bge-large-en"
             )
+            # Vector store setup
             self.vectorstore = FAISS.from_texts(
                 ["Initial therapeutic context"],
                 self.embeddings
         except Exception as e:
             st.error(f"Error setting up models: {str(e)}")
             st.stop()
     def setup_memory(self):
         self.memory = ConversationBufferMemory(
             memory_key="chat_history",
             return_messages=True
         )
         qa_prompt = PromptTemplate(
             template=PROMPT_TEMPLATE,
             input_variables=["context", "chat_history", "question"]
             retriever=self.vectorstore.as_retriever(),
             memory=self.memory,
             combine_docs_chain_kwargs={"prompt": qa_prompt},
+            return_source_documents=True
         )
     def initialize_session_state(self):
         if "messages" not in st.session_state:
             st.session_state.messages = []
     def get_ai_response(self, user_input):
         try:
+            response = self.conversation_chain({
+                "question": user_input,
+                "chat_history": self.memory.chat_memory.messages
+            })
             return response['answer']
         except Exception as e:
             st.error(f"Error getting AI response: {str(e)}")