Spaces:

spark-ds549
/

LibRAG

Sleeping

Dephoh committed on Dec 10, 2024

Commit

16f0715

1 Parent(s): bfbadc3

moved vectorstore initialization outside of RAG

Files changed (2) hide show

RAG.py CHANGED Viewed

@@ -15,15 +15,15 @@ from typing import Dict, Any, Optional, List, Tuple
 import json
 import logging
-def retrieve(index_name: str, query: str, embeddings, k: int = 1000) -> Tuple[List[Document], List[float]]:
     start = time.time()
     load_dotenv()
-    pinecone_api_key = os.getenv("PINECONE_API_KEY")
-    pc = Pinecone(api_key=pinecone_api_key)
-    index = pc.Index(index_name)
-    vector_store = PineconeVectorStore(index=index, embedding=embeddings)
-    results = vector_store.similarity_search_with_score(
         query,
         k=k,
     )
@@ -118,7 +118,7 @@ def parse_xml_and_check(xml_string: str) -> str:
     return parsed_response.get('RESPONSE', "No response found in the output")
-def RAG(llm: Any, query: str, index_name: str, embeddings: Any, top: int = 10, k: int = 100) -> Tuple[str, List[Document]]:
     """Main RAG function with improved error handling and validation."""
     start = time.time()
     try:
@@ -154,7 +154,7 @@ def RAG(llm: Any, query: str, index_name: str, embeddings: Any, top: int = 10, k
         new_query = parse_xml_and_query(query=query,xml_string=query_response.content)
         print(f"New_Query: {new_query}")
-        retrieved, _ = retrieve(index_name=index_name, query=new_query, embeddings=embeddings, k=k)
         if not retrieved:
             return "No documents found for your query.", []

 import json
 import logging
+def retrieve(query: str,vectorstore:PineconeVectorStore, k: int = 1000) -> Tuple[List[Document], List[float]]:
     start = time.time()
     load_dotenv()
+    # pinecone_api_key = os.getenv("PINECONE_API_KEY")
+    # pc = Pinecone(api_key=pinecone_api_key)
+    # index = pc.Index(index_name)
+    # vector_store = PineconeVectorStore(index=index, embedding=embeddings)
+    results = vectorstore.similarity_search_with_score(
         query,
         k=k,
     )
     return parsed_response.get('RESPONSE', "No response found in the output")
+def RAG(llm: Any, query: str, index_name: str, embeddings: Any,vectorstore:PineconeVectorStore, top: int = 10, k: int = 100) -> Tuple[str, List[Document]]:
     """Main RAG function with improved error handling and validation."""
     start = time.time()
     try:
         new_query = parse_xml_and_query(query=query,xml_string=query_response.content)
         print(f"New_Query: {new_query}")
+        retrieved, _ = retrieve(query=new_query, vectorstore=vectorstore, k=k)
         if not retrieved:
             return "No documents found for your query.", []

streamlit_app.py CHANGED Viewed

@@ -50,7 +50,9 @@ def process_message(
     query: str,
     llm: ChatOpenAI,
     index_name: str,
-    embeddings: HuggingFaceEmbeddings
 ) -> Tuple[str, List]:
     """Process the user message using the RAG system."""
     try:
@@ -58,7 +60,8 @@ def process_message(
             query=query,
             llm=llm,
             index_name=index_name,
-            embeddings=embeddings
         )
         return response, sources
     except Exception as e:
@@ -89,6 +92,10 @@ def display_sources(sources: List) -> None:
 def main():
     st.title("RAG Chatbot")
     # Initialize session state
     if "messages" not in st.session_state:
         st.session_state.messages = []
@@ -99,8 +106,11 @@ def main():
         st.error("Failed to initialize the application. Please check the logs.")
         return
-    # Constants
-    INDEX_NAME = 'bpl-rag'
     # Display chat history
     for message in st.session_state.messages:
@@ -122,7 +132,8 @@ def main():
                     query=user_input,
                     llm=llm,
                     index_name=INDEX_NAME,
-                    embeddings=embeddings
                 )
                 if isinstance(response, str):

     query: str,
     llm: ChatOpenAI,
     index_name: str,
+    embeddings: HuggingFaceEmbeddings,
+    vectorstore: PineconeVectorStore,
 ) -> Tuple[str, List]:
     """Process the user message using the RAG system."""
     try:
             query=query,
             llm=llm,
             index_name=index_name,
+            embeddings=embeddings,
+            vectorstore=vectorstore,
         )
         return response, sources
     except Exception as e:
 def main():
     st.title("RAG Chatbot")
+    INDEX_NAME = 'bpl-rag'
+    pinecone_api_key = os.getenv("PINECONE_API_KEY")
     # Initialize session state
     if "messages" not in st.session_state:
         st.session_state.messages = []
         st.error("Failed to initialize the application. Please check the logs.")
         return
+    #initialize vectorstore
+    pc = Pinecone(api_key=pinecone_api_key)
+    index = pc.Index(INDEX_NAME)
+    vector_store = PineconeVectorStore(index=index, embedding=embeddings)
     # Display chat history
     for message in st.session_state.messages:
                     query=user_input,
                     llm=llm,
                     index_name=INDEX_NAME,
+                    embeddings=embeddings,
+                    vectorstore=vector_store
                 )
                 if isinstance(response, str):