Spaces:

MaryamKarimi080
/

SCR_Course_ChatBot

Paused

App Files Files Community

MaryamKarimi080 committed 14 days ago

Commit

6ca7edb

verified ·

1 Parent(s): 18a6316

Update scripts/rag_chat.py

Browse files

Files changed (1) hide show

scripts/rag_chat.py +42 -36

scripts/rag_chat.py CHANGED Viewed

@@ -1,36 +1,42 @@
-from langchain.chains import RetrievalQA
-from langchain_openai import ChatOpenAI
-from langchain_chroma import Chroma
-from langchain_openai import OpenAIEmbeddings
-from langchain.prompts import PromptTemplate
-from pathlib import Path
-# Project root: the parent of the directory that contains this file (scripts/).
-BASE_DIR = Path(__file__).resolve().parent.parent
-# Directory handed to Chroma as persist_directory; stored as a plain string.
-DB_DIR = str(BASE_DIR / "db")
-def build_general_qa_chain(model_name=None):
-    """Assemble a RetrievalQA chain over the Chroma store persisted at DB_DIR.
-
-    Args:
-        model_name: Chat model to use; "gpt-4o-mini" is used when this is
-            None or empty.
-
-    Returns:
-        A RetrievalQA chain that fetches 4 documents per query (k=4) and
-        returns the source documents together with the answer.
-    """
-    store = Chroma(
-        persist_directory=DB_DIR,
-        embedding_function=OpenAIEmbeddings(model="text-embedding-3-small"),
-    )
-    # Prompt asks the model to cite course-material sources at the end.
-    qa_prompt = PromptTemplate(
-        input_variables=["context", "question"],
-        template="""Use the following context to answer the question.
-    If the answer isn't found in the context, use your general knowledge but say so.
-    Always cite your sources at the end with 'Source: <filename>' when using course materials.
-    Context: {context}
-    Question: {question}
-    Helpful Answer:""",
-    )
-    chat_model = ChatOpenAI(model_name=model_name or "gpt-4o-mini", temperature=0.0)
-    doc_retriever = store.as_retriever(search_kwargs={"k": 4})
-    return RetrievalQA.from_chain_type(
-        llm=chat_model,
-        retriever=doc_retriever,
-        chain_type_kwargs={"prompt": qa_prompt},
-        return_source_documents=True,
-    )

+import os
+from pathlib import Path
+from langchain.chains import RetrievalQA
+from langchain_openai import ChatOpenAI, OpenAIEmbeddings
+from langchain_chroma import Chroma
+from langchain.prompts import PromptTemplate
+# Project root: the parent of the directory that contains this file (scripts/).
+BASE_DIR = Path(__file__).resolve().parent.parent
+# Vector-store directory, kept as a Path so filesystem checks can be made on it;
+# it is converted with str() when handed to Chroma.
+DB_DIR = BASE_DIR / "db"
+def build_general_qa_chain(model_name=None):
+    """Build a RetrievalQA chain backed by the Chroma store under DB_DIR.
+
+    When DB_DIR is missing, is not a directory, or is an empty directory,
+    the vector store is built first by calling load_documents.main(),
+    chunk_and_embed.main() and setup_vectorstore.main() from the scripts
+    package, in that order.
+
+    Args:
+        model_name: Chat model to use; "gpt-4o-mini" is used when this is
+            None or empty.
+
+    Returns:
+        A RetrievalQA chain that fetches 4 documents per query (k=4) and
+        returns the source documents together with the answer.
+    """
+    # An existing but empty directory (e.g. left behind by an interrupted
+    # build) holds no index, so it is treated like a missing one instead of
+    # silently skipping the build.
+    db_missing = not DB_DIR.is_dir() or not any(DB_DIR.iterdir())
+    if db_missing:
+        print("📦 No DB found. Building vectorstore...")
+        # Function-scope import: these modules are only loaded when a rebuild
+        # is actually required.
+        from scripts import load_documents, chunk_and_embed, setup_vectorstore
+        load_documents.main()
+        chunk_and_embed.main()
+        setup_vectorstore.main()
+    embedding = OpenAIEmbeddings(model="text-embedding-3-small")
+    vectorstore = Chroma(persist_directory=str(DB_DIR), embedding_function=embedding)
+    # NOTE: the continuation lines of this literal carry their leading
+    # indentation into the prompt text; kept as-is to leave the prompt unchanged.
+    template = """Use the following context to answer the question.
+    If the answer isn't found in the context, use your general knowledge but say so.
+    Always cite your sources at the end with 'Source: <filename>' when using course materials.
+    Context: {context}
+    Question: {question}
+    Helpful Answer:"""
+    QA_PROMPT = PromptTemplate(
+        template=template,
+        input_variables=["context", "question"]
+    )
+    # temperature=0.0 is passed to the chat model alongside the model name.
+    llm = ChatOpenAI(model_name=model_name or "gpt-4o-mini", temperature=0.0)
+    qa_chain = RetrievalQA.from_chain_type(
+        llm=llm,
+        retriever=vectorstore.as_retriever(search_kwargs={"k": 4}),
+        chain_type_kwargs={"prompt": QA_PROMPT},
+        return_source_documents=True
+    )
+    return qa_chain