whatsthispdf02

Running

mitulagr2 committed on Jun 6, 2024

Commit

ffe1a73

1 Parent(s): da60393

Update to phi3:mini

Files changed (2) hide show

app/rag.py CHANGED Viewed

@@ -15,11 +15,11 @@ class ChatPDF:
     chain = None
     def __init__(self):
-        self.model = ChatOllama(model="gemma:2b")
         self.text_splitter = RecursiveCharacterTextSplitter(chunk_size=128, chunk_overlap=8)
         self.prompt = PromptTemplate.from_template(
             """
-            <s> [INST] Use the pieces of context to answer the question concisely.[/INST] </s>
             [INST] Question: {question}
             Context: {context}
             Answer: [/INST]
@@ -35,7 +35,7 @@ class ChatPDF:
         self.retriever = vector_store.as_retriever(
             search_type="similarity_score_threshold",
             search_kwargs={
-                "k": 56,
                 "score_threshold": 0.5,
             },
         )

     chain = None
     def __init__(self):
+        self.model = ChatOllama(model="phi3:mini")
         self.text_splitter = RecursiveCharacterTextSplitter(chunk_size=128, chunk_overlap=8)
         self.prompt = PromptTemplate.from_template(
             """
+            <s> [INST] Use the context to answer the question.[/INST] </s>
             [INST] Question: {question}
             Context: {context}
             Answer: [/INST]
         self.retriever = vector_store.as_retriever(
             search_type="similarity_score_threshold",
             search_kwargs={
+                "k": 24,
                 "score_threshold": 0.5,
             },
         )

start_service.sh CHANGED Viewed

@@ -7,7 +7,7 @@ ollama serve &
 sleep 5
 # Pull and run <YOUR_MODEL_NAME>
-ollama pull gemma:2b
 #
 fastapi run /code/app/main.py --port 7860

 sleep 5
 # Pull and run <YOUR_MODEL_NAME>
+ollama pull phi3:mini
 #
 fastapi run /code/app/main.py --port 7860