Spaces:

stephaniek791
/

RAG_PEDIATRICS

Paused

Stéphanie Kamgnia Wonkap committed on Nov 12, 2024

Commit

4a793d8

1 Parent(s): 0a78a57

fixing main

Files changed (1) hide show

app.py CHANGED Viewed

@@ -67,7 +67,7 @@ def main():
     embedding_model=init_embedding_model(EMBEDDING_MODEL_NAME)
     if os.path.exists(VECTORDB_PATH):
-        new_vector_store = FAISS.load_local(
             VECTORDB_PATH, embedding_model,
             allow_dangerous_deserialization=True)
     else:
@@ -78,11 +78,11 @@ def main():
     if st.button("Get Answer"):
     # Get the answer and relevant documents
         bnb_config = BitsAndBytesConfig(
-            load_in_8bit=True
-            #load_in_4bit=True,
-            #bnb_4bit_use_double_quant=True,
-            #bnb_4bit_quant_type="nf4",
-            #bnb_4bit_compute_dtype=torch.bfloat16,
         )
         model = AutoModelForCausalLM.from_pretrained(READER_MODEL_NAME, quantization_config=bnb_config,
             device_map = 'auto')

     embedding_model=init_embedding_model(EMBEDDING_MODEL_NAME)
     if os.path.exists(VECTORDB_PATH):
+        KNOWLEDGE_VECTOR_DATABASE = FAISS.load_local(
             VECTORDB_PATH, embedding_model,
             allow_dangerous_deserialization=True)
     else:
     if st.button("Get Answer"):
     # Get the answer and relevant documents
         bnb_config = BitsAndBytesConfig(
+            #load_in_8bit=True
+            load_in_4bit=True,
+            bnb_4bit_use_double_quant=True,
+            bnb_4bit_quant_type="nf4",
+            bnb_4bit_compute_dtype=torch.bfloat16,
         )
         model = AutoModelForCausalLM.from_pretrained(READER_MODEL_NAME, quantization_config=bnb_config,
             device_map = 'auto')