Added debugging logs for context
Browse files
- app/main.py +8 -2
app/main.py
CHANGED
@@ -140,7 +140,7 @@ def extract_text_from_pdf(pdf_path):
|
|
140 |
|
141 |
return text.strip()
|
142 |
|
143 |
-
def split_text_into_chunks(text, source_file, chunk_size=
|
144 |
# Clean the text
|
145 |
text = text.strip().replace('\n', ' ').replace(' ', ' ')
|
146 |
|
@@ -202,7 +202,7 @@ def create_faiss_index(texts, embedding_model):
|
|
202 |
index.add(np.array(doc_embeddings))
|
203 |
return index
|
204 |
|
205 |
-
def retrieve_documents(query, index, embedding_model, documents, top_k=
|
206 |
query_lower = query.lower()
|
207 |
target_topic = None
|
208 |
|
@@ -270,6 +270,12 @@ def generate_response_with_rag(prompt, index, embedding_model, documents, settin
|
|
270 |
# Retrieve relevant documents
|
271 |
retrieved_context = retrieve_documents(prompt, index, embedding_model, documents)
|
272 |
|
|
|
|
|
|
|
|
|
|
|
|
|
273 |
style_instructions = {
|
274 |
"simple": "Toa majibu rahisi na yanayoeleweka kwa urahisi, ukitumia maneno ya kawaida na sentensi fupi. Eleza dhana kama vile unazungumza na mwanafunzi mdogo.",
|
275 |
"creative": "Toa majibu ya kubunifu na yanayovutia, ukitumia mifano halisi na michoro ili kufanya maudhui yawe ya kuvutia na kukumbukika zaidi.",
|
|
|
140 |
|
141 |
return text.strip()
|
142 |
|
143 |
+
def split_text_into_chunks(text, source_file, chunk_size=500, overlap=50):
|
144 |
# Clean the text
|
145 |
text = text.strip().replace('\n', ' ').replace(' ', ' ')
|
146 |
|
|
|
202 |
index.add(np.array(doc_embeddings))
|
203 |
return index
|
204 |
|
205 |
+
def retrieve_documents(query, index, embedding_model, documents, top_k=5):
|
206 |
query_lower = query.lower()
|
207 |
target_topic = None
|
208 |
|
|
|
270 |
# Retrieve relevant documents
|
271 |
retrieved_context = retrieve_documents(prompt, index, embedding_model, documents)
|
272 |
|
273 |
+
# Log the retrieved context
|
274 |
+
logger.info("Context sent to model:")
|
275 |
+
logger.info("-" * 50)
|
276 |
+
logger.info(retrieved_context)
|
277 |
+
logger.info("-" * 50)
|
278 |
+
|
279 |
style_instructions = {
|
280 |
"simple": "Toa majibu rahisi na yanayoeleweka kwa urahisi, ukitumia maneno ya kawaida na sentensi fupi. Eleza dhana kama vile unazungumza na mwanafunzi mdogo.",
|
281 |
"creative": "Toa majibu ya kubunifu na yanayovutia, ukitumia mifano halisi na michoro ili kufanya maudhui yawe ya kuvutia na kukumbukika zaidi.",
|