AK1239 committed on
Commit
18e2f64
·
1 Parent(s): 86e2f15

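Added debugging logs for the retrieved context; also reduced the default chunk_size from 750 to 500 and raised the default top_k from 3 to 5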

Browse files
Files changed (1) hide show
  1. app/main.py +8 -2
app/main.py CHANGED
@@ -140,7 +140,7 @@ def extract_text_from_pdf(pdf_path):
140
 
141
  return text.strip()
142
 
143
- def split_text_into_chunks(text, source_file, chunk_size=750, overlap=50):
144
  # Clean the text
145
  text = text.strip().replace('\n', ' ').replace(' ', ' ')
146
 
@@ -202,7 +202,7 @@ def create_faiss_index(texts, embedding_model):
202
  index.add(np.array(doc_embeddings))
203
  return index
204
 
205
- def retrieve_documents(query, index, embedding_model, documents, top_k=3):
206
  query_lower = query.lower()
207
  target_topic = None
208
 
@@ -270,6 +270,12 @@ def generate_response_with_rag(prompt, index, embedding_model, documents, settin
270
  # Retrieve relevant documents
271
  retrieved_context = retrieve_documents(prompt, index, embedding_model, documents)
272
 
 
 
 
 
 
 
273
  style_instructions = {
274
  "simple": "Toa majibu rahisi na yanayoeleweka kwa urahisi, ukitumia maneno ya kawaida na sentensi fupi. Eleza dhana kama vile unazungumza na mwanafunzi mdogo.",
275
  "creative": "Toa majibu ya kubunifu na yanayovutia, ukitumia mifano halisi na michoro ili kufanya maudhui yawe ya kuvutia na kukumbukika zaidi.",
 
140
 
141
  return text.strip()
142
 
143
+ def split_text_into_chunks(text, source_file, chunk_size=500, overlap=50):
144
  # Clean the text
145
  text = text.strip().replace('\n', ' ').replace(' ', ' ')
146
 
 
202
  index.add(np.array(doc_embeddings))
203
  return index
204
 
205
+ def retrieve_documents(query, index, embedding_model, documents, top_k=5):
206
  query_lower = query.lower()
207
  target_topic = None
208
 
 
270
  # Retrieve relevant documents
271
  retrieved_context = retrieve_documents(prompt, index, embedding_model, documents)
272
 
273
+ # Log the retrieved context
274
+ logger.info("Context sent to model:")
275
+ logger.info("-" * 50)
276
+ logger.info(retrieved_context)
277
+ logger.info("-" * 50)
278
+
279
  style_instructions = {
280
  "simple": "Toa majibu rahisi na yanayoeleweka kwa urahisi, ukitumia maneno ya kawaida na sentensi fupi. Eleza dhana kama vile unazungumza na mwanafunzi mdogo.",
281
  "creative": "Toa majibu ya kubunifu na yanayovutia, ukitumia mifano halisi na michoro ili kufanya maudhui yawe ya kuvutia na kukumbukika zaidi.",