Spaces:

NaimaAqeel
/

Chatbot

Runtime error

NaimaAqeel committed on Jun 4, 2024

Commit

cd89674

verified ·

1 Parent(s): e264586

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -76,7 +76,8 @@ else:
 def upload_files(files):
     global index, document_texts
     try:
-        for file_path in files:
             if file_path.endswith('.pdf'):
                 text = extract_text_from_pdf(file_path)
             elif file_path.endswith('.docx'):
@@ -84,9 +85,12 @@ def upload_files(files):
             else:
                 return "Unsupported file format"
             # Process the text and update FAISS index
             sentences = text.split("\n")
             embeddings = embedding_model.encode(sentences)
             index.add(np.array(embeddings))
             document_texts.append(text)
@@ -105,11 +109,15 @@ def upload_files(files):
 def query_text(text):
     try:
         # Encode the query text
         query_embedding = embedding_model.encode([text])
         # Search the FAISS index
         D, I = index.search(np.array(query_embedding), k=5)
         top_documents = []
         for idx in I[0]:
@@ -148,6 +156,7 @@ demo.launch()

 def upload_files(files):
     global index, document_texts
     try:
+        for file in files:
+            file_path = file.name  # Get the file path from the NamedString object
             if file_path.endswith('.pdf'):
                 text = extract_text_from_pdf(file_path)
             elif file_path.endswith('.docx'):
             else:
                 return "Unsupported file format"
+            print(f"Extracted text: {text[:100]}...")  # Debug: Show the first 100 characters of the extracted text
             # Process the text and update FAISS index
             sentences = text.split("\n")
             embeddings = embedding_model.encode(sentences)
+            print(f"Embeddings shape: {embeddings.shape}")  # Debug: Show the shape of the embeddings
             index.add(np.array(embeddings))
             document_texts.append(text)
 def query_text(text):
     try:
+        print(f"Query text: {text}")  # Debug: Show the query text
         # Encode the query text
         query_embedding = embedding_model.encode([text])
+        print(f"Query embedding shape: {query_embedding.shape}")  # Debug: Show the shape of the query embedding
         # Search the FAISS index
         D, I = index.search(np.array(query_embedding), k=5)
+        print(f"Distances: {D}, Indices: {I}")  # Debug: Show the distances and indices of the search results
         top_documents = []
         for idx in I[0]: