Spaces:

Poojashetty357
/

RAG-Bot

Sleeping

App Files Community

Poojashetty357 committed on Jun 2

Commit

e772da6

verified ·

1 Parent(s): 2d85011

Update app.py

Browse files

Files changed (1) hide show

app.py +22 -14

app.py CHANGED Viewed

@@ -1,20 +1,28 @@
 import gradio as gr
-from llama_index.core import VectorStoreIndex, SimpleDirectoryReader
 import os
-# Load and index Paul Graham documents
-pg_docs = SimpleDirectoryReader("data/paul").load_data()
-pg_docs = [doc for doc in pg_docs if doc.text and doc.text.strip()]
-pg_index = VectorStoreIndex.from_documents(pg_docs)
 pg_engine = pg_index.as_query_engine()
-# Load and index Insurance documents
-ins_docs = SimpleDirectoryReader("data/insurance").load_data()
-ins_docs = [doc for doc in ins_docs if doc.text and doc.text.strip()]
-ins_index = VectorStoreIndex.from_documents(ins_docs)
 ins_engine = ins_index.as_query_engine()
-# Query functions with input validation
 def query_pg(query):
     if not query.strip():
         return "❌ Please enter a valid question before submitting."
@@ -31,7 +39,7 @@ def query_ins(query):
     except Exception as e:
         return f"❌ Error: {str(e)}"
-# Predefined questions
 paul_questions = [
     "What is the main purpose of writing, according to Paul Graham?",
     "Why do students often struggle with writing in school?",
@@ -48,7 +56,7 @@ insurance_questions = [
     "What should you check before buying insurance?"
 ]
-# UI
 def launch_interface():
     with gr.Blocks(
         title="RAG App",
@@ -65,7 +73,7 @@ def launch_interface():
         gr.Markdown("""
             <div id='header-text'>
-                <h1>RAG Bot with LlamaIndex</h1>
             </div>
         """)
@@ -116,4 +124,4 @@ def launch_interface():
     demo.launch()
 if __name__ == "__main__":
-    launch_interface()

 import gradio as gr
 import os
+from llama_index.core import VectorStoreIndex, SimpleDirectoryReader, ServiceContext
+from llama_index.embeddings.huggingface import HuggingFaceEmbedding
+# ✅ Use Hugging Face embedding model
+embed_model = HuggingFaceEmbedding(model_name="sentence-transformers/all-MiniLM-L6-v2")
+service_context = ServiceContext.from_defaults(embed_model=embed_model)
+# ✅ Helper to load and filter documents
+def load_filtered_docs(folder):
+    docs = SimpleDirectoryReader(folder).load_data()
+    return [doc for doc in docs if doc.text and doc.text.strip()]
+# ✅ Load and index Paul Graham documents
+pg_docs = load_filtered_docs("data/paul")
+pg_index = VectorStoreIndex.from_documents(pg_docs, service_context=service_context)
 pg_engine = pg_index.as_query_engine()
+# ✅ Load and index Insurance documents (PDF included)
+ins_docs = load_filtered_docs("data/insurance")
+ins_index = VectorStoreIndex.from_documents(ins_docs, service_context=service_context)
 ins_engine = ins_index.as_query_engine()
+# ✅ Query functions
 def query_pg(query):
     if not query.strip():
         return "❌ Please enter a valid question before submitting."
     except Exception as e:
         return f"❌ Error: {str(e)}"
+# ✅ Predefined questions
 paul_questions = [
     "What is the main purpose of writing, according to Paul Graham?",
     "Why do students often struggle with writing in school?",
     "What should you check before buying insurance?"
 ]
+# ✅ Gradio Interface
 def launch_interface():
     with gr.Blocks(
         title="RAG App",
         gr.Markdown("""
             <div id='header-text'>
+                <h1>RAG Bot with LlamaIndex (PDF + TXT)</h1>
             </div>
         """)
     demo.launch()
 if __name__ == "__main__":
+    launch_interface()