veerukhannan committed on
Commit
a53e1b6
·
verified ·
1 Parent(s): 38dd749

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +50 -18
app.py CHANGED
@@ -8,6 +8,7 @@ from astrapy.db import AstraDB
8
  from dotenv import load_dotenv
9
  from huggingface_hub import login
10
  from sentence_transformers import SentenceTransformer
 
11
 
12
  # Load environment variables
13
  load_dotenv()
@@ -68,16 +69,45 @@ class LegalTextSearchBot:
68
  # Generate embedding for the query
69
  query_embedding = self.embedding_model.encode(query).tolist()
70
 
71
- # Perform vector search in AstraDB
72
- results = self.collection.vector_find(
73
  query_embedding,
74
- limit=5
75
- )
76
- return list(results)
 
 
 
 
 
 
 
 
 
 
77
  except Exception as e:
78
  print(f"Error searching AstraDB: {str(e)}")
79
  return []
80
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
81
  def search_sections(self, query: str) -> Tuple[str, str]:
82
  """Search legal sections and return both raw results and AI interpretation"""
83
  try:
@@ -85,24 +115,24 @@ class LegalTextSearchBot:
85
  search_results = self._search_astra(query)
86
 
87
  if not search_results:
88
- return "No relevant sections found.", ""
89
 
90
  # Format raw results
91
  raw_results = []
 
 
92
  for result in search_results:
93
- section_info = f"""
94
- Section {result.get('section_number')}: {result.get('title')}
95
- Chapter: {result.get('chapter_info', {}).get('title', 'N/A')}
96
-
97
- Content:
98
- {result.get('content', 'N/A')}
99
 
100
- {"="*80}
101
- """
102
- raw_results.append(section_info)
 
 
103
 
104
- # Combine relevant content for AI interpretation
105
- context = "\n\n".join([result.get('content', '') for result in search_results])
106
 
107
  # Generate AI interpretation
108
  chain = self.prompt | self.llm
@@ -117,7 +147,9 @@ class LegalTextSearchBot:
117
  return "\n".join(raw_results), ai_response
118
 
119
  except Exception as e:
120
- return f"Error processing query: {str(e)}", ""
 
 
121
 
122
  def create_interface():
123
  """Create the Gradio interface"""
 
8
  from dotenv import load_dotenv
9
  from huggingface_hub import login
10
  from sentence_transformers import SentenceTransformer
11
+ import json
12
 
13
  # Load environment variables
14
  load_dotenv()
 
69
  # Generate embedding for the query
70
  query_embedding = self.embedding_model.encode(query).tolist()
71
 
72
+ # First try searching in searchable_text
73
+ results = list(self.collection.vector_find(
74
  query_embedding,
75
+ limit=5,
76
+ fields=["section_number", "title", "chapter_info", "content", "searchable_text"]
77
+ ))
78
+
79
+ if not results:
80
+ # If no results, try a more general search
81
+ results = list(self.collection.find(
82
+ {},
83
+ limit=5
84
+ ))
85
+
86
+ return results
87
+
88
  except Exception as e:
89
  print(f"Error searching AstraDB: {str(e)}")
90
  return []
91
 
92
+ def format_section(self, section: Dict) -> str:
93
+ """Format a section for display"""
94
+ try:
95
+ chapter_info = section.get('chapter_info', {})
96
+ chapter_title = chapter_info.get('title', 'N/A') if isinstance(chapter_info, dict) else 'N/A'
97
+
98
+ return f"""
99
+ Section {section.get('section_number', 'N/A')}: {section.get('title', 'N/A')}
100
+ Chapter: {chapter_title}
101
+
102
+ Content:
103
+ {section.get('content', 'N/A')}
104
+
105
+ {"="*80}
106
+ """
107
+ except Exception as e:
108
+ print(f"Error formatting section: {str(e)}")
109
+ return str(section)
110
+
111
  def search_sections(self, query: str) -> Tuple[str, str]:
112
  """Search legal sections and return both raw results and AI interpretation"""
113
  try:
 
115
  search_results = self._search_astra(query)
116
 
117
  if not search_results:
118
+ return "No relevant sections found.", "I apologize, but I cannot find relevant sections in the database."
119
 
120
  # Format raw results
121
  raw_results = []
122
+ context_parts = []
123
+
124
  for result in search_results:
125
+ # Format for display
126
+ raw_results.append(self.format_section(result))
 
 
 
 
127
 
128
+ # Add to context for AI
129
+ context_parts.append(f"""
130
+ Section {result.get('section_number')}: {result.get('title')}
131
+ {result.get('content', '')}
132
+ """)
133
 
134
+ # Combine context for AI
135
+ context = "\n\n".join(context_parts)
136
 
137
  # Generate AI interpretation
138
  chain = self.prompt | self.llm
 
147
  return "\n".join(raw_results), ai_response
148
 
149
  except Exception as e:
150
+ error_msg = f"Error processing query: {str(e)}"
151
+ print(error_msg)
152
+ return error_msg, "An error occurred while processing your query."
153
 
154
  def create_interface():
155
  """Create the Gradio interface"""