radarbackend11262024v11

Runtime error

App Files Community

Pijush2023 committed on Sep 15, 2024

Commit

b773d17

verified ·

1 Parent(s): 87009cb

Update app.py

Browse files

Files changed (1) hide show

app.py +12 -58

app.py CHANGED Viewed

@@ -576,58 +576,13 @@ import re
 import re
-# def clean_response(response_text):
-#     # Remove system and user tags
-#     response_text = re.sub(r'<\|system\|>.*?<\|end\|>', '', response_text, flags=re.DOTALL)
-#     response_text = re.sub(r'<\|user\|>.*?<\|end\|>', '', response_text, flags=re.DOTALL)
-#     response_text = re.sub(r'<\|assistant\|>', '', response_text, flags=re.DOTALL)
-#     # Extract the document name and page number from updated pattern
-#     document_match = re.search(r"Document\(metadata=\{'source': '(.+?)', 'page': (\d+)\}", response_text)
-#     if document_match:
-#         document_name = document_match.group(1).split('/')[-1]  # Get the document name
-#         page_number = document_match.group(2)  # Get the page number
-#     else:
-#         document_name = "Unknown"
-#         page_number = "Unknown"
-#     # Remove the entire 'Document(metadata=...' and any mention of it from the response
-#     response_text = re.sub(r'Document\(metadata=\{.*?\},page_content=', '', response_text, flags=re.DOTALL)
-#     # Remove any mention of "Document:" in the response
-#     response_text = re.sub(r'- Document:.*', '', response_text)
-#     # Remove any unwanted escape characters like \u and \u00
-#     response_text = re.sub(r'\\u[0-9A-Fa-f]{4}', '', response_text)
-#     # Ensure proper spacing between words and dates
-#     response_text = re.sub(r'([a-zA-Z])(\d)', r'\1 \2', response_text)
-#     response_text = re.sub(r'(\d)([a-zA-Z])', r'\1 \2', response_text)
-#     # Remove the phrase "Sure! The Responses are as follows:" from the actual content
-#     response_text = re.sub(r'Sure! The Responses are as follows:', '', response_text).strip()
-#     # Clean up the text by removing extra whitespace
-#     cleaned_response = re.sub(r'\s+', ' ', response_text).strip()
-#     # Format the final response with bullet points
-#     final_response = f"""
-# Sure! Here is the response for your Query:
-# • Document name - {document_name}
-# • Page No - {page_number}
-# • Responses - {cleaned_response}
-# """
-#     return final_response
 def clean_response(response_text):
     # Remove system and user tags
     response_text = re.sub(r'<\|system\|>.*?<\|end\|>', '', response_text, flags=re.DOTALL)
     response_text = re.sub(r'<\|user\|>.*?<\|end\|>', '', response_text, flags=re.DOTALL)
     response_text = re.sub(r'<\|assistant\|>', '', response_text, flags=re.DOTALL)
-    # Extract the document name and page number
     document_match = re.search(r"Document\(metadata=\{'source': '(.+?)', 'page': (\d+)\}", response_text)
     if document_match:
@@ -639,9 +594,9 @@ def clean_response(response_text):
     # Remove the entire 'Document(metadata=...' and any mention of it from the response
     response_text = re.sub(r'Document\(metadata=\{.*?\},page_content=', '', response_text, flags=re.DOTALL)
-    # Extract top 5 fetched results (assuming the top 5 results are the first 5 lines of content)
-    top_results = response_text.split('\n')[:5]  # Adjust this as per your actual data structure
     # Remove any unwanted escape characters like \u and \u00
     response_text = re.sub(r'\\u[0-9A-Fa-f]{4}', '', response_text)
@@ -657,15 +612,12 @@ def clean_response(response_text):
     cleaned_response = re.sub(r'\s+', ' ', response_text).strip()
     # Format the final response with bullet points
-    top_five_formatted = ''.join([f'{i+1}. {result.strip()}\n' for i, result in enumerate(top_results)])
-    final_response = (
-        f"Sure! Here is the response for your Query:\n"
-        f"• Document name - {document_name}\n"
-        f"• Page No - {page_number}\n"
-        f"• Top 5 Fetched Results:\n{top_five_formatted}"
-        f"• Actual Response - {cleaned_response}"
-    )
     return final_response
@@ -676,6 +628,8 @@ def clean_response(response_text):
 # Define a new template specifically for GPT-4o-mini in VDB Details mode
 gpt4o_mini_template_details = f"""
 As a highly specialized assistant, I provide precise, detailed, and informative responses. On this bright day of {current_date}, I'm equipped to assist with all your queries about Birmingham, Alabama, offering detailed insights tailored to your needs.

 import re
 def clean_response(response_text):
     # Remove system and user tags
     response_text = re.sub(r'<\|system\|>.*?<\|end\|>', '', response_text, flags=re.DOTALL)
     response_text = re.sub(r'<\|user\|>.*?<\|end\|>', '', response_text, flags=re.DOTALL)
     response_text = re.sub(r'<\|assistant\|>', '', response_text, flags=re.DOTALL)
+    # Extract the document name and page number from updated pattern
     document_match = re.search(r"Document\(metadata=\{'source': '(.+?)', 'page': (\d+)\}", response_text)
     if document_match:
     # Remove the entire 'Document(metadata=...' and any mention of it from the response
     response_text = re.sub(r'Document\(metadata=\{.*?\},page_content=', '', response_text, flags=re.DOTALL)
+    # Remove any mention of "Document:" in the response
+    response_text = re.sub(r'- Document:.*', '', response_text)
     # Remove any unwanted escape characters like \u and \u00
     response_text = re.sub(r'\\u[0-9A-Fa-f]{4}', '', response_text)
     cleaned_response = re.sub(r'\s+', ' ', response_text).strip()
     # Format the final response with bullet points
+    final_response = f"""
+Sure! Here is the response for your Query:
+• Document name - {document_name}
+• Page No - {page_number}
+• Responses - {cleaned_response}
+"""
     return final_response
 # Define a new template specifically for GPT-4o-mini in VDB Details mode
 gpt4o_mini_template_details = f"""
 As a highly specialized assistant, I provide precise, detailed, and informative responses. On this bright day of {current_date}, I'm equipped to assist with all your queries about Birmingham, Alabama, offering detailed insights tailored to your needs.