radarbackend11262024v11

Runtime error

App Files Files Community

Pijush2023 committed on Sep 13, 2024

Commit

a799bca

verified ·

1 Parent(s): 0df7f00

Update app.py

Browse files

Files changed (1) hide show

app.py +13 -55

app.py CHANGED Viewed

@@ -484,47 +484,7 @@ import re
 #     return cleaned_response
-# def clean_response(response_text):
-#     # Remove system and user tags
-#     response_text = re.sub(r'<\|system\|>.*?<\|end\|>', '', response_text, flags=re.DOTALL)
-#     response_text = re.sub(r'<\|user\|>.*?<\|end\|>', '', response_text, flags=re.DOTALL)
-#     response_text = re.sub(r'<\|assistant\|>', '', response_text, flags=re.DOTALL)
-#     # Extract the document name and page number
-#     document_match = re.search(r"Document\(metadata=\{'source':'(.+?)','page':(\d+)\}", response_text)
-#     if document_match:
-#         document_name = document_match.group(1).split('/')[-1]  # Get the document name
-#         page_number = document_match.group(2)  # Get the page number
-#     else:
-#         document_name = "Unknown"
-#         page_number = "Unknown"
-#     # Remove the 'Document(metadata=...' part and keep only the page content
-#     response_text = re.sub(r'Document\(metadata=\{.*?\},page_content=', '', response_text, flags=re.DOTALL)
-#     # Remove any unwanted escape characters like \u and \u00
-#     response_text = re.sub(r'\\u[0-9A-Fa-f]{4}', '', response_text)
-#     # Add spaces between words and dates (e.g., "born04/04/1963" becomes "born 04/04/1963")
-#     response_text = re.sub(r'([a-zA-Z])(\d)', r'\1 \2', response_text)
-#     response_text = re.sub(r'(\d)([a-zA-Z])', r'\1 \2', response_text)
-#     # Clean up the text by removing extra whitespace
-#     cleaned_response = response_text.strip()
-#     cleaned_response = re.sub(r'\s+', ' ', cleaned_response)
-#     # Ensure the response is conversational and organized
-#     cleaned_response = cleaned_response.replace('1.', '\n1.').replace('2.', '\n2.').replace('3.', '\n3.').replace('4.', '\n4.').replace('5.', '\n5.')
-#     # Return the cleaned response with the document name and page number
-#     final_response = f"""
-# Sure! The Responses are as follows:
-# Document name - {document_name}
-# Page No - {page_number}
-# Response - {cleaned_response}
-# """
-#     return final_response
 # def clean_response(response_text):
@@ -532,7 +492,7 @@ import re
 #     response_text = re.sub(r'<\|system\|>.*?<\|end\|>', '', response_text, flags=re.DOTALL)
 #     response_text = re.sub(r'<\|user\|>.*?<\|end\|>', '', response_text, flags=re.DOTALL)
 #     response_text = re.sub(r'<\|assistant\|>', '', response_text, flags=re.DOTALL)
 #     # Extract the document name and page number
 #     document_match = re.search(r"Document\(metadata=\{'source':'(.+?)','page':(\d+)\}", response_text)
 #     if document_match:
@@ -541,25 +501,24 @@ import re
 #     else:
 #         document_name = "Unknown"
 #         page_number = "Unknown"
 #     # Remove the 'Document(metadata=...' part and keep only the page content
 #     response_text = re.sub(r'Document\(metadata=\{.*?\},page_content=', '', response_text, flags=re.DOTALL)
 #     # Remove any unwanted escape characters like \u and \u00
 #     response_text = re.sub(r'\\u[0-9A-Fa-f]{4}', '', response_text)
-#     # Add spaces between words and dates (e.g., "born04/04/1963" becomes "born 04/04/1963")
 #     response_text = re.sub(r'([a-zA-Z])(\d)', r'\1 \2', response_text)
 #     response_text = re.sub(r'(\d)([a-zA-Z])', r'\1 \2', response_text)
-#     # Clean up the text by removing extra whitespace
-#     cleaned_response = response_text.strip()
-#     cleaned_response = re.sub(r'\s+', ' ', cleaned_response)
-#     # Ensure the response is conversational and organized by removing any prefixes like "Document:"
-#     cleaned_response = re.sub(r"^Sure! The Responses are as follows: - Document: \"", '', cleaned_response)
-#     # Return the cleaned response with bullet points
 #     final_response = f"""
 # Sure! The Responses are as follows:
 # • Document name - {document_name}
@@ -569,7 +528,6 @@ import re
 #     return final_response
 def clean_response(response_text):
     # Remove system and user tags
     response_text = re.sub(r'<\|system\|>.*?<\|end\|>', '', response_text, flags=re.DOTALL)
@@ -591,9 +549,10 @@ def clean_response(response_text):
     # Remove any unwanted escape characters like \u and \u00
     response_text = re.sub(r'\\u[0-9A-Fa-f]{4}', '', response_text)
-    # Ensure proper spacing between words and dates
-    response_text = re.sub(r'([a-zA-Z])(\d)', r'\1 \2', response_text)
-    response_text = re.sub(r'(\d)([a-zA-Z])', r'\1 \2', response_text)
     # Remove the phrase "Sure! The Responses are as follows:" from the actual content
     response_text = re.sub(r'Sure! The Responses are as follows:', '', response_text).strip()
@@ -618,7 +577,6 @@ Sure! The Responses are as follows:
 # Define a new template specifically for GPT-4o-mini in VDB Details mode
 gpt4o_mini_template_details = f"""
 As a highly specialized assistant, I provide precise, detailed, and informative responses. On this bright day of {current_date}, I'm equipped to assist with all your queries about Birmingham, Alabama, offering detailed insights tailored to your needs.

 #     return cleaned_response
 # def clean_response(response_text):
 #     response_text = re.sub(r'<\|system\|>.*?<\|end\|>', '', response_text, flags=re.DOTALL)
 #     response_text = re.sub(r'<\|user\|>.*?<\|end\|>', '', response_text, flags=re.DOTALL)
 #     response_text = re.sub(r'<\|assistant\|>', '', response_text, flags=re.DOTALL)
 #     # Extract the document name and page number
 #     document_match = re.search(r"Document\(metadata=\{'source':'(.+?)','page':(\d+)\}", response_text)
 #     if document_match:
 #     else:
 #         document_name = "Unknown"
 #         page_number = "Unknown"
 #     # Remove the 'Document(metadata=...' part and keep only the page content
 #     response_text = re.sub(r'Document\(metadata=\{.*?\},page_content=', '', response_text, flags=re.DOTALL)
 #     # Remove any unwanted escape characters like \u and \u00
 #     response_text = re.sub(r'\\u[0-9A-Fa-f]{4}', '', response_text)
+#     # Ensure proper spacing between words and dates
 #     response_text = re.sub(r'([a-zA-Z])(\d)', r'\1 \2', response_text)
 #     response_text = re.sub(r'(\d)([a-zA-Z])', r'\1 \2', response_text)
+#     # Remove the phrase "Sure! The Responses are as follows:" from the actual content
+#     response_text = re.sub(r'Sure! The Responses are as follows:', '', response_text).strip()
+#     # Clean up the text by removing extra whitespace
+#     cleaned_response = re.sub(r'\s+', ' ', response_text).strip()
+#     # Format the final response with bullet points
 #     final_response = f"""
 # Sure! The Responses are as follows:
 # • Document name - {document_name}
 #     return final_response
 def clean_response(response_text):
     # Remove system and user tags
     response_text = re.sub(r'<\|system\|>.*?<\|end\|>', '', response_text, flags=re.DOTALL)
     # Remove any unwanted escape characters like \u and \u00
     response_text = re.sub(r'\\u[0-9A-Fa-f]{4}', '', response_text)
+    # Add spaces between words and dates
+    response_text = re.sub(r'([a-zA-Z])(\d)', r'\1 \2', response_text)  # Add space between letter and number
+    response_text = re.sub(r'(\d)([a-zA-Z])', r'\1 \2', response_text)  # Add space between number and letter
+    response_text = re.sub(r'([A-Z])([A-Z][a-z])', r'\1 \2', response_text)  # Add space between capital letters and words
     # Remove the phrase "Sure! The Responses are as follows:" from the actual content
     response_text = re.sub(r'Sure! The Responses are as follows:', '', response_text).strip()
 # Define a new template specifically for GPT-4o-mini in VDB Details mode
 gpt4o_mini_template_details = f"""
 As a highly specialized assistant, I provide precise, detailed, and informative responses. On this bright day of {current_date}, I'm equipped to assist with all your queries about Birmingham, Alabama, offering detailed insights tailored to your needs.