radarbackend11262024v11

Runtime error

App Files Files Community

Pijush2023 committed on Sep 15, 2024

Commit

e9a0eca

verified ·

1 Parent(s): 463a37c

Update app.py

Browse files

Files changed (1) hide show

app.py +72 -47

app.py CHANGED Viewed

@@ -353,6 +353,24 @@ QA_CHAIN_PROMPT_2 = PromptTemplate(input_variables=["context", "question"], temp
 # Sure! Here's the information:
 # """
 phi_custom_template = """
 <|system|>
 Sei un esperto della lingua italiana e un madrelingua italiano. Il tuo compito è fornire risposte concise, dirette e brevi basate sul documento fornito. Dovresti restituire le informazioni nel seguente formato:
@@ -369,6 +387,13 @@ Question: {question}<|end|>
 <|assistant|>
 Sure! The Responses are as follows:
 """
 def generate_bot_response(history, choice, retrieval_mode, model_choice):
     if not history:
@@ -445,47 +470,6 @@ def bot(history, choice, tts_choice, retrieval_mode, model_choice):
 import re
-# def clean_response(response_text):
-#     # Remove system and user tags
-#     response_text = re.sub(r'<\|system\|>.*?<\|end\|>', '', response_text, flags=re.DOTALL)
-#     response_text = re.sub(r'<\|user\|>.*?<\|end\|>', '', response_text, flags=re.DOTALL)
-#     response_text = re.sub(r'<\|assistant\|>', '', response_text, flags=re.DOTALL)
-#     # Extract the document name and page number
-#     document_match = re.search(r"Document\(metadata=\{'source':'(.+?)','page':(\d+)\}", response_text)
-#     if document_match:
-#         document_name = document_match.group(1).split('/')[-1]  # Get the document name
-#         page_number = document_match.group(2)  # Get the page number
-#     else:
-#         document_name = "Unknown"
-#         page_number = "Unknown"
-#     # Remove the 'Document(metadata=...' part and keep only the page content
-#     response_text = re.sub(r'Document\(metadata=\{.*?\},page_content=', '', response_text, flags=re.DOTALL)
-#     # Remove any unwanted escape characters like \u and \u00
-#     response_text = re.sub(r'\\u[0-9A-Fa-f]{4}', '', response_text)
-#     # Ensure proper spacing between words and dates
-#     response_text = re.sub(r'([a-zA-Z])(\d)', r'\1 \2', response_text)
-#     response_text = re.sub(r'(\d)([a-zA-Z])', r'\1 \2', response_text)
-#     # Remove the phrase "Sure! The Responses are as follows:" from the actual content
-#     response_text = re.sub(r'Sure! The Responses are as follows:', '', response_text).strip()
-#     # Clean up the text by removing extra whitespace
-#     cleaned_response = re.sub(r'\s+', ' ', response_text).strip()
-#     # Format the final response with bullet points
-#     final_response = f"""
-# Sure! The Responses are as follows:
-# • Document name - {document_name}
-# • Page No - {page_number}
-# • Response - {cleaned_response}
-# """
-#     return final_response
 def clean_response(response_text):
     # Remove system and user tags
     response_text = re.sub(r'<\|system\|>.*?<\|end\|>', '', response_text, flags=re.DOTALL)
@@ -494,7 +478,6 @@ def clean_response(response_text):
     # Extract the document name and page number
     document_match = re.search(r"Document\(metadata=\{'source':'(.+?)','page':(\d+)\}", response_text)
-    document_match = re.search(r"Document\(metadata=\{'source':'(.+?)','page':(\d+)\}", response_text)
     if document_match:
         document_name = document_match.group(1).split('/')[-1]  # Get the document name
         page_number = document_match.group(2)  # Get the page number
@@ -502,11 +485,8 @@ def clean_response(response_text):
         document_name = "Unknown"
         page_number = "Unknown"
-    # Remove the entire 'Document(metadata=...' and any mention of it from the response
     response_text = re.sub(r'Document\(metadata=\{.*?\},page_content=', '', response_text, flags=re.DOTALL)
-    # Remove any mention of "Document:" in the response
-    response_text = re.sub(r'- Document:.*', '', response_text)
     # Remove any unwanted escape characters like \u and \u00
     response_text = re.sub(r'\\u[0-9A-Fa-f]{4}', '', response_text)
@@ -523,7 +503,7 @@ def clean_response(response_text):
     # Format the final response with bullet points
     final_response = f"""
-Sure! Here is the response for your Query:
 • Document name - {document_name}
 • Page No - {page_number}
 • Response - {cleaned_response}
@@ -531,6 +511,51 @@ Sure! Here is the response for your Query:
     return final_response

 # Sure! Here's the information:
 # """
+# phi_custom_template = """
+# <|system|>
+# Sei un esperto della lingua italiana e un madrelingua italiano. Il tuo compito è fornire risposte concise, dirette e brevi basate sul documento fornito. Dovresti restituire le informazioni nel seguente formato:
+# - Nome del documento: (il nome del documento)
+# - Numero di pagina: (numero di pagina)
+# - Contenuto effettivo: (contenuto rilevante del documento)
+# Alla fine, fornisci una sezione separata per la risposta nel seguente formato:
+# - Risposta: (la risposta alla domanda)
+# Se non riesci a trovare la risposta nel documento, rispondi semplicemente con "Questa domanda è al di là delle mie conoscenze". Ecco i dettagli del documento da considerare:
+# <|end|>
+# <|user|>
+# {context}
+# Question: {question}<|end|>
+# <|assistant|>
+# Sure! The Responses are as follows:
+# """
 phi_custom_template = """
 <|system|>
 Sei un esperto della lingua italiana e un madrelingua italiano. Il tuo compito è fornire risposte concise, dirette e brevi basate sul documento fornito. Dovresti restituire le informazioni nel seguente formato:
 <|assistant|>
 Sure! The Responses are as follows:
 """
+<|end|>
+<|user|>
+{context}
+Question: {question}<|end|>
+<|assistant|>
+Sure! The Responses are as follows:
+"""
 def generate_bot_response(history, choice, retrieval_mode, model_choice):
     if not history:
 import re
 def clean_response(response_text):
     # Remove system and user tags
     response_text = re.sub(r'<\|system\|>.*?<\|end\|>', '', response_text, flags=re.DOTALL)
     # Extract the document name and page number
     document_match = re.search(r"Document\(metadata=\{'source':'(.+?)','page':(\d+)\}", response_text)
     if document_match:
         document_name = document_match.group(1).split('/')[-1]  # Get the document name
         page_number = document_match.group(2)  # Get the page number
         document_name = "Unknown"
         page_number = "Unknown"
+    # Remove the 'Document(metadata=...' part and keep only the page content
     response_text = re.sub(r'Document\(metadata=\{.*?\},page_content=', '', response_text, flags=re.DOTALL)
     # Remove any unwanted escape characters like \u and \u00
     response_text = re.sub(r'\\u[0-9A-Fa-f]{4}', '', response_text)
     # Format the final response with bullet points
     final_response = f"""
+Sure! The Responses are as follows:
 • Document name - {document_name}
 • Page No - {page_number}
 • Response - {cleaned_response}
     return final_response
+# def clean_response(response_text):
+#     # Remove system and user tags
+#     response_text = re.sub(r'<\|system\|>.*?<\|end\|>', '', response_text, flags=re.DOTALL)
+#     response_text = re.sub(r'<\|user\|>.*?<\|end\|>', '', response_text, flags=re.DOTALL)
+#     response_text = re.sub(r'<\|assistant\|>', '', response_text, flags=re.DOTALL)
+#     # Extract the document name and page number
+#     document_match = re.search(r"Document\(metadata=\{'source':'(.+?)','page':(\d+)\}", response_text)
+#     document_match = re.search(r"Document\(metadata=\{'source':'(.+?)','page':(\d+)\}", response_text)
+#     if document_match:
+#         document_name = document_match.group(1).split('/')[-1]  # Get the document name
+#         page_number = document_match.group(2)  # Get the page number
+#     else:
+#         document_name = "Unknown"
+#         page_number = "Unknown"
+#     # Remove the entire 'Document(metadata=...' and any mention of it from the response
+#     response_text = re.sub(r'Document\(metadata=\{.*?\},page_content=', '', response_text, flags=re.DOTALL)
+#     # Remove any mention of "Document:" in the response
+#     response_text = re.sub(r'- Document:.*', '', response_text)
+#     # Remove any unwanted escape characters like \u and \u00
+#     response_text = re.sub(r'\\u[0-9A-Fa-f]{4}', '', response_text)
+#     # Ensure proper spacing between words and dates
+#     response_text = re.sub(r'([a-zA-Z])(\d)', r'\1 \2', response_text)
+#     response_text = re.sub(r'(\d)([a-zA-Z])', r'\1 \2', response_text)
+#     # Remove the phrase "Sure! The Responses are as follows:" from the actual content
+#     response_text = re.sub(r'Sure! The Responses are as follows:', '', response_text).strip()
+#     # Clean up the text by removing extra whitespace
+#     cleaned_response = re.sub(r'\s+', ' ', response_text).strip()
+#     # Format the final response with bullet points
+#     final_response = f"""
+# Sure! Here is the response for your Query:
+# • Document name - {document_name}
+# • Page No - {page_number}
+# • Response - {cleaned_response}
+# """
+#     return final_response