Spaces:
Runtime error
Runtime error
Update app.py
Browse files
app.py
CHANGED
@@ -463,60 +463,26 @@ def bot(history, choice, tts_choice, retrieval_mode, model_choice):
|
|
463 |
|
464 |
import re
|
465 |
|
466 |
-
|
467 |
-
#
|
468 |
-
# response_text = re.sub(r'<\|system\|>.*?<\|end\|>', '', response_text, flags=re.DOTALL)
|
469 |
-
# response_text = re.sub(r'<\|user\|>.*?<\|end\|>', '', response_text, flags=re.DOTALL)
|
470 |
-
# response_text = re.sub(r'<\|assistant\|>', '', response_text, flags=re.DOTALL)
|
471 |
-
# #-------
|
472 |
-
# response_text = re.sub(r'\\u[0-9A-Fa-f]{4}', '', response_text)
|
473 |
-
# # Add spaces between words and dates (e.g., "born04/04/1963" becomes "born 04/04/1963")
|
474 |
-
# response_text = re.sub(r'([a-zA-Z])(\d)', r'\1 \2', response_text)
|
475 |
-
# response_text = re.sub(r'(\d)([a-zA-Z])', r'\1 \2', response_text)
|
476 |
-
# #--------
|
477 |
-
# # Clean up the text by removing extra whitespace
|
478 |
-
# cleaned_response = response_text.strip()
|
479 |
-
# cleaned_response = re.sub(r'\s+', ' ', cleaned_response)
|
480 |
-
|
481 |
-
# # Ensure the response is conversational and organized
|
482 |
-
# cleaned_response = cleaned_response.replace('1.', '\n1.').replace('2.', '\n2.').replace('3.', '\n3.').replace('4.', '\n4.').replace('5.', '\n5.')
|
483 |
-
|
484 |
-
# return cleaned_response
|
485 |
-
|
486 |
-
def clean_response(response_text, document_name, page_number):
|
487 |
-
#Remove System and user Tag
|
488 |
response_text = re.sub(r'<\|system\|>.*?<\|end\|>', '', response_text, flags=re.DOTALL)
|
489 |
response_text = re.sub(r'<\|user\|>.*?<\|end\|>', '', response_text, flags=re.DOTALL)
|
490 |
response_text = re.sub(r'<\|assistant\|>', '', response_text, flags=re.DOTALL)
|
491 |
-
|
492 |
-
# Remove metadata and unwanted parts (like 'Document(metadata...' etc.)
|
493 |
-
response_text = re.sub(r'Document\(metadata=\{.*?\},page_content="', '', response_text)
|
494 |
-
|
495 |
-
# Remove any unwanted escape characters like \u and \u00
|
496 |
response_text = re.sub(r'\\u[0-9A-Fa-f]{4}', '', response_text)
|
497 |
-
|
498 |
-
# Add spaces between words and numbers (e.g., "born04/04/1963" becomes "born 04/04/1963")
|
499 |
response_text = re.sub(r'([a-zA-Z])(\d)', r'\1 \2', response_text)
|
500 |
response_text = re.sub(r'(\d)([a-zA-Z])', r'\1 \2', response_text)
|
501 |
-
|
502 |
-
#
|
503 |
-
|
|
|
504 |
|
505 |
-
# Ensure
|
506 |
-
|
507 |
|
508 |
-
|
509 |
-
response_text = re.sub(r'\s+', ' ', response_text).strip()
|
510 |
|
511 |
-
# Now, format the output as required, directly within the clean_response function
|
512 |
-
formatted_response = f"""
|
513 |
-
Sure! The Responses are as follows:
|
514 |
-
Document name - {document_name}
|
515 |
-
Page No - {page_number}
|
516 |
-
Response - {response_text}
|
517 |
-
"""
|
518 |
-
|
519 |
-
return formatted_response
|
520 |
|
521 |
|
522 |
# Define a new template specifically for GPT-4o-mini in VDB Details mode
|
|
|
463 |
|
464 |
import re
|
465 |
|
466 |
+
def clean_response(response_text):
|
467 |
+
# Remove system and user tags
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
468 |
response_text = re.sub(r'<\|system\|>.*?<\|end\|>', '', response_text, flags=re.DOTALL)
|
469 |
response_text = re.sub(r'<\|user\|>.*?<\|end\|>', '', response_text, flags=re.DOTALL)
|
470 |
response_text = re.sub(r'<\|assistant\|>', '', response_text, flags=re.DOTALL)
|
471 |
+
#-------
|
|
|
|
|
|
|
|
|
472 |
response_text = re.sub(r'\\u[0-9A-Fa-f]{4}', '', response_text)
|
473 |
+
# Add spaces between words and dates (e.g., "born04/04/1963" becomes "born 04/04/1963")
|
|
|
474 |
response_text = re.sub(r'([a-zA-Z])(\d)', r'\1 \2', response_text)
|
475 |
response_text = re.sub(r'(\d)([a-zA-Z])', r'\1 \2', response_text)
|
476 |
+
#--------
|
477 |
+
# Clean up the text by removing extra whitespace
|
478 |
+
cleaned_response = response_text.strip()
|
479 |
+
cleaned_response = re.sub(r'\s+', ' ', cleaned_response)
|
480 |
|
481 |
+
# Ensure the response is conversational and organized
|
482 |
+
cleaned_response = cleaned_response.replace('1.', '\n1.').replace('2.', '\n2.').replace('3.', '\n3.').replace('4.', '\n4.').replace('5.', '\n5.')
|
483 |
|
484 |
+
return cleaned_response
|
|
|
485 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
486 |
|
487 |
|
488 |
# Define a new template specifically for GPT-4o-mini in VDB Details mode
|