Pijush2023 commited on
Commit
2b899f6
·
verified ·
1 Parent(s): abe45f3

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +45 -18
app.py CHANGED
@@ -463,33 +463,60 @@ def bot(history, choice, tts_choice, retrieval_mode, model_choice):
463
 
464
  import re
465
 
466
- def clean_response(response_text):
467
- # Remove system and user tags
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
468
  response_text = re.sub(r'<\|system\|>.*?<\|end\|>', '', response_text, flags=re.DOTALL)
469
  response_text = re.sub(r'<\|user\|>.*?<\|end\|>', '', response_text, flags=re.DOTALL)
470
  response_text = re.sub(r'<\|assistant\|>', '', response_text, flags=re.DOTALL)
471
- #-------
 
 
 
 
472
  response_text = re.sub(r'\\u[0-9A-Fa-f]{4}', '', response_text)
473
- # Add spaces between words and dates (e.g., "born04/04/1963" becomes "born 04/04/1963")
 
474
  response_text = re.sub(r'([a-zA-Z])(\d)', r'\1 \2', response_text)
475
  response_text = re.sub(r'(\d)([a-zA-Z])', r'\1 \2', response_text)
476
- #--------
477
- # Clean up the text by removing extra whitespace
478
- cleaned_response = response_text.strip()
479
- cleaned_response = re.sub(r'\s+', ' ', cleaned_response)
480
-
481
- # Ensure the response is conversational and organized
482
- cleaned_response = cleaned_response.replace('1.', '\n1.').replace('2.', '\n2.').replace('3.', '\n3.').replace('4.', '\n4.').replace('5.', '\n5.')
483
-
484
- return cleaned_response
485
-
486
-
487
-
488
-
489
-
490
 
 
 
491
 
 
 
492
 
 
 
 
 
 
 
 
 
 
493
 
494
 
495
  # Define a new template specifically for GPT-4o-mini in VDB Details mode
 
463
 
464
  import re
465
 
466
+ # def clean_response(response_text):
467
+ # # Remove system and user tags
468
+ # response_text = re.sub(r'<\|system\|>.*?<\|end\|>', '', response_text, flags=re.DOTALL)
469
+ # response_text = re.sub(r'<\|user\|>.*?<\|end\|>', '', response_text, flags=re.DOTALL)
470
+ # response_text = re.sub(r'<\|assistant\|>', '', response_text, flags=re.DOTALL)
471
+ # #-------
472
+ # response_text = re.sub(r'\\u[0-9A-Fa-f]{4}', '', response_text)
473
+ # # Add spaces between words and dates (e.g., "born04/04/1963" becomes "born 04/04/1963")
474
+ # response_text = re.sub(r'([a-zA-Z])(\d)', r'\1 \2', response_text)
475
+ # response_text = re.sub(r'(\d)([a-zA-Z])', r'\1 \2', response_text)
476
+ # #--------
477
+ # # Clean up the text by removing extra whitespace
478
+ # cleaned_response = response_text.strip()
479
+ # cleaned_response = re.sub(r'\s+', ' ', cleaned_response)
480
+
481
+ # # Ensure the response is conversational and organized
482
+ # cleaned_response = cleaned_response.replace('1.', '\n1.').replace('2.', '\n2.').replace('3.', '\n3.').replace('4.', '\n4.').replace('5.', '\n5.')
483
+
484
+ # return cleaned_response
485
+
486
+ def clean_response(response_text, document_name, page_number):
487
+ #Remove System and user Tag
488
  response_text = re.sub(r'<\|system\|>.*?<\|end\|>', '', response_text, flags=re.DOTALL)
489
  response_text = re.sub(r'<\|user\|>.*?<\|end\|>', '', response_text, flags=re.DOTALL)
490
  response_text = re.sub(r'<\|assistant\|>', '', response_text, flags=re.DOTALL)
491
+
492
+ # Remove metadata and unwanted parts (like 'Document(metadata...' etc.)
493
+ response_text = re.sub(r'Document\(metadata=\{.*?\},page_content="', '', response_text)
494
+
495
+ # Remove any unwanted escape characters like \u and \u00
496
  response_text = re.sub(r'\\u[0-9A-Fa-f]{4}', '', response_text)
497
+
498
+ # Add spaces between words and numbers (e.g., "born04/04/1963" becomes "born 04/04/1963")
499
  response_text = re.sub(r'([a-zA-Z])(\d)', r'\1 \2', response_text)
500
  response_text = re.sub(r'(\d)([a-zA-Z])', r'\1 \2', response_text)
501
+
502
+ # Remove any extra quotation marks at the end
503
+ response_text = response_text.rstrip('"')
 
 
 
 
 
 
 
 
 
 
 
504
 
505
+ # Ensure spaces between words
506
+ response_text = re.sub(r'([a-z])([A-Z])', r'\1 \2', response_text)
507
 
508
+ # Clean up any extra spaces that may result from the replacements
509
+ response_text = re.sub(r'\s+', ' ', response_text).strip()
510
 
511
+ # Now, format the output as required, directly within the clean_response function
512
+ formatted_response = f"""
513
+ Sure! The Responses are as follows:
514
+ Document name - {document_name}
515
+ Page No - {page_number}
516
+ Response - {response_text}
517
+ """
518
+
519
+ return formatted_response
520
 
521
 
522
  # Define a new template specifically for GPT-4o-mini in VDB Details mode