Pijush2023 commited on
Commit
fbaa4c6
·
verified ·
1 Parent(s): 2b899f6

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +11 -45
app.py CHANGED
@@ -463,60 +463,26 @@ def bot(history, choice, tts_choice, retrieval_mode, model_choice):
463
 
464
  import re
465
 
466
- # def clean_response(response_text):
467
- # # Remove system and user tags
468
- # response_text = re.sub(r'<\|system\|>.*?<\|end\|>', '', response_text, flags=re.DOTALL)
469
- # response_text = re.sub(r'<\|user\|>.*?<\|end\|>', '', response_text, flags=re.DOTALL)
470
- # response_text = re.sub(r'<\|assistant\|>', '', response_text, flags=re.DOTALL)
471
- # #-------
472
- # response_text = re.sub(r'\\u[0-9A-Fa-f]{4}', '', response_text)
473
- # # Add spaces between words and dates (e.g., "born04/04/1963" becomes "born 04/04/1963")
474
- # response_text = re.sub(r'([a-zA-Z])(\d)', r'\1 \2', response_text)
475
- # response_text = re.sub(r'(\d)([a-zA-Z])', r'\1 \2', response_text)
476
- # #--------
477
- # # Clean up the text by removing extra whitespace
478
- # cleaned_response = response_text.strip()
479
- # cleaned_response = re.sub(r'\s+', ' ', cleaned_response)
480
-
481
- # # Ensure the response is conversational and organized
482
- # cleaned_response = cleaned_response.replace('1.', '\n1.').replace('2.', '\n2.').replace('3.', '\n3.').replace('4.', '\n4.').replace('5.', '\n5.')
483
-
484
- # return cleaned_response
485
-
486
- def clean_response(response_text, document_name, page_number):
487
- #Remove System and user Tag
488
  response_text = re.sub(r'<\|system\|>.*?<\|end\|>', '', response_text, flags=re.DOTALL)
489
  response_text = re.sub(r'<\|user\|>.*?<\|end\|>', '', response_text, flags=re.DOTALL)
490
  response_text = re.sub(r'<\|assistant\|>', '', response_text, flags=re.DOTALL)
491
-
492
- # Remove metadata and unwanted parts (like 'Document(metadata...' etc.)
493
- response_text = re.sub(r'Document\(metadata=\{.*?\},page_content="', '', response_text)
494
-
495
- # Remove any unwanted escape characters like \u and \u00
496
  response_text = re.sub(r'\\u[0-9A-Fa-f]{4}', '', response_text)
497
-
498
- # Add spaces between words and numbers (e.g., "born04/04/1963" becomes "born 04/04/1963")
499
  response_text = re.sub(r'([a-zA-Z])(\d)', r'\1 \2', response_text)
500
  response_text = re.sub(r'(\d)([a-zA-Z])', r'\1 \2', response_text)
501
-
502
- # Remove any extra quotation marks at the end
503
- response_text = response_text.rstrip('"')
 
504
 
505
- # Ensure spaces between words
506
- response_text = re.sub(r'([a-z])([A-Z])', r'\1 \2', response_text)
507
 
508
- # Clean up any extra spaces that may result from the replacements
509
- response_text = re.sub(r'\s+', ' ', response_text).strip()
510
 
511
- # Now, format the output as required, directly within the clean_response function
512
- formatted_response = f"""
513
- Sure! The Responses are as follows:
514
- Document name - {document_name}
515
- Page No - {page_number}
516
- Response - {response_text}
517
- """
518
-
519
- return formatted_response
520
 
521
 
522
  # Define a new template specifically for GPT-4o-mini in VDB Details mode
 
463
 
464
  import re
465
 
466
+ def clean_response(response_text):
467
+ # Remove system and user tags
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
468
  response_text = re.sub(r'<\|system\|>.*?<\|end\|>', '', response_text, flags=re.DOTALL)
469
  response_text = re.sub(r'<\|user\|>.*?<\|end\|>', '', response_text, flags=re.DOTALL)
470
  response_text = re.sub(r'<\|assistant\|>', '', response_text, flags=re.DOTALL)
471
+ #-------
 
 
 
 
472
  response_text = re.sub(r'\\u[0-9A-Fa-f]{4}', '', response_text)
473
+ # Add spaces between words and dates (e.g., "born04/04/1963" becomes "born 04/04/1963")
 
474
  response_text = re.sub(r'([a-zA-Z])(\d)', r'\1 \2', response_text)
475
  response_text = re.sub(r'(\d)([a-zA-Z])', r'\1 \2', response_text)
476
+ #--------
477
+ # Clean up the text by removing extra whitespace
478
+ cleaned_response = response_text.strip()
479
+ cleaned_response = re.sub(r'\s+', ' ', cleaned_response)
480
 
481
+ # Ensure the response is conversational and organized
482
+ cleaned_response = cleaned_response.replace('1.', '\n1.').replace('2.', '\n2.').replace('3.', '\n3.').replace('4.', '\n4.').replace('5.', '\n5.')
483
 
484
+ return cleaned_response
 
485
 
 
 
 
 
 
 
 
 
 
486
 
487
 
488
  # Define a new template specifically for GPT-4o-mini in VDB Details mode