kaitwithkwk committed on
Commit 13e2469 · verified · 1 Parent(s): 8eb3105

Update app.py

Files changed (1)
  1. app.py +20 -6
app.py CHANGED
@@ -1,30 +1,44 @@
import gradio as gr
from huggingface_hub import InferenceClient

client = InferenceClient("HuggingFaceH4/zephyr-7b-beta")

def respond(message, history):
-    messages = [{"role": "system", "content": "I am a kind chatbot."}]

    # Add all previous messages to the messages list
    for human, assistant in history:
        messages.append({"role": "user", "content": human})
        messages.append({"role": "assistant", "content": assistant})

-    # Add the current user's message to the messages list
    messages.append({"role": "user", "content": message})

    response = ""
    for chunk in client.chat_completion(
        messages,
-        max_tokens=100,
-        temperature=0.1,
        stream=True
    ):
        token = chunk.choices[0].delta.content
        response += token
-        # Filter out any unwanted tokens like </s> or <|endoftext|>, [USER], [/ASS]
-        cleaned_response = response.replace("</s>", "").replace("<|endoftext|>", "").replace("[USER]", "").replace("[/ASS]", "").strip()
        yield cleaned_response

chatbot = gr.ChatInterface(respond)
 
import gradio as gr
from huggingface_hub import InferenceClient
+import re

client = InferenceClient("HuggingFaceH4/zephyr-7b-beta")

def respond(message, history):
+    messages = [{"role": "system", "content": "You are a helpful, respectful and honest assistant. Always answer as helpfully as possible, while being safe."}]

    # Add all previous messages to the messages list
    for human, assistant in history:
        messages.append({"role": "user", "content": human})
        messages.append({"role": "assistant", "content": assistant})

+    # Add the current user's message to the messages list
    messages.append({"role": "user", "content": message})

    response = ""
    for chunk in client.chat_completion(
        messages,
+        max_tokens=500,
+        temperature=0.5,
        stream=True
    ):
        token = chunk.choices[0].delta.content
        response += token
+
+        # Enhanced post-processing to handle unwanted patterns
+        cleaned_response = response
+
+        # Remove special tokens and unwanted labels more aggressively
+        # Added \s* to catch spaces around the tags, and made the regex more comprehensive
+        cleaned_response = re.sub(r"<\|endoftext\|>|<\|user\|>|<\|assistant\|>|<\|system\>|\s*\[USER\]\s*|\s*\[/ASS\]\s*|\s*\[ASS\]\s*|\s*\[/USER\]\s*|\s*\[INST\]\s*|\s*\[/INST\]\s*|\s*\[ASSIST\]\s*|\s*\[/ASSIST\]\s*", "", cleaned_response)
+
+        # Remove any remaining HTML-like tags (e.g., <p>, <div>) that might appear
+        cleaned_response = re.sub(r"<[^>]*>", "", cleaned_response)
+
+        # Clean up extra whitespace and newlines, ensuring single newlines between paragraphs
+        cleaned_response = re.sub(r"\n+", "\n", cleaned_response)
+        cleaned_response = cleaned_response.strip()
+
        yield cleaned_response

chatbot = gr.ChatInterface(respond)
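
For context on the new post-processing, here is a minimal standalone sketch that applies the same three regular expressions the commit adds inside respond(), so the cleanup can be tried outside the Gradio app. The clean_response helper name and the sample string are illustrative only and are not part of the commit.

import re

def clean_response(response: str) -> str:
    # Strip special tokens and role labels (same pattern as the commit's first re.sub)
    cleaned = re.sub(
        r"<\|endoftext\|>|<\|user\|>|<\|assistant\|>|<\|system\>"
        r"|\s*\[USER\]\s*|\s*\[/ASS\]\s*|\s*\[ASS\]\s*|\s*\[/USER\]\s*"
        r"|\s*\[INST\]\s*|\s*\[/INST\]\s*|\s*\[ASSIST\]\s*|\s*\[/ASSIST\]\s*",
        "",
        response,
    )
    # Drop any remaining HTML-like tags
    cleaned = re.sub(r"<[^>]*>", "", cleaned)
    # Collapse runs of newlines and trim surrounding whitespace
    cleaned = re.sub(r"\n+", "\n", cleaned)
    return cleaned.strip()

# Illustrative input: role and end-of-text tokens are stripped, whitespace is trimmed
print(clean_response("<|assistant|> Sure, I can help!\n\n\n<|endoftext|>"))
# prints: Sure, I can help!

Note that the committed pattern writes the system tag as <\|system\>, which matches <|system> rather than <|system|>; whether that is intentional is not clear from the diff.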