Update app.py
app.py CHANGED
@@ -55,24 +55,24 @@ def model_chat(query: Optional[str], history: Optional[History], system: str) ->
         query = ''
     if history is None:
         history = []
+
+    # Ensure the query is clearly asking for numbers
+    if 'next numbers' in query or 'give me numbers after' in query:
+        query = "Please give me the next 10 numbers after 10, starting from 11."
 
-    # Convert history to a list of messages
     messages = history_to_messages(history, system)
     messages.append({'role': 'user', 'content': query})
 
-    # Prepare the payload for Hugging Face Inference API
     payload = {"inputs": query, "parameters": {"max_new_tokens": 150}, "history": messages}
     headers = {"Authorization": f"Bearer {os.getenv('HF_TOKEN')}"}
 
     try:
-        # Request generation with Hugging Face Inference API
         response = requests.post(f"https://api-inference.huggingface.co/models/Qwen/Qwen2.5-72B-Instruct",
                                  json=payload, headers=headers)
 
         if response.status_code == 200:
             response_data = response.json()
-
-            # Handle the response as a list or dict
+
             if isinstance(response_data, list):
                 response_text = response_data[0].get('generated_text', '')
             else:
@@ -83,20 +83,18 @@
 
             # Update history with the new assistant response and return it
             history.append([query, response_text])
-            system, history = messages_to_history(messages + [{'role': 'assistant', 'content': response_text}])
             return response_text, history, system
         else:
-            # Log error message to file and display it in Gradio
             error_message = f"Error {response.status_code}: {response.json().get('error', response.text)}"
             log_history_to_file(query, error_message)
             return error_message, history, system
     except Exception as e:
-        # Log any unexpected exceptions
         error_message = f"Exception: {str(e)}"
         log_history_to_file(query, error_message)
         return error_message, history, system
 
 
+
 # Gradio Interface Setup
 with gr.Blocks() as demo:
     gr.Markdown("<center><font size=8>Qwen2.5-72B-Instruct👾</center>")
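For reference, the request pattern this commit keeps: the serverless Inference API documents only "inputs" and "parameters" (plus "options") for text generation, so the extra "history" key in the payload is most likely ignored by the endpoint, and chat turns would normally be flattened into the prompt string itself. Below is a minimal sketch of that request path; the endpoint URL and the HF_TOKEN environment variable come from the diff, while the helper name query_model and the timeout value are illustrative assumptions, not part of app.py.

import os
import requests

# Same endpoint and token variable as in the diff above.
API_URL = "https://api-inference.huggingface.co/models/Qwen/Qwen2.5-72B-Instruct"
HEADERS = {"Authorization": f"Bearer {os.getenv('HF_TOKEN')}"}

def query_model(prompt: str, max_new_tokens: int = 150) -> str:
    # "inputs" and "parameters" are the documented text-generation fields;
    # anything else (like the diff's "history" key) is presumably ignored.
    payload = {"inputs": prompt, "parameters": {"max_new_tokens": max_new_tokens}}
    response = requests.post(API_URL, json=payload, headers=HEADERS, timeout=60)
    response.raise_for_status()
    data = response.json()
    # The endpoint may return a list of generations or a dict (e.g. an error body).
    if isinstance(data, list):
        return data[0].get("generated_text", "")
    return data.get("generated_text", "")

if __name__ == "__main__":
    print(query_model("Please give me the next 10 numbers after 10, starting from 11."))

Note also that the success path no longer round-trips through messages_to_history, so system and history are returned unchanged apart from the appended [query, response_text] pair.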