mimifuel2018 committed on
Commit
a331c33
·
verified ·
1 Parent(s): b56c3a2

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +34 -40
app.py CHANGED
@@ -1,32 +1,16 @@
1
  import os
2
  import gradio as gr
 
3
  from typing import List, Optional, Tuple, Dict
4
  import dashscope
5
  from dashscope import Generation
6
  from dashscope.api_entities.dashscope_response import Role
7
-
8
- # Configuration
9
- default_system = 'You are Qwen, created by Alibaba Cloud. You are a helpful assistant.'
10
- dashscope.api_key = os.getenv('HF_TOKEN') # Check if this is loading correctly
11
-
12
- # **Test Token Retrieval** (remove after testing)
13
- print("Token:", dashscope.api_key)
14
-
15
- # Typing definitions
16
- History = List[Tuple[str, str]]
17
- Messages = List[Dict[str, str]]
18
 
19
 
20
- import os
21
- import gradio as gr
22
- from typing import List, Optional, Tuple, Dict
23
- import dashscope
24
- from dashscope import Generation
25
- from dashscope.api_entities.dashscope_response import Role
26
-
27
  # Configuration
28
  default_system = 'You are Qwen, created by Alibaba Cloud. You are a helpful assistant.'
29
- dashscope.api_key = os.getenv('HF_TOKEN')
30
 
31
  # Typing definitions
32
  History = List[Tuple[str, str]]
@@ -71,37 +55,46 @@ def model_chat(query: Optional[str], history: Optional[History], system: str) ->
71
  query = ''
72
  if history is None:
73
  history = []
 
 
 
 
74
 
75
  messages = history_to_messages(history, system)
76
- messages.append({'role': Role.USER, 'content': query})
 
 
 
77
 
78
  try:
79
- gen = Generation.call(
80
- model='qwen2.5-72b-instruct',
81
- messages=messages,
82
- result_format='message',
83
- stream=True
84
- )
85
 
86
- for response in gen:
87
- if response.status_code == 200:
88
- response_text = response.output.choices[0].message.content
89
-
90
- # Log the chat to file
91
- log_history_to_file(query, response_text)
92
-
93
- # Update history with the new assistant response
94
- history.append((query, response_text))
95
- return response_text, history, system
96
  else:
97
- error_message = f"Error: {response.status_code} - {response.message}"
98
- log_history_to_file(query, error_message)
99
- return error_message, history, system
 
 
 
 
 
 
 
 
 
100
  except Exception as e:
101
  error_message = f"Exception: {str(e)}"
102
  log_history_to_file(query, error_message)
103
  return error_message, history, system
104
 
 
 
105
  # Gradio Interface Setup
106
  with gr.Blocks() as demo:
107
  gr.Markdown("<center><font size=8>Qwen2.5-72B-Instruct👾</center>")
@@ -120,6 +113,7 @@ with gr.Blocks() as demo:
120
  clear_history = gr.Button("🧹 Clear history")
121
  submit = gr.Button("🚀 Send")
122
 
 
123
  textbox.submit(model_chat,
124
  inputs=[textbox, chatbot, system_state],
125
  outputs=[textbox, chatbot, system_input],
@@ -142,4 +136,4 @@ with gr.Blocks() as demo:
142
 
143
  # Launching Gradio Interface with reduced threads for free plan
144
  demo.queue(api_open=False)
145
- demo.launch(max_threads=10)
 
1
  import os
2
  import gradio as gr
3
+ from http import HTTPStatus
4
  from typing import List, Optional, Tuple, Dict
5
  import dashscope
6
  from dashscope import Generation
7
  from dashscope.api_entities.dashscope_response import Role
8
+ import requests # <-- Add this line to import the requests library
 
 
 
 
 
 
 
 
 
 
9
 
10
 
 
 
 
 
 
 
 
11
  # Configuration
12
  default_system = 'You are Qwen, created by Alibaba Cloud. You are a helpful assistant.'
13
+ dashscope.api_key = os.getenv('HF_TOKEN') # Replace 'YOUR_API_TOKEN' with your actual API token.
14
 
15
  # Typing definitions
16
  History = List[Tuple[str, str]]
 
55
  query = ''
56
  if history is None:
57
  history = []
58
+
59
+ # Ensure the query is clearly asking for numbers
60
+ if 'next numbers' in query or 'give me numbers after' in query:
61
+ query = "Please give me the next 10 numbers after 10, starting from 11."
62
 
63
  messages = history_to_messages(history, system)
64
+ messages.append({'role': 'user', 'content': query})
65
+
66
+ payload = {"inputs": query, "parameters": {"max_new_tokens": 150}, "history": messages}
67
+ headers = {"Authorization": f"Bearer {os.getenv('HF_TOKEN')}"}
68
 
69
  try:
70
+ response = requests.post(f"https://api-inference.huggingface.co/models/Qwen/Qwen2.5-72B-Instruct",
71
+ json=payload, headers=headers)
 
 
 
 
72
 
73
+ if response.status_code == 200:
74
+ response_data = response.json()
75
+
76
+ if isinstance(response_data, list):
77
+ response_text = response_data[0].get('generated_text', '')
 
 
 
 
 
78
  else:
79
+ response_text = response_data.get('generated_text', '')
80
+
81
+ # Log the chat to file
82
+ log_history_to_file(query, response_text)
83
+
84
+ # Update history with the new assistant response and return it
85
+ history.append([query, response_text])
86
+ return response_text, history, system
87
+ else:
88
+ error_message = f"Error {response.status_code}: {response.json().get('error', response.text)}"
89
+ log_history_to_file(query, error_message)
90
+ return error_message, history, system
91
  except Exception as e:
92
  error_message = f"Exception: {str(e)}"
93
  log_history_to_file(query, error_message)
94
  return error_message, history, system
95
 
96
+
97
+
98
  # Gradio Interface Setup
99
  with gr.Blocks() as demo:
100
  gr.Markdown("<center><font size=8>Qwen2.5-72B-Instruct👾</center>")
 
113
  clear_history = gr.Button("🧹 Clear history")
114
  submit = gr.Button("🚀 Send")
115
 
116
+ # Link buttons to functions
117
  textbox.submit(model_chat,
118
  inputs=[textbox, chatbot, system_state],
119
  outputs=[textbox, chatbot, system_input],
 
136
 
137
  # Launching Gradio Interface with reduced threads for free plan
138
  demo.queue(api_open=False)
139
+ demo.launch(max_threads=10)