from typing import List , Tuple , Union from web_ui import WebUI import math import os from qwen_agent.agents import Assistant from qwen_agent.gui.gradio import gr def app_gui (): # Define the agent bot = Assistant(llm={ 'model': 'QwQ-32B-preview', #os.environ.get( "MODELNAME" ), 'model_type': 'qwen_dashscope', 'generate_cfg': { 'max_input_tokens': 32768, 'max_retries': 10, 'temperature': float (os.environ.get( "T", 0.001 )), 'repetition_penalty': float (os.environ.get( "R", 1.0 )), "top_k": int (os.environ.get( "K", 20 )), "top_p": float (os.environ.get( "P", 0.8 )), }}, name = 'QwQ-32B-preview', description= 'QwQ-32B-Preview is an experimental research model developed by the Qwen Team, focused on advancing AI reasoning capabilities. As a preview release, it demonstrates promising analytical abilities while having several important limitations such as code switching and recursive reasoning loops. Only single-turn queries are supported in this demo.' , system_message= 'You are a helpful and harmless assistant. You are Qwen developed by Alibaba. You should think step-by-step.' , rag_cfg={ 'max_ref_token' : 32768 , 'rag_searchers' : []}, ) chatbot_config = { 'input.placeholder': "Type \"/clear\" to clear the history", 'verbose': True, 'prompt.suggestions': [ { 'text': 'How many r in strawberry' }, { 'text': 'Find the least odd prime factor of $2019^8+1$.' }, ] } WebUI(bot, chatbot_config=chatbot_config).run(concurrency_limit=80) if __name__ == '__main__' : app_gui()