Ngadou's picture
Update app.py
bcb14a1 verified
from typing import List , Tuple , Union
from web_ui import WebUI
import math
import os
from qwen_agent.agents import Assistant
from qwen_agent.gui.gradio import gr
def app_gui():
    """Configure the QwQ-32B-preview assistant and start its web UI.

    Sampling parameters are read from environment variables, each falling
    back to the default shown when the variable is unset:

    * ``T`` -- temperature (0.001)
    * ``R`` -- repetition penalty (1.0)
    * ``K`` -- top-k (20)
    * ``P`` -- top-p (0.8)

    The function ends by calling ``WebUI(...).run(concurrency_limit=80)``
    and returns nothing itself.
    """
    env = os.environ.get

    # Generation settings; the environment lookups happen in T, R, K, P order.
    sampling = {
        'max_input_tokens': 32768,
        'max_retries': 10,
        'temperature': float(env("T", 0.001)),
        'repetition_penalty': float(env("R", 1.0)),
        "top_k": int(env("K", 20)),
        "top_p": float(env("P", 0.8)),
    }

    # The model name is fixed here; the MODELNAME environment override is
    # intentionally not consulted.
    llm_settings = {
        'model': 'QwQ-32B-preview',
        'model_type': 'qwen_dashscope',
        'generate_cfg': sampling,
    }

    # Define the agent.
    bot = Assistant(
        llm=llm_settings,
        name='QwQ-32B-preview',
        description='QwQ-32B-Preview is an experimental research model developed by the Qwen Team, focused on advancing AI reasoning capabilities. As a preview release, it demonstrates promising analytical abilities while having several important limitations such as code switching and recursive reasoning loops. Only single-turn queries are supported in this demo.',
        system_message='You are a helpful and harmless assistant. You are Qwen developed by Alibaba. You should think step-by-step.',
        rag_cfg={'max_ref_token': 32768, 'rag_searchers': []},
    )

    # Example prompts offered to the user in the chat box.
    example_prompts = (
        'How many r in strawberry',
        'Find the least odd prime factor of $2019^8+1$.',
    )
    chatbot_config = {
        'input.placeholder': "Type \"/clear\" to clear the history",
        'verbose': True,
        'prompt.suggestions': [{'text': prompt} for prompt in example_prompts],
    }

    ui = WebUI(bot, chatbot_config=chatbot_config)
    ui.run(concurrency_limit=80)
# Launch the demo only when this file is executed as a script, not on import.
if __name__ == "__main__":
    app_gui()