Manojajj commited on
Commit
6f7d7b4
·
verified ·
1 Parent(s): 11985f5

Create app.py

Browse files
Files changed (1) hide show
  1. app.py +57 -0
app.py ADDED
@@ -0,0 +1,57 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import gradio as gr
2
+ from transformers import AutoModelForCausalLM, AutoTokenizer
3
+ import torch
4
+
5
+ # Load the model and tokenizer
6
+ model_name = "Qwen/Qwen2.5-Coder-32B-Instruct"
7
+ model = AutoModelForCausalLM.from_pretrained(
8
+ model_name,
9
+ torch_dtype="auto",
10
+ device_map="auto"
11
+ )
12
+ tokenizer = AutoTokenizer.from_pretrained(model_name)
13
+
14
+ # Function to interact with the model
15
+ def chat_with_model(user_input):
16
+ prompt = user_input
17
+ messages = [
18
+ {"role": "system", "content": "You are Qwen, created by Alibaba Cloud. You are a helpful assistant."},
19
+ {"role": "user", "content": prompt}
20
+ ]
21
+
22
+ # Use apply_chat_template to format messages for the model
23
+ text = tokenizer.apply_chat_template(
24
+ messages,
25
+ tokenize=False,
26
+ add_generation_prompt=True
27
+ )
28
+
29
+ # Tokenize the input and send it to the model
30
+ model_inputs = tokenizer([text], return_tensors="pt").to(model.device)
31
+
32
+ # Generate the response from the model
33
+ generated_ids = model.generate(
34
+ **model_inputs,
35
+ max_new_tokens=512
36
+ )
37
+
38
+ # Decode the generated response
39
+ generated_ids = [
40
+ output_ids[len(input_ids):] for input_ids, output_ids in zip(model_inputs.input_ids, generated_ids)
41
+ ]
42
+
43
+ response = tokenizer.batch_decode(generated_ids, skip_special_tokens=True)[0]
44
+
45
+ return response
46
+
47
+ # Create the Gradio interface
48
+ iface = gr.Interface(
49
+ fn=chat_with_model,
50
+ inputs=gr.Textbox(lines=2, placeholder="Ask me anything..."),
51
+ outputs="text",
52
+ title="Qwen2.5-Coder Chatbot",
53
+ description="A chatbot using Qwen2.5-Coder for code generation, reasoning, and fixing tasks."
54
+ )
55
+
56
+ # Launch the interface
57
+ iface.launch()