Spaces: Running on Zero
Update app.py
Browse files
app.py
CHANGED
@@ -35,7 +35,7 @@ def respond(
|
|
35 |
messages.append({"role": "user", "content": message})
|
36 |
print(messages)
|
37 |
inputs = tokenizer.apply_chat_template(messages, return_tensors="pt", add_generation_prompt=True, enable_reasoning=enable_reasoning, return_dict=True).to(device)
|
38 |
-
generation_kwargs = dict(inputs, streamer=streamer, max_new_tokens=max_tokens, temperature=temperature, repetition_penalty=repetition_penalty
|
39 |
thread = Thread(target=model.generate, kwargs=generation_kwargs)
|
40 |
|
41 |
thread.start()
|
|
|
35 |
messages.append({"role": "user", "content": message})
|
36 |
print(messages)
|
37 |
inputs = tokenizer.apply_chat_template(messages, return_tensors="pt", add_generation_prompt=True, enable_reasoning=enable_reasoning, return_dict=True).to(device)
|
38 |
+
generation_kwargs = dict(inputs, streamer=streamer, max_new_tokens=max_tokens, temperature=temperature, repetition_penalty=repetition_penalty)
|
39 |
thread = Thread(target=model.generate, kwargs=generation_kwargs)
|
40 |
|
41 |
thread.start()
|