Create infer.py
Browse files
infer.py
ADDED
@@ -0,0 +1,14 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
import torch
|
2 |
+
from optimum.neuron import NeuronModelForCausalLM
|
3 |
+
from transformers import AutoTokenizer
|
4 |
+
# Tokenizer source repo and the prompt sent to the model on every run.
model_id = "deepseek-ai/DeepSeek-R1-Distill-Llama-70B"
prompt = "Who are you? what is the model that powers you?"

tokenizer = AutoTokenizer.from_pretrained(model_id)
# generate() needs a pad token; fall back to EOS when the tokenizer has none.
if tokenizer.pad_token_id is None:
    tokenizer.pad_token_id = tokenizer.eos_token_id

inputs = tokenizer(prompt, return_tensors="pt")
# The returned sequence starts with the prompt tokens; remember how many to
# skip so only the newly generated text is printed.
prompt_length = inputs.input_ids.size(-1)

# NOTE(review): model weights come from a different repo than the tokenizer;
# presumably a Neuron-compiled export of the same checkpoint -- confirm.
model = NeuronModelForCausalLM.from_pretrained("yahavb/DeepSeek-R1-Distill-Llama-70B-Neuron")

# Sample ten independent completions for the same prompt.
# NOTE(review): the captured source lost its indentation; this assumes
# generate, slice, decode and print all belong to the loop body -- confirm.
for _ in range(10):
    outputs = model.generate(
        **inputs,
        max_new_tokens=512,
        do_sample=True,
        use_cache=True,
        temperature=0.7,
        top_k=50,
        top_p=0.9,
    )
    # Single prompt, so take row 0 and drop the echoed prompt tokens.
    new_tokens = outputs[0, prompt_length:]
    response = tokenizer.decode(new_tokens, skip_special_tokens=True)
    print(response)
|