yahavb committed on
Commit
654bca1
·
verified ·
1 Parent(s): b3482a8

Create infer.py

Browse files
Files changed (1) hide show
  1. infer.py +14 -0
infer.py ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
"""Print sampled completions of a fixed prompt from a DeepSeek-R1 distill model.

The tokenizer is loaded from the ``deepseek-ai/DeepSeek-R1-Distill-Llama-70B``
repository and the model from ``yahavb/DeepSeek-R1-Distill-Llama-70B-Neuron``
through ``optimum.neuron.NeuronModelForCausalLM``.  The prompt is tokenized
once, then sampled several times; only the newly generated text of each run is
printed.
"""
import torch
from optimum.neuron import NeuronModelForCausalLM
from transformers import AutoTokenizer

model_id = "deepseek-ai/DeepSeek-R1-Distill-Llama-70B"
prompt = "Who are you? what is the model that powers you?"

# Number of independent sampling runs over the same prompt.
num_runs = 10

# Sampling settings forwarded unchanged to ``model.generate`` on every run.
generation_kwargs = {
    "max_new_tokens": 512,
    "do_sample": True,
    "use_cache": True,
    "temperature": 0.7,
    "top_k": 50,
    "top_p": 0.9,
}

tokenizer = AutoTokenizer.from_pretrained(model_id)
# Fall back to the EOS token id when the tokenizer defines no pad token id.
if tokenizer.pad_token_id is None:
    tokenizer.pad_token_id = tokenizer.eos_token_id

inputs = tokenizer(prompt, return_tensors="pt")
model = NeuronModelForCausalLM.from_pretrained("yahavb/DeepSeek-R1-Distill-Llama-70B-Neuron")

# The prompt length is loop-invariant: compute it once and use it to strip the
# echoed prompt tokens from each generated sequence.
prompt_length = inputs.input_ids.size(-1)

# NOTE(review): the original indentation was lost; the loop body is assumed to
# be generate + slice + decode + print, so each run prints its own response.
for _ in range(num_runs):
    outputs = model.generate(**inputs, **generation_kwargs)
    # Keep only the first sequence and drop the leading prompt tokens.
    completion_ids = outputs[0, prompt_length:]
    response = tokenizer.decode(completion_ids, skip_special_tokens=True)
    print(response)