"""Export a Hugging Face causal LM through optimum-neuron and publish it.

The script logs in to the Hugging Face Hub, loads ``model_id`` with
``export=True`` using the compiler arguments and input shapes defined below,
saves the result to ``model_dir`` and pushes that directory to ``hf_repo``.
"""

import os

from huggingface_hub import login
from huggingface_hub.hf_api import HfFolder
from optimum.neuron import NeuronModelForCausalLM

# Hub access token. Prefer supplying it through the HF_TOKEN environment
# variable so that no credential has to be written into this file; the
# original placeholder is kept as the fallback value.
hf_token = os.environ.get("HF_TOKEN", "hf_TBD")

# Values forwarded to ``from_pretrained`` below.
sequence_length = 256
auto_cast_type = "bf16"
batch_size = 8
num_cores = 16

# Destination repository on the Hub for the exported artifacts.
hf_repo = "yahavb/DeepSeek-R1-Distill-Llama-70B-Neuron"
# Local output directory. NOTE(review): this is an absolute path directly
# under the filesystem root -- confirm that is intended and writable.
model_dir = "/deepseek-ai/DeepSeek-R1-Distill-Llama-70B"
# Source checkpoint on the Hub.
model_id = "deepseek-ai/DeepSeek-R1-Distill-Llama-70B"

# Authenticate; the token is also stored as a git credential.
login(hf_token, add_to_git_credential=True)

compiler_args = {"num_cores": num_cores, "auto_cast_type": auto_cast_type}
input_shapes = {"batch_size": batch_size, "sequence_length": sequence_length}

# Load the checkpoint with export enabled, passing both the compiler
# arguments and the input shapes as keyword arguments.
model = NeuronModelForCausalLM.from_pretrained(
    model_id,
    export=True,
    **compiler_args,
    **input_shapes,
)

# Persist the exported model locally, then upload that directory to the Hub.
model.save_pretrained(model_dir)
model.push_to_hub(model_dir, repository_id=hf_repo)