Update README.md
Browse files
README.md
CHANGED
@@ -46,9 +46,7 @@ def load_model(model_size, model_dir):
|
|
46 |
llama_config = LlamaConfig(**config)
|
47 |
model = LlamaForCausalLM(llama_config).to('cuda')
|
48 |
tokenizer = AutoTokenizer.from_pretrained('meta-llama/Llama-2-7b-hf', padding_side="right", use_fast=False)
|
49 |
-
|
50 |
-
if exist_extra_para:
|
51 |
-
model = replace_with_learnable_binarylinear(model, scaling_pattern = "column", keep_parts = ["lm_head"])
|
52 |
|
53 |
weight_dict = {}
|
54 |
ckpt_plist = [p for p in model_dir.iterdir() if p.suffix == '.bin']
|
|
|
46 |
llama_config = LlamaConfig(**config)
|
47 |
model = LlamaForCausalLM(llama_config).to('cuda')
|
48 |
tokenizer = AutoTokenizer.from_pretrained('meta-llama/Llama-2-7b-hf', padding_side="right", use_fast=False)
|
49 |
+
model = replace_with_learnable_binarylinear(model, scaling_pattern = "column", keep_parts = ["lm_head"])
|
|
|
|
|
50 |
|
51 |
weight_dict = {}
|
52 |
ckpt_plist = [p for p in model_dir.iterdir() if p.suffix == '.bin']
|