Spaces:
Runtime error
Runtime error
Update app.py
Browse files
app.py
CHANGED
@@ -25,7 +25,7 @@ from IPython.display import Markdown, display
|
|
25 |
peft_model_id = "./"
|
26 |
config = PeftConfig.from_pretrained(peft_model_id)
|
27 |
|
28 |
-
bnb_config = BitsAndBytesConfig(
|
29 |
load_in_8bit_fp32_cpu_offload=True,
|
30 |
bnb_8bit_use_fp16=False,
|
31 |
load_in_4bit=True,
|
@@ -34,11 +34,19 @@ bnb_config = BitsAndBytesConfig(
|
|
34 |
bnb_4bit_compute_dtype=torch.bfloat16
|
35 |
)
|
36 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
37 |
model = AutoModelForCausalLM.from_pretrained(
|
38 |
config.base_model_name_or_path,
|
39 |
return_dict=True,
|
40 |
quantization_config=bnb_config,
|
41 |
-
device_map=
|
42 |
trust_remote_code=True,
|
43 |
)
|
44 |
tokenizer = AutoTokenizer.from_pretrained(config.base_model_name_or_path)
|
|
|
25 |
peft_model_id = "./"
|
26 |
config = PeftConfig.from_pretrained(peft_model_id)
|
27 |
|
28 |
+
quantization_config = BitsAndBytesConfig(
|
29 |
load_in_8bit_fp32_cpu_offload=True,
|
30 |
bnb_8bit_use_fp16=False,
|
31 |
load_in_4bit=True,
|
|
|
34 |
bnb_4bit_compute_dtype=torch.bfloat16
|
35 |
)
|
36 |
|
37 |
+
device_map = {
|
38 |
+
"transformer.word_embeddings": "cpu",
|
39 |
+
"transformer.word_embeddings_layernorm": "cpu",
|
40 |
+
"lm_head": "cpu",
|
41 |
+
"transformer.h": "cpu",
|
42 |
+
"transformer.ln_f": "cpu",
|
43 |
+
}
|
44 |
+
|
45 |
model = AutoModelForCausalLM.from_pretrained(
|
46 |
config.base_model_name_or_path,
|
47 |
return_dict=True,
|
48 |
quantization_config=bnb_config,
|
49 |
+
device_map=device_map,
|
50 |
trust_remote_code=True,
|
51 |
)
|
52 |
tokenizer = AutoTokenizer.from_pretrained(config.base_model_name_or_path)
|