avanish07 committed on
Commit
12ac526
·
1 Parent(s): d02a246

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +10 -2
app.py CHANGED
@@ -25,7 +25,7 @@ from IPython.display import Markdown, display
25
  peft_model_id = "./"
26
  config = PeftConfig.from_pretrained(peft_model_id)
27
 
28
- bnb_config = BitsAndBytesConfig(
29
  load_in_8bit_fp32_cpu_offload=True,
30
  bnb_8bit_use_fp16=False,
31
  load_in_4bit=True,
@@ -34,11 +34,19 @@ bnb_config = BitsAndBytesConfig(
34
  bnb_4bit_compute_dtype=torch.bfloat16
35
  )
36
 
 
 
 
 
 
 
 
 
37
  model = AutoModelForCausalLM.from_pretrained(
38
  config.base_model_name_or_path,
39
  return_dict=True,
40
  quantization_config=bnb_config,
41
- device_map=None,
42
  trust_remote_code=True,
43
  )
44
  tokenizer = AutoTokenizer.from_pretrained(config.base_model_name_or_path)
 
25
  peft_model_id = "./"
26
  config = PeftConfig.from_pretrained(peft_model_id)
27
 
28
+ quantization_config = BitsAndBytesConfig(
29
  load_in_8bit_fp32_cpu_offload=True,
30
  bnb_8bit_use_fp16=False,
31
  load_in_4bit=True,
 
34
  bnb_4bit_compute_dtype=torch.bfloat16
35
  )
36
 
37
+ device_map = {
38
+ "transformer.word_embeddings": "cpu",
39
+ "transformer.word_embeddings_layernorm": "cpu",
40
+ "lm_head": "cpu",
41
+ "transformer.h": "cpu",
42
+ "transformer.ln_f": "cpu",
43
+ }
44
+
45
  model = AutoModelForCausalLM.from_pretrained(
46
  config.base_model_name_or_path,
47
  return_dict=True,
48
  quantization_config=bnb_config,
49
+ device_map=device_map,
50
  trust_remote_code=True,
51
  )
52
  tokenizer = AutoTokenizer.from_pretrained(config.base_model_name_or_path)