ubermenchh committed on
Commit
cde4903
·
1 Parent(s): 6390543

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +2 -1
app.py CHANGED
@@ -66,7 +66,8 @@ bnb_config = transformers.BitsAndBytesConfig(
66
  load_in_4bit=True,
67
  bnb_4bit_quant_type='nf4',
68
  bnb_4bit_use_double_quant=True,
69
- bnb_4bit_compute_dtype=bfloat16
 
70
  )
71
  model_config = transformers.AutoConfig.from_pretrained(model_id, use_auth_token=hf_auth)
72
  model = transformers.AutoModelForCausalLM.from_pretrained(
 
66
  load_in_4bit=True,
67
  bnb_4bit_quant_type='nf4',
68
  bnb_4bit_use_double_quant=True,
69
+ bnb_4bit_compute_dtype=bfloat16,
70
+ load_in_8bit_fp32_cpu_offload=True
71
  )
72
  model_config = transformers.AutoConfig.from_pretrained(model_id, use_auth_token=hf_auth)
73
  model = transformers.AutoModelForCausalLM.from_pretrained(