rphrp1985 committed on
Commit
bc7e35a
·
verified ·
1 Parent(s): 59f7ef5

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +1 -0
app.py CHANGED
@@ -134,6 +134,7 @@ tokenizer = AutoTokenizer.from_pretrained(MODEL_ID)
 model = AutoModelForCausalLM.from_pretrained(
     MODEL_ID,
     device_map="auto",
+    low_cpu_mem_usage=True,
     quantization_config=quantization_config,
     attn_implementation="flash_attention_2",
 )