rodrigomasini committed on
Commit
cd664b9
·
1 Parent(s): 112a0e5

Update app_v2.py

Browse files
Files changed (1) hide show
  1. app_v2.py +1 -1
app_v2.py CHANGED
@@ -18,7 +18,7 @@ model = AutoGPTQForCausalLM.from_quantized(
18
  pretrained_model_dir,
19
  use_safetensors=True,
20
  strict=False,
21
- #model_basename=quantized_model_dir,
22
  device="cuda:0",
23
  trust_remote_code=True,
24
  use_triton=False,
 
18
  pretrained_model_dir,
19
  use_safetensors=True,
20
  strict=False,
21
+ model_basename='Jackson2-4bit-128g-GPTQ.safetensors',
22
  device="cuda:0",
23
  trust_remote_code=True,
24
  use_triton=False,