binqiangliu committed on
Commit
0266d0b
·
1 Parent(s): 42d6a0b

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +4 -1
app.py CHANGED
@@ -15,10 +15,13 @@ use_triton = False
15
 
16
  tokenizer = AutoTokenizer.from_pretrained(model_name_or_path, use_fast=True)
17
 
 
 
18
  model = AutoGPTQForCausalLM.from_quantized(model_name_or_path,
19
  use_safetensors=True,
20
  #device="cuda:0",
21
- device_map="auto",
 
22
  use_triton=use_triton,
23
  quantize_config=None)
24
 
 
15
 
16
  tokenizer = AutoTokenizer.from_pretrained(model_name_or_path, use_fast=True)
17
 
18
+ device="cuda" if torch.cuda.is_available() else "cpu"):
19
+
20
  model = AutoGPTQForCausalLM.from_quantized(model_name_or_path,
21
  use_safetensors=True,
22
  #device="cuda:0",
23
+ device=device,
24
+ #device_map="auto",
25
  use_triton=use_triton,
26
  quantize_config=None)
27