ffreemt committed on
Commit
56ad8d6
·
1 Parent(s): 5f4757d

Back to Qwen/Qwen-7B-Chat

Browse files
Files changed (1) hide show
  1. app.py +3 -2
app.py CHANGED
@@ -60,8 +60,8 @@ except Exception:
60
  # Windows
61
  logger.warning("Windows, cant run time.tzset()")
62
 
63
- model_name = "Qwen/Qwen-7B-Chat" # gone!
64
  model_name = "tangger/Qwen-7B-Chat" # try
 
65
  tokenizer = AutoTokenizer.from_pretrained(model_name, trust_remote_code=True)
66
 
67
  n_gpus = torch.cuda.device_count()
@@ -82,7 +82,8 @@ def gen_model(model_name: str):
82
  model_name,
83
  trust_remote_code=True,
84
  device_map="auto",
85
- load_in_4bit=True,
 
86
  max_memory=max_memory,
87
  fp16=True,
88
  torch_dtype=torch.float16,
 
60
  # Windows
61
  logger.warning("Windows, cant run time.tzset()")
62
 
 
63
  model_name = "tangger/Qwen-7B-Chat" # try
64
+ model_name = "Qwen/Qwen-7B-Chat" # gone!
65
  tokenizer = AutoTokenizer.from_pretrained(model_name, trust_remote_code=True)
66
 
67
  n_gpus = torch.cuda.device_count()
 
82
  model_name,
83
  trust_remote_code=True,
84
  device_map="auto",
85
+ # load_in_4bit=True,
86
+ load_in_8bit=True,
87
  max_memory=max_memory,
88
  fp16=True,
89
  torch_dtype=torch.float16,