Spaces:
Running
on
T4
Running
on
T4
ffreemt
committed on
Commit
·
56ad8d6
1
Parent(s):
5f4757d
Back to Qwen/Qwen-7B-Chat
Browse files
app.py
CHANGED
@@ -60,8 +60,8 @@ except Exception:
|
|
60 |
# Windows
|
61 |
logger.warning("Windows, cant run time.tzset()")
|
62 |
|
63 |
-
model_name = "Qwen/Qwen-7B-Chat" # gone!
|
64 |
model_name = "tangger/Qwen-7B-Chat" # try
|
|
|
65 |
tokenizer = AutoTokenizer.from_pretrained(model_name, trust_remote_code=True)
|
66 |
|
67 |
n_gpus = torch.cuda.device_count()
|
@@ -82,7 +82,8 @@ def gen_model(model_name: str):
|
|
82 |
model_name,
|
83 |
trust_remote_code=True,
|
84 |
device_map="auto",
|
85 |
-
load_in_4bit=True,
|
|
|
86 |
max_memory=max_memory,
|
87 |
fp16=True,
|
88 |
torch_dtype=torch.float16,
|
|
|
60 |
# Windows
|
61 |
logger.warning("Windows, cant run time.tzset()")
|
62 |
|
|
|
63 |
model_name = "tangger/Qwen-7B-Chat" # try
|
64 |
+
model_name = "Qwen/Qwen-7B-Chat" # gone!
|
65 |
tokenizer = AutoTokenizer.from_pretrained(model_name, trust_remote_code=True)
|
66 |
|
67 |
n_gpus = torch.cuda.device_count()
|
|
|
82 |
model_name,
|
83 |
trust_remote_code=True,
|
84 |
device_map="auto",
|
85 |
+
# load_in_4bit=True,
|
86 |
+
load_in_8bit=True,
|
87 |
max_memory=max_memory,
|
88 |
fp16=True,
|
89 |
torch_dtype=torch.float16,
|