Spaces:
Paused
Paused
Commit
·
2280c62
1
Parent(s):
5e9aaf4
Update app_v2.py
Browse files
app_v2.py
CHANGED
@@ -11,7 +11,7 @@ quantized_model_dir = "./Jackson2-4bit-128g-GPTQ"
|
|
11 |
os.makedirs(quantized_model_dir, exist_ok=True)
|
12 |
|
13 |
# Quantization configuration
|
14 |
-
quantize_config = BaseQuantizeConfig(bits=4, group_size=128, desc_act=False)
|
15 |
|
16 |
# Load the model using from_quantized
|
17 |
model = AutoGPTQForCausalLM.from_quantized(
|
|
|
11 |
os.makedirs(quantized_model_dir, exist_ok=True)
|
12 |
|
13 |
# Quantization configuration
|
14 |
+
quantize_config = BaseQuantizeConfig(bits=4, group_size=128, damp_percent=0.01, desc_act=False)
|
15 |
|
16 |
# Load the model using from_quantized
|
17 |
model = AutoGPTQForCausalLM.from_quantized(
|