Experiment with AWQ
Browse files: config.json (+5 -2)
config.json
CHANGED
@@ -27,8 +27,11 @@
|
|
27 |
"llm_int8_threshold": 6.0,
|
28 |
"load_in_4bit": true,
|
29 |
"load_in_8bit": false,
|
30 |
-
"
|
31 |
-
"
|
|
|
|
|
|
|
32 |
},
|
33 |
"rms_norm_eps": 1e-05,
|
34 |
"rope_scaling": null,
|
|
|
27 |
"llm_int8_threshold": 6.0,
|
28 |
"load_in_4bit": true,
|
29 |
"load_in_8bit": false,
|
30 |
+
"zero_point": true,
|
31 |
+
"q_group_size": 128,
|
32 |
+
"w_bit": 4,
|
33 |
+
"version": "GEMM",
|
34 |
+
"quant_method": "awq"
|
35 |
},
|
36 |
"rms_norm_eps": 1e-05,
|
37 |
"rope_scaling": null,
|