kaitchup
/

Qwen2.5-7B-Instruct-gptqmodel-4bit

Text Generation

text-generation-inference

4-bit precision

Model card · Files and versions · Community

bnjmnmarie committed on Feb 4

Commit

a724bb7

·

verified ·

1 Parent(s): 2e8d8a7

Update config.json

Files changed (1) hide show

config.json +18 -17

config.json CHANGED Viewed

@@ -4,23 +4,24 @@
     "Qwen2ForCausalLM"
   ],
   "quantization_config": {
-  "bits": 8,
-  "dynamic": null,
-  "group_size": 128,
-  "desc_act": true,
-  "sym": true,
-  "lm_head": false,
-  "quant_method": "gptq",
-  "checkpoint_format": "gptq",
-  "meta": {
-    "quantizer": [
-      "gptqmodel:1.7.4"
-    ],
-    "uri": "https://github.com/modelcloud/gptqmodel",
-    "damp_percent": 0.01,
-    "damp_auto_increment": 0.0025,
-    "static_groups": false,
-    "true_sequential": true,
   },
   "attention_dropout": 0.0,
   "bos_token_id": 151643,

     "Qwen2ForCausalLM"
   ],
   "quantization_config": {
+    "bits": 4,
+    "dynamic": null,
+    "group_size": 128,
+    "desc_act": true,
+    "sym": true,
+    "lm_head": false,
+    "quant_method": "gptq",
+    "checkpoint_format": "gptq",
+    "meta": {
+      "quantizer": [
+        "gptqmodel:1.7.4"
+      ],
+      "uri": "https://github.com/modelcloud/gptqmodel",
+      "damp_percent": 0.01,
+      "damp_auto_increment": 0.0025,
+      "static_groups": false,
+      "true_sequential": true
+    }
   },
   "attention_dropout": 0.0,
   "bos_token_id": 151643,