reyvan
/

Qwen-7B-8bit

Text Generation

4-bit precision

Model card Files and versions Community

reyvan committed on Feb 22, 2024

Commit

94165f4

·

verified ·

1 Parent(s): 045dc76

Upload 3 files

Files changed (2) hide show

config.json +1 -1
quantize_config.json +1 -1

config.json CHANGED Viewed

@@ -30,7 +30,7 @@
     "group_size": 128,
     "is_marlin_format": false,
     "model_file_base_name": "gptq_model-4bit-128g",
-    "model_name_or_path": "Qwen-7B-4bit",
     "quant_method": "gptq",
     "static_groups": false,
     "sym": true,

     "group_size": 128,
     "is_marlin_format": false,
     "model_file_base_name": "gptq_model-4bit-128g",
+    "model_name_or_path": "Qwen-7B-125m-4bit-128g",
     "quant_method": "gptq",
     "static_groups": false,
     "sym": true,

quantize_config.json CHANGED Viewed

@@ -6,7 +6,7 @@
   "static_groups": false,
   "sym": true,
   "true_sequential": true,
-  "model_name_or_path": "Qwen-7B-4bit",
   "model_file_base_name": "gptq_model-4bit-128g",
   "is_marlin_format": false,
   "quant_method": "gptq"

   "static_groups": false,
   "sym": true,
   "true_sequential": true,
+  "model_name_or_path": "Qwen-7B-125m-4bit-128g",
   "model_file_base_name": "gptq_model-4bit-128g",
   "is_marlin_format": false,
   "quant_method": "gptq"