TheBloke committed on
Commit
7048b2a
1 Parent(s): fefa499

Update for Transformers AWQ support

Browse files
Files changed (1) hide show
  1. config.json +9 -2
config.json CHANGED
@@ -21,5 +21,12 @@
21
  "torch_dtype": "bfloat16",
22
  "transformers_version": "4.34.0.dev0",
23
  "use_cache": true,
24
- "vocab_size": 32002
25
- }
 
 
 
 
 
 
 
 
21
  "torch_dtype": "bfloat16",
22
  "transformers_version": "4.34.0.dev0",
23
  "use_cache": true,
24
+ "vocab_size": 32002,
25
+ "quantization_config": {
26
+ "quant_method": "awq",
27
+ "zero_point": true,
28
+ "group_size": 128,
29
+ "bits": 4,
30
+ "version": "gemm"
31
+ }
32
+ }