wejoncy committed
Commit
fc1d262
1 Parent(s): 84d1f32

update config

Files changed (1)
  1. config.json +14 -13
config.json CHANGED
@@ -16,7 +16,16 @@
  "num_attention_heads": 40,
  "num_hidden_layers": 48,
  "num_key_value_heads": 8,
- "quant_config": {
+ "rms_norm_eps": 1e-06,
+ "rope_theta": 1000000.0,
+ "sliding_window": null,
+ "tie_word_embeddings": false,
+ "torch_dtype": "bfloat16",
+ "transformers_version": "4.45.1",
+ "use_cache": true,
+ "use_sliding_window": false,
+ "vocab_size": 152064,
+ "quantization_config": {
  "model.layers.0.mlp.down_proj": {
  "bias": null,
  "enable_norm": true,
@@ -8080,15 +8089,7 @@
  -1,
  8
  ]
- }
- },
- "rms_norm_eps": 1e-06,
- "rope_theta": 1000000.0,
- "sliding_window": null,
- "tie_word_embeddings": false,
- "torch_dtype": "bfloat16",
- "transformers_version": "4.45.1",
- "use_cache": true,
- "use_sliding_window": false,
- "vocab_size": 152064
- }
+ },
+ "quant_method": "vptq"
+ }
+ }
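In effect, the commit renames the top-level "quant_config" key to "quantization_config", moves it after the other model fields, and adds an explicit "quant_method": "vptq" entry; "quantization_config" is the key transformers inspects when loading a quantized checkpoint. A minimal sketch of how the updated config surfaces downstream, assuming a hypothetical repo id (the commit page does not name the model repository):

from transformers import AutoConfig

# Hypothetical repo id, for illustration only.
config = AutoConfig.from_pretrained("org/model-vptq")

# After this commit the per-layer quantization settings live under
# `quantization_config` and declare their method explicitly.
print(config.quantization_config["quant_method"])  # expected: "vptq"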