zhaospei committed on
Commit
9c69fb4
·
verified ·
1 Parent(s): eb3ec06

Upload config

Browse files
Files changed (1) hide show
  1. config.json +11 -13
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "zhaospei/hinny-coder-6.7b-java",
3
  "architectures": [
4
  "LlamaForCausalLM"
5
  ],
@@ -18,18 +18,16 @@
18
  "num_key_value_heads": 32,
19
  "pretraining_tp": 1,
20
  "quantization_config": {
21
- "_load_in_4bit": false,
22
- "_load_in_8bit": true,
23
- "bnb_4bit_compute_dtype": "float32",
24
- "bnb_4bit_quant_type": "nf4",
25
- "bnb_4bit_use_double_quant": true,
26
- "llm_int8_enable_fp32_cpu_offload": false,
27
- "llm_int8_has_fp16_weight": false,
28
- "llm_int8_skip_modules": null,
29
- "llm_int8_threshold": 6.0,
30
- "load_in_4bit": false,
31
- "load_in_8bit": true,
32
- "quant_method": "bitsandbytes"
33
  },
34
  "rms_norm_eps": 1e-06,
35
  "rope_scaling": {
 
1
  {
2
+ "_name_or_path": "hinny-coder/quant-hinny-coder-6.7b-java",
3
  "architectures": [
4
  "LlamaForCausalLM"
5
  ],
 
18
  "num_key_value_heads": 32,
19
  "pretraining_tp": 1,
20
  "quantization_config": {
21
+ "backend": "llm-awq",
22
+ "bits": 4,
23
+ "do_fuse": false,
24
+ "fuse_max_seq_len": null,
25
+ "group_size": 128,
26
+ "modules_to_fuse": null,
27
+ "modules_to_not_convert": null,
28
+ "quant_method": "awq",
29
+ "version": "gemm",
30
+ "zero_point": true
 
 
31
  },
32
  "rms_norm_eps": 1e-06,
33
  "rope_scaling": {