Rypo committed on
Commit
93f8de0
·
1 Parent(s): f7884c8

skip norm quantization for numerical stability

Browse files
Files changed (2) hide show
  1. config.json +3 -1
  2. model.safetensors +2 -2
config.json CHANGED
@@ -25,7 +25,9 @@
25
  "bnb_4bit_use_double_quant": false,
26
  "llm_int8_enable_fp32_cpu_offload": false,
27
  "llm_int8_has_fp16_weight": false,
28
- "llm_int8_skip_modules": null,
 
 
29
  "llm_int8_threshold": 6.0,
30
  "load_in_4bit": false,
31
  "load_in_8bit": true,
 
25
  "bnb_4bit_use_double_quant": false,
26
  "llm_int8_enable_fp32_cpu_offload": false,
27
  "llm_int8_has_fp16_weight": false,
28
+ "llm_int8_skip_modules": [
29
+ "norm"
30
+ ],
31
  "llm_int8_threshold": 6.0,
32
  "load_in_4bit": false,
33
  "load_in_8bit": true,
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:976985e04c6a7d7a55acc42585adb385cccc8fcfd3bea9b459a44f31fe5874fe
3
- size 4515716454
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:032da9545114d606c57ecc59b236b51681a221ff1e612366a6de63f4d617831f
3
+ size 4091577134