nm-autobot committed on
Commit
cf51837
·
verified ·
1 Parent(s): ad658e5

Upload folder using huggingface_hub

Browse files
Files changed (4) hide show
  1. config.json +2 -2
  2. generation_config.json +1 -1
  3. model.safetensors +1 -1
  4. recipe.yaml +1 -2
config.json CHANGED
@@ -51,7 +51,7 @@
51
  "quantization_status": "compressed",
52
  "sparsity_config": {
53
  "format": "dense",
54
- "global_sparsity": 0.45357314542111843,
55
  "ignore": [
56
  "lm_head"
57
  ],
@@ -67,7 +67,7 @@
67
  "rope_theta": 10000.0,
68
  "tie_word_embeddings": false,
69
  "torch_dtype": "bfloat16",
70
- "transformers_version": "4.47.0",
71
  "use_cache": true,
72
  "vocab_size": 32000
73
  }
 
51
  "quantization_status": "compressed",
52
  "sparsity_config": {
53
  "format": "dense",
54
+ "global_sparsity": 0.45357336616227273,
55
  "ignore": [
56
  "lm_head"
57
  ],
 
67
  "rope_theta": 10000.0,
68
  "tie_word_embeddings": false,
69
  "torch_dtype": "bfloat16",
70
+ "transformers_version": "4.47.1",
71
  "use_cache": true,
72
  "vocab_size": 32000
73
  }
generation_config.json CHANGED
@@ -3,5 +3,5 @@
3
  "eos_token_id": 2,
4
  "max_length": 2048,
5
  "pad_token_id": 0,
6
- "transformers_version": "4.47.0"
7
  }
 
3
  "eos_token_id": 2,
4
  "max_length": 2048,
5
  "pad_token_id": 0,
6
+ "transformers_version": "4.47.1"
7
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cf5127ce6ddab4186b303b90b89201d53ccce52a214ba34ae704a72509dbe6a3
3
  size 626506392
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fd7a041519eb0710a1676020d8bf538f961d7f77bb2392ed001cb0f2bef707c2
3
  size 626506392
recipe.yaml CHANGED
@@ -1,8 +1,7 @@
1
  sparsity_stage:
2
  sparsity_modifiers:
3
  SparseGPTModifier: {sparsity: 0.5, mask_structure: '2:4', sequential_update: false}
4
- run_type: &id001 !!python/object/apply:builtins.getattr [!!python/name:llmcompressor.recipe.stage.StageRunType '',
5
- ONESHOT]
6
  quantization_stage:
7
  quantization_modifiers:
8
  GPTQModifier:
 
1
  sparsity_stage:
2
  sparsity_modifiers:
3
  SparseGPTModifier: {sparsity: 0.5, mask_structure: '2:4', sequential_update: false}
4
+ run_type: &id001 !!python/object/apply:llmcompressor.recipe.stage.StageRunType [oneshot]
 
5
  quantization_stage:
6
  quantization_modifiers:
7
  GPTQModifier: