nm-autobot
committed on
Upload folder using huggingface_hub
Browse files
- config.json +1 -1
- model.safetensors +1 -1
- recipe.yaml +1 -2
config.json
CHANGED
@@ -51,7 +51,7 @@
|
|
51 |
"quantization_status": "compressed",
|
52 |
"sparsity_config": {
|
53 |
"format": "dense",
|
54 |
-
"global_sparsity": 0.
|
55 |
"ignore": [
|
56 |
"lm_head"
|
57 |
],
|
|
|
51 |
"quantization_status": "compressed",
|
52 |
"sparsity_config": {
|
53 |
"format": "dense",
|
54 |
+
"global_sparsity": 0.45357336616227273,
|
55 |
"ignore": [
|
56 |
"lm_head"
|
57 |
],
|
model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 626506392
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fd7a041519eb0710a1676020d8bf538f961d7f77bb2392ed001cb0f2bef707c2
|
3 |
size 626506392
|
recipe.yaml
CHANGED
@@ -1,8 +1,7 @@
|
|
1 |
sparsity_stage:
|
2 |
sparsity_modifiers:
|
3 |
SparseGPTModifier: {sparsity: 0.5, mask_structure: '2:4', sequential_update: false}
|
4 |
-
run_type: &id001 !!python/object/apply:
|
5 |
-
ONESHOT]
|
6 |
quantization_stage:
|
7 |
quantization_modifiers:
|
8 |
GPTQModifier:
|
|
|
1 |
sparsity_stage:
|
2 |
sparsity_modifiers:
|
3 |
SparseGPTModifier: {sparsity: 0.5, mask_structure: '2:4', sequential_update: false}
|
4 |
+
run_type: &id001 !!python/object/apply:llmcompressor.recipe.stage.StageRunType [oneshot]
|
|
|
5 |
quantization_stage:
|
6 |
quantization_modifiers:
|
7 |
GPTQModifier:
|