test_stage:
  obcq_modifiers:
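    # Equalize activation ranges before quantization: fold scale from the
    # attention (c_attn) and MLP (c_fc) inputs into the preceding LayerNorms
    # (ln_1, ln_2). Each mapping pairs a list of target-layer regexes with
    # the layer that absorbs the scales.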
    LogarithmicEqualizationModifier:
      mappings:
      - - - re:.*c_attn
        - re:.*ln_1
      - - - re:.*c_fc
        - re:.*ln_2
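    # Quantize to INT8, skipping layer types typically left in full
    # precision (Dropout, LayerNorm, GELU) plus individual c_fc layers
    # excluded by name (commonly layers found to be quantization-sensitive).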
    QuantizationModifier:
      ignore:
      - Dropout
      - LayerNorm
      - PytorchGELUTanh
      - transformer.h.10.mlp.c_fc
      - transformer.h.13.mlp.c_fc
      - transformer.h.15.mlp.c_fc
      - transformer.h.14.mlp.c_fc
      - transformer.h.17.mlp.c_fc
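      # Re-calibrate after the one-shot pass; override the default scheme so
      # Linear weights use channel-wise symmetric INT8 and Embeddings use
      # asymmetric INT8 weights with activations left unquantized.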
      post_oneshot_calibration: true
      scheme_overrides:
        Linear:
          weights:
            num_bits: 8
            symmetric: true
            strategy: channel
        Embedding:
          input_activations: null
          weights:
            num_bits: 8
            symmetric: false
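    # Prune each matched transformer block to 50% unstructured sparsity
    # ("0:0" mask) with SparseGPT, updating one block at a time
    # (sequential_update) and quantizing alongside pruning.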
    SparseGPTModifier:
      sparsity: 0.5
      block_size: 128
      sequential_update: true
      quantize: true
      percdamp: 0.01
      mask_structure: "0:0"
      targets:
      - re:transformer.h.\d*$
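
# A minimal sketch of applying this recipe one-shot via SparseML's Python
# API; the entrypoint and argument names assume a recent SparseML release,
# and the model/dataset ids below are placeholders, not part of the recipe:
#
#   from sparseml.transformers import oneshot
#
#   oneshot(
#       model="gpt2",              # placeholder GPT-2-style model stub
#       dataset="open_platypus",   # placeholder calibration dataset
#       recipe="recipe.yaml",      # path to this file
#       output_dir="./obcq_out",
#   )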