zephyr-3b-corrections / lit_config.json
Uploaded by zabirauf in commit df4206b ("Finetuned model").
{"name": "stablelm-zephyr-3b", "hf_config": {"org": "stabilityai", "name": "stablelm-zephyr-3b"}, "block_size": 4096, "vocab_size": 50254, "padding_multiple": 512, "padded_vocab_size": 50304, "n_layer": 32, "n_head": 32, "n_embd": 2560, "rotary_percentage": 0.25, "parallel_residual": false, "bias": false, "lm_head_bias": false, "n_query_groups": 32, "shared_attention_norm": false, "_norm_class": "LayerNorm", "norm_eps": 1e-05, "_mlp_class": "LLaMAMLP", "gelu_approximate": "none", "intermediate_size": 6912, "rope_condense_ratio": 1, "rope_base": 10000}