{
  "d_model": 4096,
  "ssm_cfg": {
    "expand": 1
  },
  "rms_norm_eps": 1e-05,
  "vocab_size": null,
  "d_xb": 1024,
  "intermediate_size": 14336,
  "hidden_act": "silu",
  "n_layer": 32,
  "attn_layers": [
    3,
    7,
    11,
    15,
    19,
    23,
    27,
    31
  ]
}
{
  "d_model": 4096,
  "ssm_cfg": {
    "expand": 1
  },
  "rms_norm_eps": 1e-05,
  "vocab_size": null,
  "d_xb": 1024,
  "intermediate_size": 14336,
  "hidden_act": "silu",
  "n_layer": 32,
  "attn_layers": [
    3,
    7,
    11,
    15,
    19,
    23,
    27,
    31
  ]
}