File size: 415 Bytes
a1e9275 d2910bb a1e9275 d2910bb |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 |
{
"architectures": [
"MistralForCausalLM"
],
"max_position_embeddings": 2048,
"hidden_size": 4096,
"num_attention_heads": 32,
"num_hidden_layers": 32,
"vocab_size": 50257,
"model_type": "mistral", # <- Important key!
"use_cache": true,
"n_head": 32,
"n_layer": 32,
"n_positions": 2048,
"initializer_range": 0.02,
"layer_norm_epsilon": 1e-5,
"attention_probs_dropout_prob": 0.1
}
|