Rasphi-MoE-Instruct-Unfinetuned / model.safetensors.index.json
QuietImpostor's picture
Upload Rasphi
90b90f6 verified
raw
history blame
220 kB
{
"metadata": {
"format": "pt"
},
"weight_map": {
"lm_head.bias": "model-00000-of-00008.safetensors",
"lm_head.weight": "model-00000-of-00008.safetensors",
"model.reasoning_embed_tokens.weight": "model-00000-of-00008.safetensors",
"model.content_embed_tokens.weight": "model-00000-of-00008.safetensors",
"model.layers.0.reasoning_moe.experts.0.w1.weight": "model-00000-of-00008.safetensors",
"model.layers.0.content_moe.experts.0.w1.weight": "model-00000-of-00008.safetensors",
"model.layers.0.reasoning_moe.experts.0.w2.weight": "model-00000-of-00008.safetensors",
"model.layers.0.content_moe.experts.0.w2.weight": "model-00000-of-00008.safetensors",
"model.layers.0.reasoning_moe.experts.0.w3.weight": "model-00000-of-00008.safetensors",
"model.layers.0.content_moe.experts.0.w3.weight": "model-00000-of-00008.safetensors",
"model.layers.0.reasoning_moe.experts.1.w1.weight": "model-00000-of-00008.safetensors",
"model.layers.0.content_moe.experts.1.w1.weight": "model-00000-of-00008.safetensors",
"model.layers.0.reasoning_moe.experts.1.w2.weight": "model-00000-of-00008.safetensors",
"model.layers.0.content_moe.experts.1.w2.weight": "model-00000-of-00008.safetensors",
"model.layers.0.reasoning_moe.experts.1.w3.weight": "model-00000-of-00008.safetensors",
"model.layers.0.content_moe.experts.1.w3.weight": "model-00000-of-00008.safetensors",
"model.layers.0.reasoning_moe.experts.2.w1.weight": "model-00000-of-00008.safetensors",
"model.layers.0.content_moe.experts.2.w1.weight": "model-00000-of-00008.safetensors",
"model.layers.0.reasoning_moe.experts.2.w2.weight": "model-00000-of-00008.safetensors",
"model.layers.0.content_moe.experts.2.w2.weight": "model-00000-of-00008.safetensors",
"model.layers.0.reasoning_moe.experts.2.w3.weight": "model-00000-of-00008.safetensors",
"model.layers.0.content_moe.experts.2.w3.weight": "model-00000-of-00008.safetensors",
"model.layers.0.reasoning_moe.experts.3.w1.weight": "model-00000-of-00008.safetensors",
"model.layers.0.content_moe.experts.3.w1.weight": "model-00000-of-00008.safetensors",
"model.layers.0.reasoning_moe.experts.3.w2.weight": "model-00000-of-00008.safetensors",
"model.layers.0.content_moe.experts.3.w2.weight": "model-00000-of-00008.safetensors",
"model.layers.0.reasoning_moe.experts.3.w3.weight": "model-00000-of-00008.safetensors",
"model.layers.0.content_moe.experts.3.w3.weight": "model-00000-of-00008.safetensors",
"model.layers.0.reasoning_moe.experts.4.w1.weight": "model-00000-of-00008.safetensors",
"model.layers.0.content_moe.experts.4.w1.weight": "model-00000-of-00008.safetensors",
"model.layers.0.reasoning_moe.experts.4.w2.weight": "model-00000-of-00008.safetensors",
"model.layers.0.content_moe.experts.4.w2.weight": "model-00000-of-00008.safetensors",
"model.layers.0.reasoning_moe.experts.4.w3.weight": "model-00000-of-00008.safetensors",
"model.layers.0.content_moe.experts.4.w3.weight": "model-00000-of-00008.safetensors",
"model.layers.0.reasoning_moe.experts.5.w1.weight": "model-00000-of-00008.safetensors",
"model.layers.0.content_moe.experts.5.w1.weight": "model-00000-of-00008.safetensors",
"model.layers.0.reasoning_moe.experts.5.w2.weight": "model-00000-of-00008.safetensors",
"model.layers.0.content_moe.experts.5.w2.weight": "model-00000-of-00008.safetensors",
"model.layers.0.reasoning_moe.experts.5.w3.weight": "model-00000-of-00008.safetensors",
"model.layers.0.content_moe.experts.5.w3.weight": "model-00000-of-00008.safetensors",
"model.layers.0.reasoning_moe.experts.6.w1.weight": "model-00000-of-00008.safetensors",
"model.layers.0.content_moe.experts.6.w1.weight": "model-00000-of-00008.safetensors",
"model.layers.0.reasoning_moe.experts.6.w2.weight": "model-00000-of-00008.safetensors",
"model.layers.0.content_moe.experts.6.w2.weight": "model-00000-of-00008.safetensors",
"model.layers.0.reasoning_moe.experts.6.w3.weight": "model-00000-of-00008.safetensors",
"model.layers.0.content_moe.experts.6.w3.weight": "model-00000-of-00008.safetensors",
"model.layers.0.reasoning_moe.experts.7.w1.weight": "model-00000-of-00008.safetensors",
"model.layers.0.content_moe.experts.7.w1.weight": "model-00000-of-00008.safetensors",
"model.layers.0.reasoning_moe.experts.7.w2.weight": "model-00000-of-00008.safetensors",
"model.layers.0.content_moe.experts.7.w2.weight": "model-00000-of-00008.safetensors",
"model.layers.0.reasoning_moe.experts.7.w3.weight": "model-00000-of-00008.safetensors",
"model.layers.0.content_moe.experts.7.w3.weight": "model-00000-of-00008.safetensors",
"model.layers.0.reasoning_moe.gate.weight": "model-00000-of-00008.safetensors",
"model.layers.0.content_moe.gate.weight": "model-00000-of-00008.safetensors",
"model.layers.0.input_reasoning_layernorm.bias": "model-00000-of-00008.safetensors",
"model.layers.0.input_content_layernorm.bias": "model-00000-of-00008.safetensors",
"model.layers.0.input_reasoning_layernorm.weight": "model-00000-of-00008.safetensors",
"model.layers.0.input_content_layernorm.weight": "model-00000-of-00008.safetensors",
"model.layers.0.post_attention_reasoning_layernorm.bias": "model-00000-of-00008.safetensors",
"model.layers.0.post_attention_content_layernorm.bias": "model-00000-of-00008.safetensors",
"model.layers.0.post_attention_reasoning_layernorm.weight": "model-00000-of-00008.safetensors",
"model.layers.0.post_attention_content_layernorm.weight": "model-00000-of-00008.safetensors",
"model.layers.0.reasoning_self_attn.k_proj.bias": "model-00000-of-00008.safetensors",
"model.layers.0.content_self_attn.k_proj.bias": "model-00000-of-00008.safetensors",
"model.layers.0.reasoning_self_attn.k_proj.weight": "model-00000-of-00008.safetensors",
"model.layers.0.content_self_attn.k_proj.weight": "model-00000-of-00008.safetensors",
"model.layers.0.reasoning_self_attn.o_proj.bias": "model-00000-of-00008.safetensors",
"model.layers.0.content_self_attn.o_proj.bias": "model-00000-of-00008.safetensors",
"model.layers.0.reasoning_self_attn.o_proj.weight": "model-00000-of-00008.safetensors",
"model.layers.0.content_self_attn.o_proj.weight": "model-00000-of-00008.safetensors",
"model.layers.0.reasoning_self_attn.q_proj.bias": "model-00000-of-00008.safetensors",
"model.layers.0.content_self_attn.q_proj.bias": "model-00000-of-00008.safetensors",
"model.layers.0.reasoning_self_attn.q_proj.weight": "model-00000-of-00008.safetensors",
"model.layers.0.content_self_attn.q_proj.weight": "model-00000-of-00008.safetensors",
"model.layers.0.reasoning_self_attn.v_proj.bias": "model-00000-of-00008.safetensors",
"model.layers.0.content_self_attn.v_proj.bias": "model-00000-of-00008.safetensors",
"model.layers.0.reasoning_self_attn.v_proj.weight": "model-00000-of-00008.safetensors",
"model.layers.0.content_self_attn.v_proj.weight": "model-00000-of-00008.safetensors",
"model.layers.1.reasoning_moe.experts.0.w1.weight": "model-00000-of-00008.safetensors",
"model.layers.1.content_moe.experts.0.w1.weight": "model-00000-of-00008.safetensors",
"model.layers.1.reasoning_moe.experts.0.w2.weight": "model-00000-of-00008.safetensors",
"model.layers.1.content_moe.experts.0.w2.weight": "model-00000-of-00008.safetensors",
"model.layers.1.reasoning_moe.experts.0.w3.weight": "model-00000-of-00008.safetensors",
"model.layers.1.content_moe.experts.0.w3.weight": "model-00000-of-00008.safetensors",
"model.layers.1.reasoning_moe.experts.1.w1.weight": "model-00000-of-00008.safetensors",
"model.layers.1.content_moe.experts.1.w1.weight": "model-00000-of-00008.safetensors",
"model.layers.1.reasoning_moe.experts.1.w2.weight": "model-00000-of-00008.safetensors",
"model.layers.1.content_moe.experts.1.w2.weight": "model-00000-of-00008.safetensors",
"model.layers.1.reasoning_moe.experts.1.w3.weight": "model-00000-of-00008.safetensors",
"model.layers.1.content_moe.experts.1.w3.weight": "model-00000-of-00008.safetensors",
"model.layers.1.reasoning_moe.experts.2.w1.weight": "model-00000-of-00008.safetensors",
"model.layers.1.content_moe.experts.2.w1.weight": "model-00000-of-00008.safetensors",
"model.layers.1.reasoning_moe.experts.2.w2.weight": "model-00000-of-00008.safetensors",
"model.layers.1.content_moe.experts.2.w2.weight": "model-00000-of-00008.safetensors",
"model.layers.1.reasoning_moe.experts.2.w3.weight": "model-00000-of-00008.safetensors",
"model.layers.1.content_moe.experts.2.w3.weight": "model-00000-of-00008.safetensors",
"model.layers.1.reasoning_moe.experts.3.w1.weight": "model-00000-of-00008.safetensors",
"model.layers.1.content_moe.experts.3.w1.weight": "model-00000-of-00008.safetensors",
"model.layers.1.reasoning_moe.experts.3.w2.weight": "model-00000-of-00008.safetensors",
"model.layers.1.content_moe.experts.3.w2.weight": "model-00000-of-00008.safetensors",
"model.layers.1.reasoning_moe.experts.3.w3.weight": "model-00000-of-00008.safetensors",
"model.layers.1.content_moe.experts.3.w3.weight": "model-00000-of-00008.safetensors",
"model.layers.1.reasoning_moe.experts.4.w1.weight": "model-00000-of-00008.safetensors",
"model.layers.1.content_moe.experts.4.w1.weight": "model-00000-of-00008.safetensors",
"model.layers.1.reasoning_moe.experts.4.w2.weight": "model-00000-of-00008.safetensors",
"model.layers.1.content_moe.experts.4.w2.weight": "model-00000-of-00008.safetensors",
"model.layers.1.reasoning_moe.experts.4.w3.weight": "model-00000-of-00008.safetensors",
"model.layers.1.content_moe.experts.4.w3.weight": "model-00000-of-00008.safetensors",
"model.layers.1.reasoning_moe.experts.5.w1.weight": "model-00000-of-00008.safetensors",
"model.layers.1.content_moe.experts.5.w1.weight": "model-00000-of-00008.safetensors",
"model.layers.1.reasoning_moe.experts.5.w2.weight": "model-00000-of-00008.safetensors",
"model.layers.1.content_moe.experts.5.w2.weight": "model-00000-of-00008.safetensors",
"model.layers.1.reasoning_moe.experts.5.w3.weight": "model-00000-of-00008.safetensors",
"model.layers.1.content_moe.experts.5.w3.weight": "model-00000-of-00008.safetensors",
"model.layers.1.reasoning_moe.experts.6.w1.weight": "model-00000-of-00008.safetensors",
"model.layers.1.content_moe.experts.6.w1.weight": "model-00000-of-00008.safetensors",
"model.layers.1.reasoning_moe.experts.6.w2.weight": "model-00000-of-00008.safetensors",
"model.layers.1.content_moe.experts.6.w2.weight": "model-00000-of-00008.safetensors",
"model.layers.1.reasoning_moe.experts.6.w3.weight": "model-00000-of-00008.safetensors",
"model.layers.1.content_moe.experts.6.w3.weight": "model-00000-of-00008.safetensors",
"model.layers.1.reasoning_moe.experts.7.w1.weight": "model-00000-of-00008.safetensors",
"model.layers.1.content_moe.experts.7.w1.weight": "model-00000-of-00008.safetensors",
"model.layers.1.reasoning_moe.experts.7.w2.weight": "model-00000-of-00008.safetensors",
"model.layers.1.content_moe.experts.7.w2.weight": "model-00000-of-00008.safetensors",
"model.layers.1.reasoning_moe.experts.7.w3.weight": "model-00000-of-00008.safetensors",
"model.layers.1.content_moe.experts.7.w3.weight": "model-00000-of-00008.safetensors",
"model.layers.1.reasoning_moe.gate.weight": "model-00000-of-00008.safetensors",
"model.layers.1.content_moe.gate.weight": "model-00000-of-00008.safetensors",
"model.layers.1.input_reasoning_layernorm.bias": "model-00000-of-00008.safetensors",
"model.layers.1.input_content_layernorm.bias": "model-00000-of-00008.safetensors",
"model.layers.1.input_reasoning_layernorm.weight": "model-00000-of-00008.safetensors",
"model.layers.1.input_content_layernorm.weight": "model-00000-of-00008.safetensors",
"model.layers.1.post_attention_reasoning_layernorm.bias": "model-00000-of-00008.safetensors",
"model.layers.1.post_attention_content_layernorm.bias": "model-00000-of-00008.safetensors",
"model.layers.1.post_attention_reasoning_layernorm.weight": "model-00000-of-00008.safetensors",
"model.layers.1.post_attention_content_layernorm.weight": "model-00000-of-00008.safetensors",
"model.layers.1.reasoning_self_attn.k_proj.bias": "model-00000-of-00008.safetensors",
"model.layers.1.content_self_attn.k_proj.bias": "model-00000-of-00008.safetensors",
"model.layers.1.reasoning_self_attn.k_proj.weight": "model-00000-of-00008.safetensors",
"model.layers.1.content_self_attn.k_proj.weight": "model-00000-of-00008.safetensors",
"model.layers.1.reasoning_self_attn.o_proj.bias": "model-00000-of-00008.safetensors",
"model.layers.1.content_self_attn.o_proj.bias": "model-00000-of-00008.safetensors",
"model.layers.1.reasoning_self_attn.o_proj.weight": "model-00000-of-00008.safetensors",
"model.layers.1.content_self_attn.o_proj.weight": "model-00000-of-00008.safetensors",
"model.layers.1.reasoning_self_attn.q_proj.bias": "model-00000-of-00008.safetensors",
"model.layers.1.content_self_attn.q_proj.bias": "model-00000-of-00008.safetensors",
"model.layers.1.reasoning_self_attn.q_proj.weight": "model-00000-of-00008.safetensors",
"model.layers.1.content_self_attn.q_proj.weight": "model-00000-of-00008.safetensors",
"model.layers.1.reasoning_self_attn.v_proj.bias": "model-00000-of-00008.safetensors",
"model.layers.1.content_self_attn.v_proj.bias": "model-00000-of-00008.safetensors",
"model.layers.1.reasoning_self_attn.v_proj.weight": "model-00000-of-00008.safetensors",
"model.layers.1.content_self_attn.v_proj.weight": "model-00000-of-00008.safetensors",
"model.layers.10.reasoning_moe.experts.0.w1.weight": "model-00000-of-00008.safetensors",
"model.layers.10.content_moe.experts.0.w1.weight": "model-00000-of-00008.safetensors",
"model.layers.10.reasoning_moe.experts.0.w2.weight": "model-00000-of-00008.safetensors",
"model.layers.10.content_moe.experts.0.w2.weight": "model-00000-of-00008.safetensors",
"model.layers.10.reasoning_moe.experts.0.w3.weight": "model-00000-of-00008.safetensors",
"model.layers.10.content_moe.experts.0.w3.weight": "model-00000-of-00008.safetensors",
"model.layers.10.reasoning_moe.experts.1.w1.weight": "model-00000-of-00008.safetensors",
"model.layers.10.content_moe.experts.1.w1.weight": "model-00000-of-00008.safetensors",
"model.layers.10.reasoning_moe.experts.1.w2.weight": "model-00000-of-00008.safetensors",
"model.layers.10.content_moe.experts.1.w2.weight": "model-00000-of-00008.safetensors",
"model.layers.10.reasoning_moe.experts.1.w3.weight": "model-00000-of-00008.safetensors",
"model.layers.10.content_moe.experts.1.w3.weight": "model-00000-of-00008.safetensors",
"model.layers.10.reasoning_moe.experts.2.w1.weight": "model-00000-of-00008.safetensors",
"model.layers.10.content_moe.experts.2.w1.weight": "model-00000-of-00008.safetensors",
"model.layers.10.reasoning_moe.experts.2.w2.weight": "model-00000-of-00008.safetensors",
"model.layers.10.content_moe.experts.2.w2.weight": "model-00000-of-00008.safetensors",
"model.layers.10.reasoning_moe.experts.2.w3.weight": "model-00000-of-00008.safetensors",
"model.layers.10.content_moe.experts.2.w3.weight": "model-00000-of-00008.safetensors",
"model.layers.10.reasoning_moe.experts.3.w1.weight": "model-00000-of-00008.safetensors",
"model.layers.10.content_moe.experts.3.w1.weight": "model-00000-of-00008.safetensors",
"model.layers.10.reasoning_moe.experts.3.w2.weight": "model-00000-of-00008.safetensors",
"model.layers.10.content_moe.experts.3.w2.weight": "model-00000-of-00008.safetensors",
"model.layers.10.reasoning_moe.experts.3.w3.weight": "model-00000-of-00008.safetensors",
"model.layers.10.content_moe.experts.3.w3.weight": "model-00000-of-00008.safetensors",
"model.layers.10.reasoning_moe.experts.4.w1.weight": "model-00000-of-00008.safetensors",
"model.layers.10.content_moe.experts.4.w1.weight": "model-00000-of-00008.safetensors",
"model.layers.10.reasoning_moe.experts.4.w2.weight": "model-00000-of-00008.safetensors",
"model.layers.10.content_moe.experts.4.w2.weight": "model-00000-of-00008.safetensors",
"model.layers.10.reasoning_moe.experts.4.w3.weight": "model-00000-of-00008.safetensors",
"model.layers.10.content_moe.experts.4.w3.weight": "model-00000-of-00008.safetensors",
"model.layers.10.reasoning_moe.experts.5.w1.weight": "model-00000-of-00008.safetensors",
"model.layers.10.content_moe.experts.5.w1.weight": "model-00000-of-00008.safetensors",
"model.layers.10.reasoning_moe.experts.5.w2.weight": "model-00000-of-00008.safetensors",
"model.layers.10.content_moe.experts.5.w2.weight": "model-00000-of-00008.safetensors",
"model.layers.10.reasoning_moe.experts.5.w3.weight": "model-00000-of-00008.safetensors",
"model.layers.10.content_moe.experts.5.w3.weight": "model-00000-of-00008.safetensors",
"model.layers.10.reasoning_moe.experts.6.w1.weight": "model-00000-of-00008.safetensors",
"model.layers.10.content_moe.experts.6.w1.weight": "model-00000-of-00008.safetensors",
"model.layers.10.reasoning_moe.experts.6.w2.weight": "model-00000-of-00008.safetensors",
"model.layers.10.content_moe.experts.6.w2.weight": "model-00000-of-00008.safetensors",
"model.layers.10.reasoning_moe.experts.6.w3.weight": "model-00000-of-00008.safetensors",
"model.layers.10.content_moe.experts.6.w3.weight": "model-00000-of-00008.safetensors",
"model.layers.10.reasoning_moe.experts.7.w1.weight": "model-00000-of-00008.safetensors",
"model.layers.10.content_moe.experts.7.w1.weight": "model-00000-of-00008.safetensors",
"model.layers.10.reasoning_moe.experts.7.w2.weight": "model-00000-of-00008.safetensors",
"model.layers.10.content_moe.experts.7.w2.weight": "model-00000-of-00008.safetensors",
"model.layers.10.reasoning_moe.experts.7.w3.weight": "model-00000-of-00008.safetensors",
"model.layers.10.content_moe.experts.7.w3.weight": "model-00000-of-00008.safetensors",
"model.layers.10.reasoning_moe.gate.weight": "model-00000-of-00008.safetensors",
"model.layers.10.content_moe.gate.weight": "model-00000-of-00008.safetensors",
"model.layers.10.input_reasoning_layernorm.bias": "model-00000-of-00008.safetensors",
"model.layers.10.input_content_layernorm.bias": "model-00000-of-00008.safetensors",
"model.layers.10.input_reasoning_layernorm.weight": "model-00000-of-00008.safetensors",
"model.layers.10.input_content_layernorm.weight": "model-00000-of-00008.safetensors",
"model.layers.10.post_attention_reasoning_layernorm.bias": "model-00000-of-00008.safetensors",
"model.layers.10.post_attention_content_layernorm.bias": "model-00000-of-00008.safetensors",
"model.layers.10.post_attention_reasoning_layernorm.weight": "model-00000-of-00008.safetensors",
"model.layers.10.post_attention_content_layernorm.weight": "model-00000-of-00008.safetensors",
"model.layers.10.reasoning_self_attn.k_proj.bias": "model-00000-of-00008.safetensors",
"model.layers.10.content_self_attn.k_proj.bias": "model-00000-of-00008.safetensors",
"model.layers.10.reasoning_self_attn.k_proj.weight": "model-00000-of-00008.safetensors",
"model.layers.10.content_self_attn.k_proj.weight": "model-00000-of-00008.safetensors",
"model.layers.10.reasoning_self_attn.o_proj.bias": "model-00000-of-00008.safetensors",
"model.layers.10.content_self_attn.o_proj.bias": "model-00000-of-00008.safetensors",
"model.layers.10.reasoning_self_attn.o_proj.weight": "model-00000-of-00008.safetensors",
"model.layers.10.content_self_attn.o_proj.weight": "model-00000-of-00008.safetensors",
"model.layers.10.reasoning_self_attn.q_proj.bias": "model-00000-of-00008.safetensors",
"model.layers.10.content_self_attn.q_proj.bias": "model-00000-of-00008.safetensors",
"model.layers.10.reasoning_self_attn.q_proj.weight": "model-00000-of-00008.safetensors",
"model.layers.10.content_self_attn.q_proj.weight": "model-00000-of-00008.safetensors",
"model.layers.10.reasoning_self_attn.v_proj.bias": "model-00000-of-00008.safetensors",
"model.layers.10.content_self_attn.v_proj.bias": "model-00000-of-00008.safetensors",
"model.layers.10.reasoning_self_attn.v_proj.weight": "model-00000-of-00008.safetensors",
"model.layers.10.content_self_attn.v_proj.weight": "model-00000-of-00008.safetensors",
"model.layers.11.reasoning_moe.experts.0.w1.weight": "model-00000-of-00008.safetensors",
"model.layers.11.content_moe.experts.0.w1.weight": "model-00000-of-00008.safetensors",
"model.layers.11.reasoning_moe.experts.0.w2.weight": "model-00000-of-00008.safetensors",
"model.layers.11.content_moe.experts.0.w2.weight": "model-00000-of-00008.safetensors",
"model.layers.11.reasoning_moe.experts.0.w3.weight": "model-00000-of-00008.safetensors",
"model.layers.11.content_moe.experts.0.w3.weight": "model-00000-of-00008.safetensors",
"model.layers.11.reasoning_moe.experts.1.w1.weight": "model-00000-of-00008.safetensors",
"model.layers.11.content_moe.experts.1.w1.weight": "model-00000-of-00008.safetensors",
"model.layers.11.reasoning_moe.experts.1.w2.weight": "model-00000-of-00008.safetensors",
"model.layers.11.content_moe.experts.1.w2.weight": "model-00000-of-00008.safetensors",
"model.layers.11.reasoning_moe.experts.1.w3.weight": "model-00000-of-00008.safetensors",
"model.layers.11.content_moe.experts.1.w3.weight": "model-00000-of-00008.safetensors",
"model.layers.11.reasoning_moe.experts.2.w1.weight": "model-00000-of-00008.safetensors",
"model.layers.11.content_moe.experts.2.w1.weight": "model-00000-of-00008.safetensors",
"model.layers.11.reasoning_moe.experts.2.w2.weight": "model-00000-of-00008.safetensors",
"model.layers.11.content_moe.experts.2.w2.weight": "model-00000-of-00008.safetensors",
"model.layers.11.reasoning_moe.experts.2.w3.weight": "model-00000-of-00008.safetensors",
"model.layers.11.content_moe.experts.2.w3.weight": "model-00000-of-00008.safetensors",
"model.layers.11.reasoning_moe.experts.3.w1.weight": "model-00000-of-00008.safetensors",
"model.layers.11.content_moe.experts.3.w1.weight": "model-00000-of-00008.safetensors",
"model.layers.11.reasoning_moe.experts.3.w2.weight": "model-00000-of-00008.safetensors",
"model.layers.11.content_moe.experts.3.w2.weight": "model-00000-of-00008.safetensors",
"model.layers.11.reasoning_moe.experts.3.w3.weight": "model-00000-of-00008.safetensors",
"model.layers.11.content_moe.experts.3.w3.weight": "model-00000-of-00008.safetensors",
"model.layers.11.reasoning_moe.experts.4.w1.weight": "model-00000-of-00008.safetensors",
"model.layers.11.content_moe.experts.4.w1.weight": "model-00000-of-00008.safetensors",
"model.layers.11.reasoning_moe.experts.4.w2.weight": "model-00000-of-00008.safetensors",
"model.layers.11.content_moe.experts.4.w2.weight": "model-00000-of-00008.safetensors",
"model.layers.11.reasoning_moe.experts.4.w3.weight": "model-00000-of-00008.safetensors",
"model.layers.11.content_moe.experts.4.w3.weight": "model-00000-of-00008.safetensors",
"model.layers.11.reasoning_moe.experts.5.w1.weight": "model-00000-of-00008.safetensors",
"model.layers.11.content_moe.experts.5.w1.weight": "model-00000-of-00008.safetensors",
"model.layers.11.reasoning_moe.experts.5.w2.weight": "model-00000-of-00008.safetensors",
"model.layers.11.content_moe.experts.5.w2.weight": "model-00000-of-00008.safetensors",
"model.layers.11.reasoning_moe.experts.5.w3.weight": "model-00000-of-00008.safetensors",
"model.layers.11.content_moe.experts.5.w3.weight": "model-00000-of-00008.safetensors",
"model.layers.11.reasoning_moe.experts.6.w1.weight": "model-00000-of-00008.safetensors",
"model.layers.11.content_moe.experts.6.w1.weight": "model-00000-of-00008.safetensors",
"model.layers.11.reasoning_moe.experts.6.w2.weight": "model-00000-of-00008.safetensors",
"model.layers.11.content_moe.experts.6.w2.weight": "model-00001-of-00008.safetensors",
"model.layers.11.reasoning_moe.experts.6.w3.weight": "model-00001-of-00008.safetensors",
"model.layers.11.content_moe.experts.6.w3.weight": "model-00001-of-00008.safetensors",
"model.layers.11.reasoning_moe.experts.7.w1.weight": "model-00001-of-00008.safetensors",
"model.layers.11.content_moe.experts.7.w1.weight": "model-00001-of-00008.safetensors",
"model.layers.11.reasoning_moe.experts.7.w2.weight": "model-00001-of-00008.safetensors",
"model.layers.11.content_moe.experts.7.w2.weight": "model-00001-of-00008.safetensors",
"model.layers.11.reasoning_moe.experts.7.w3.weight": "model-00001-of-00008.safetensors",
"model.layers.11.content_moe.experts.7.w3.weight": "model-00001-of-00008.safetensors",
"model.layers.11.reasoning_moe.gate.weight": "model-00001-of-00008.safetensors",
"model.layers.11.content_moe.gate.weight": "model-00001-of-00008.safetensors",
"model.layers.11.input_reasoning_layernorm.bias": "model-00001-of-00008.safetensors",
"model.layers.11.input_content_layernorm.bias": "model-00001-of-00008.safetensors",
"model.layers.11.input_reasoning_layernorm.weight": "model-00001-of-00008.safetensors",
"model.layers.11.input_content_layernorm.weight": "model-00001-of-00008.safetensors",
"model.layers.11.post_attention_reasoning_layernorm.bias": "model-00001-of-00008.safetensors",
"model.layers.11.post_attention_content_layernorm.bias": "model-00001-of-00008.safetensors",
"model.layers.11.post_attention_reasoning_layernorm.weight": "model-00001-of-00008.safetensors",
"model.layers.11.post_attention_content_layernorm.weight": "model-00001-of-00008.safetensors",
"model.layers.11.reasoning_self_attn.k_proj.bias": "model-00001-of-00008.safetensors",
"model.layers.11.content_self_attn.k_proj.bias": "model-00001-of-00008.safetensors",
"model.layers.11.reasoning_self_attn.k_proj.weight": "model-00001-of-00008.safetensors",
"model.layers.11.content_self_attn.k_proj.weight": "model-00001-of-00008.safetensors",
"model.layers.11.reasoning_self_attn.o_proj.bias": "model-00001-of-00008.safetensors",
"model.layers.11.content_self_attn.o_proj.bias": "model-00001-of-00008.safetensors",
"model.layers.11.reasoning_self_attn.o_proj.weight": "model-00001-of-00008.safetensors",
"model.layers.11.content_self_attn.o_proj.weight": "model-00001-of-00008.safetensors",
"model.layers.11.reasoning_self_attn.q_proj.bias": "model-00001-of-00008.safetensors",
"model.layers.11.content_self_attn.q_proj.bias": "model-00001-of-00008.safetensors",
"model.layers.11.reasoning_self_attn.q_proj.weight": "model-00001-of-00008.safetensors",
"model.layers.11.content_self_attn.q_proj.weight": "model-00001-of-00008.safetensors",
"model.layers.11.reasoning_self_attn.v_proj.bias": "model-00001-of-00008.safetensors",
"model.layers.11.content_self_attn.v_proj.bias": "model-00001-of-00008.safetensors",
"model.layers.11.reasoning_self_attn.v_proj.weight": "model-00001-of-00008.safetensors",
"model.layers.11.content_self_attn.v_proj.weight": "model-00001-of-00008.safetensors",
"model.layers.12.reasoning_moe.experts.0.w1.weight": "model-00001-of-00008.safetensors",
"model.layers.12.content_moe.experts.0.w1.weight": "model-00001-of-00008.safetensors",
"model.layers.12.reasoning_moe.experts.0.w2.weight": "model-00001-of-00008.safetensors",
"model.layers.12.content_moe.experts.0.w2.weight": "model-00001-of-00008.safetensors",
"model.layers.12.reasoning_moe.experts.0.w3.weight": "model-00001-of-00008.safetensors",
"model.layers.12.content_moe.experts.0.w3.weight": "model-00001-of-00008.safetensors",
"model.layers.12.reasoning_moe.experts.1.w1.weight": "model-00001-of-00008.safetensors",
"model.layers.12.content_moe.experts.1.w1.weight": "model-00001-of-00008.safetensors",
"model.layers.12.reasoning_moe.experts.1.w2.weight": "model-00001-of-00008.safetensors",
"model.layers.12.content_moe.experts.1.w2.weight": "model-00001-of-00008.safetensors",
"model.layers.12.reasoning_moe.experts.1.w3.weight": "model-00001-of-00008.safetensors",
"model.layers.12.content_moe.experts.1.w3.weight": "model-00001-of-00008.safetensors",
"model.layers.12.reasoning_moe.experts.2.w1.weight": "model-00001-of-00008.safetensors",
"model.layers.12.content_moe.experts.2.w1.weight": "model-00001-of-00008.safetensors",
"model.layers.12.reasoning_moe.experts.2.w2.weight": "model-00001-of-00008.safetensors",
"model.layers.12.content_moe.experts.2.w2.weight": "model-00001-of-00008.safetensors",
"model.layers.12.reasoning_moe.experts.2.w3.weight": "model-00001-of-00008.safetensors",
"model.layers.12.content_moe.experts.2.w3.weight": "model-00001-of-00008.safetensors",
"model.layers.12.reasoning_moe.experts.3.w1.weight": "model-00001-of-00008.safetensors",
"model.layers.12.content_moe.experts.3.w1.weight": "model-00001-of-00008.safetensors",
"model.layers.12.reasoning_moe.experts.3.w2.weight": "model-00001-of-00008.safetensors",
"model.layers.12.content_moe.experts.3.w2.weight": "model-00001-of-00008.safetensors",
"model.layers.12.reasoning_moe.experts.3.w3.weight": "model-00001-of-00008.safetensors",
"model.layers.12.content_moe.experts.3.w3.weight": "model-00001-of-00008.safetensors",
"model.layers.12.reasoning_moe.experts.4.w1.weight": "model-00001-of-00008.safetensors",
"model.layers.12.content_moe.experts.4.w1.weight": "model-00001-of-00008.safetensors",
"model.layers.12.reasoning_moe.experts.4.w2.weight": "model-00001-of-00008.safetensors",
"model.layers.12.content_moe.experts.4.w2.weight": "model-00001-of-00008.safetensors",
"model.layers.12.reasoning_moe.experts.4.w3.weight": "model-00001-of-00008.safetensors",
"model.layers.12.content_moe.experts.4.w3.weight": "model-00001-of-00008.safetensors",
"model.layers.12.reasoning_moe.experts.5.w1.weight": "model-00001-of-00008.safetensors",
"model.layers.12.content_moe.experts.5.w1.weight": "model-00001-of-00008.safetensors",
"model.layers.12.reasoning_moe.experts.5.w2.weight": "model-00001-of-00008.safetensors",
"model.layers.12.content_moe.experts.5.w2.weight": "model-00001-of-00008.safetensors",
"model.layers.12.reasoning_moe.experts.5.w3.weight": "model-00001-of-00008.safetensors",
"model.layers.12.content_moe.experts.5.w3.weight": "model-00001-of-00008.safetensors",
"model.layers.12.reasoning_moe.experts.6.w1.weight": "model-00001-of-00008.safetensors",
"model.layers.12.content_moe.experts.6.w1.weight": "model-00001-of-00008.safetensors",
"model.layers.12.reasoning_moe.experts.6.w2.weight": "model-00001-of-00008.safetensors",
"model.layers.12.content_moe.experts.6.w2.weight": "model-00001-of-00008.safetensors",
"model.layers.12.reasoning_moe.experts.6.w3.weight": "model-00001-of-00008.safetensors",
"model.layers.12.content_moe.experts.6.w3.weight": "model-00001-of-00008.safetensors",
"model.layers.12.reasoning_moe.experts.7.w1.weight": "model-00001-of-00008.safetensors",
"model.layers.12.content_moe.experts.7.w1.weight": "model-00001-of-00008.safetensors",
"model.layers.12.reasoning_moe.experts.7.w2.weight": "model-00001-of-00008.safetensors",
"model.layers.12.content_moe.experts.7.w2.weight": "model-00001-of-00008.safetensors",
"model.layers.12.reasoning_moe.experts.7.w3.weight": "model-00001-of-00008.safetensors",
"model.layers.12.content_moe.experts.7.w3.weight": "model-00001-of-00008.safetensors",
"model.layers.12.reasoning_moe.gate.weight": "model-00001-of-00008.safetensors",
"model.layers.12.content_moe.gate.weight": "model-00001-of-00008.safetensors",
"model.layers.12.input_reasoning_layernorm.bias": "model-00001-of-00008.safetensors",
"model.layers.12.input_content_layernorm.bias": "model-00001-of-00008.safetensors",
"model.layers.12.input_reasoning_layernorm.weight": "model-00001-of-00008.safetensors",
"model.layers.12.input_content_layernorm.weight": "model-00001-of-00008.safetensors",
"model.layers.12.post_attention_reasoning_layernorm.bias": "model-00001-of-00008.safetensors",
"model.layers.12.post_attention_content_layernorm.bias": "model-00001-of-00008.safetensors",
"model.layers.12.post_attention_reasoning_layernorm.weight": "model-00001-of-00008.safetensors",
"model.layers.12.post_attention_content_layernorm.weight": "model-00001-of-00008.safetensors",
"model.layers.12.reasoning_self_attn.k_proj.bias": "model-00001-of-00008.safetensors",
"model.layers.12.content_self_attn.k_proj.bias": "model-00001-of-00008.safetensors",
"model.layers.12.reasoning_self_attn.k_proj.weight": "model-00001-of-00008.safetensors",
"model.layers.12.content_self_attn.k_proj.weight": "model-00001-of-00008.safetensors",
"model.layers.12.reasoning_self_attn.o_proj.bias": "model-00001-of-00008.safetensors",
"model.layers.12.content_self_attn.o_proj.bias": "model-00001-of-00008.safetensors",
"model.layers.12.reasoning_self_attn.o_proj.weight": "model-00001-of-00008.safetensors",
"model.layers.12.content_self_attn.o_proj.weight": "model-00001-of-00008.safetensors",
"model.layers.12.reasoning_self_attn.q_proj.bias": "model-00001-of-00008.safetensors",
"model.layers.12.content_self_attn.q_proj.bias": "model-00001-of-00008.safetensors",
"model.layers.12.reasoning_self_attn.q_proj.weight": "model-00001-of-00008.safetensors",
"model.layers.12.content_self_attn.q_proj.weight": "model-00001-of-00008.safetensors",
"model.layers.12.reasoning_self_attn.v_proj.bias": "model-00001-of-00008.safetensors",
"model.layers.12.content_self_attn.v_proj.bias": "model-00001-of-00008.safetensors",
"model.layers.12.reasoning_self_attn.v_proj.weight": "model-00001-of-00008.safetensors",
"model.layers.12.content_self_attn.v_proj.weight": "model-00001-of-00008.safetensors",
"model.layers.13.reasoning_moe.experts.0.w1.weight": "model-00001-of-00008.safetensors",
"model.layers.13.content_moe.experts.0.w1.weight": "model-00001-of-00008.safetensors",
"model.layers.13.reasoning_moe.experts.0.w2.weight": "model-00001-of-00008.safetensors",
"model.layers.13.content_moe.experts.0.w2.weight": "model-00001-of-00008.safetensors",
"model.layers.13.reasoning_moe.experts.0.w3.weight": "model-00001-of-00008.safetensors",
"model.layers.13.content_moe.experts.0.w3.weight": "model-00001-of-00008.safetensors",
"model.layers.13.reasoning_moe.experts.1.w1.weight": "model-00001-of-00008.safetensors",
"model.layers.13.content_moe.experts.1.w1.weight": "model-00001-of-00008.safetensors",
"model.layers.13.reasoning_moe.experts.1.w2.weight": "model-00001-of-00008.safetensors",
"model.layers.13.content_moe.experts.1.w2.weight": "model-00001-of-00008.safetensors",
"model.layers.13.reasoning_moe.experts.1.w3.weight": "model-00001-of-00008.safetensors",
"model.layers.13.content_moe.experts.1.w3.weight": "model-00001-of-00008.safetensors",
"model.layers.13.reasoning_moe.experts.2.w1.weight": "model-00001-of-00008.safetensors",
"model.layers.13.content_moe.experts.2.w1.weight": "model-00001-of-00008.safetensors",
"model.layers.13.reasoning_moe.experts.2.w2.weight": "model-00001-of-00008.safetensors",
"model.layers.13.content_moe.experts.2.w2.weight": "model-00001-of-00008.safetensors",
"model.layers.13.reasoning_moe.experts.2.w3.weight": "model-00001-of-00008.safetensors",
"model.layers.13.content_moe.experts.2.w3.weight": "model-00001-of-00008.safetensors",
"model.layers.13.reasoning_moe.experts.3.w1.weight": "model-00001-of-00008.safetensors",
"model.layers.13.content_moe.experts.3.w1.weight": "model-00001-of-00008.safetensors",
"model.layers.13.reasoning_moe.experts.3.w2.weight": "model-00001-of-00008.safetensors",
"model.layers.13.content_moe.experts.3.w2.weight": "model-00001-of-00008.safetensors",
"model.layers.13.reasoning_moe.experts.3.w3.weight": "model-00001-of-00008.safetensors",
"model.layers.13.content_moe.experts.3.w3.weight": "model-00001-of-00008.safetensors",
"model.layers.13.reasoning_moe.experts.4.w1.weight": "model-00001-of-00008.safetensors",
"model.layers.13.content_moe.experts.4.w1.weight": "model-00001-of-00008.safetensors",
"model.layers.13.reasoning_moe.experts.4.w2.weight": "model-00001-of-00008.safetensors",
"model.layers.13.content_moe.experts.4.w2.weight": "model-00001-of-00008.safetensors",
"model.layers.13.reasoning_moe.experts.4.w3.weight": "model-00001-of-00008.safetensors",
"model.layers.13.content_moe.experts.4.w3.weight": "model-00001-of-00008.safetensors",
"model.layers.13.reasoning_moe.experts.5.w1.weight": "model-00001-of-00008.safetensors",
"model.layers.13.content_moe.experts.5.w1.weight": "model-00001-of-00008.safetensors",
"model.layers.13.reasoning_moe.experts.5.w2.weight": "model-00001-of-00008.safetensors",
"model.layers.13.content_moe.experts.5.w2.weight": "model-00001-of-00008.safetensors",
"model.layers.13.reasoning_moe.experts.5.w3.weight": "model-00001-of-00008.safetensors",
"model.layers.13.content_moe.experts.5.w3.weight": "model-00001-of-00008.safetensors",
"model.layers.13.reasoning_moe.experts.6.w1.weight": "model-00001-of-00008.safetensors",
"model.layers.13.content_moe.experts.6.w1.weight": "model-00001-of-00008.safetensors",
"model.layers.13.reasoning_moe.experts.6.w2.weight": "model-00001-of-00008.safetensors",
"model.layers.13.content_moe.experts.6.w2.weight": "model-00001-of-00008.safetensors",
"model.layers.13.reasoning_moe.experts.6.w3.weight": "model-00001-of-00008.safetensors",
"model.layers.13.content_moe.experts.6.w3.weight": "model-00001-of-00008.safetensors",
"model.layers.13.reasoning_moe.experts.7.w1.weight": "model-00001-of-00008.safetensors",
"model.layers.13.content_moe.experts.7.w1.weight": "model-00001-of-00008.safetensors",
"model.layers.13.reasoning_moe.experts.7.w2.weight": "model-00001-of-00008.safetensors",
"model.layers.13.content_moe.experts.7.w2.weight": "model-00001-of-00008.safetensors",
"model.layers.13.reasoning_moe.experts.7.w3.weight": "model-00001-of-00008.safetensors",
"model.layers.13.content_moe.experts.7.w3.weight": "model-00001-of-00008.safetensors",
"model.layers.13.reasoning_moe.gate.weight": "model-00001-of-00008.safetensors",
"model.layers.13.content_moe.gate.weight": "model-00001-of-00008.safetensors",
"model.layers.13.input_reasoning_layernorm.bias": "model-00001-of-00008.safetensors",
"model.layers.13.input_content_layernorm.bias": "model-00001-of-00008.safetensors",
"model.layers.13.input_reasoning_layernorm.weight": "model-00001-of-00008.safetensors",
"model.layers.13.input_content_layernorm.weight": "model-00001-of-00008.safetensors",
"model.layers.13.post_attention_reasoning_layernorm.bias": "model-00001-of-00008.safetensors",
"model.layers.13.post_attention_content_layernorm.bias": "model-00001-of-00008.safetensors",
"model.layers.13.post_attention_reasoning_layernorm.weight": "model-00001-of-00008.safetensors",
"model.layers.13.post_attention_content_layernorm.weight": "model-00001-of-00008.safetensors",
"model.layers.13.reasoning_self_attn.k_proj.bias": "model-00001-of-00008.safetensors",
"model.layers.13.content_self_attn.k_proj.bias": "model-00001-of-00008.safetensors",
"model.layers.13.reasoning_self_attn.k_proj.weight": "model-00001-of-00008.safetensors",
"model.layers.13.content_self_attn.k_proj.weight": "model-00001-of-00008.safetensors",
"model.layers.13.reasoning_self_attn.o_proj.bias": "model-00001-of-00008.safetensors",
"model.layers.13.content_self_attn.o_proj.bias": "model-00001-of-00008.safetensors",
"model.layers.13.reasoning_self_attn.o_proj.weight": "model-00001-of-00008.safetensors",
"model.layers.13.content_self_attn.o_proj.weight": "model-00001-of-00008.safetensors",
"model.layers.13.reasoning_self_attn.q_proj.bias": "model-00001-of-00008.safetensors",
"model.layers.13.content_self_attn.q_proj.bias": "model-00001-of-00008.safetensors",
"model.layers.13.reasoning_self_attn.q_proj.weight": "model-00001-of-00008.safetensors",
"model.layers.13.content_self_attn.q_proj.weight": "model-00001-of-00008.safetensors",
"model.layers.13.reasoning_self_attn.v_proj.bias": "model-00001-of-00008.safetensors",
"model.layers.13.content_self_attn.v_proj.bias": "model-00001-of-00008.safetensors",
"model.layers.13.reasoning_self_attn.v_proj.weight": "model-00001-of-00008.safetensors",
"model.layers.13.content_self_attn.v_proj.weight": "model-00001-of-00008.safetensors",
"model.layers.14.reasoning_moe.experts.0.w1.weight": "model-00001-of-00008.safetensors",
"model.layers.14.content_moe.experts.0.w1.weight": "model-00001-of-00008.safetensors",
"model.layers.14.reasoning_moe.experts.0.w2.weight": "model-00001-of-00008.safetensors",
"model.layers.14.content_moe.experts.0.w2.weight": "model-00001-of-00008.safetensors",
"model.layers.14.reasoning_moe.experts.0.w3.weight": "model-00001-of-00008.safetensors",
"model.layers.14.content_moe.experts.0.w3.weight": "model-00001-of-00008.safetensors",
"model.layers.14.reasoning_moe.experts.1.w1.weight": "model-00001-of-00008.safetensors",
"model.layers.14.content_moe.experts.1.w1.weight": "model-00001-of-00008.safetensors",
"model.layers.14.reasoning_moe.experts.1.w2.weight": "model-00001-of-00008.safetensors",
"model.layers.14.content_moe.experts.1.w2.weight": "model-00001-of-00008.safetensors",
"model.layers.14.reasoning_moe.experts.1.w3.weight": "model-00001-of-00008.safetensors",
"model.layers.14.content_moe.experts.1.w3.weight": "model-00001-of-00008.safetensors",
"model.layers.14.reasoning_moe.experts.2.w1.weight": "model-00001-of-00008.safetensors",
"model.layers.14.content_moe.experts.2.w1.weight": "model-00001-of-00008.safetensors",
"model.layers.14.reasoning_moe.experts.2.w2.weight": "model-00001-of-00008.safetensors",
"model.layers.14.content_moe.experts.2.w2.weight": "model-00001-of-00008.safetensors",
"model.layers.14.reasoning_moe.experts.2.w3.weight": "model-00001-of-00008.safetensors",
"model.layers.14.content_moe.experts.2.w3.weight": "model-00001-of-00008.safetensors",
"model.layers.14.reasoning_moe.experts.3.w1.weight": "model-00001-of-00008.safetensors",
"model.layers.14.content_moe.experts.3.w1.weight": "model-00001-of-00008.safetensors",
"model.layers.14.reasoning_moe.experts.3.w2.weight": "model-00001-of-00008.safetensors",
"model.layers.14.content_moe.experts.3.w2.weight": "model-00001-of-00008.safetensors",
"model.layers.14.reasoning_moe.experts.3.w3.weight": "model-00001-of-00008.safetensors",
"model.layers.14.content_moe.experts.3.w3.weight": "model-00001-of-00008.safetensors",
"model.layers.14.reasoning_moe.experts.4.w1.weight": "model-00001-of-00008.safetensors",
"model.layers.14.content_moe.experts.4.w1.weight": "model-00001-of-00008.safetensors",
"model.layers.14.reasoning_moe.experts.4.w2.weight": "model-00001-of-00008.safetensors",
"model.layers.14.content_moe.experts.4.w2.weight": "model-00001-of-00008.safetensors",
"model.layers.14.reasoning_moe.experts.4.w3.weight": "model-00001-of-00008.safetensors",
"model.layers.14.content_moe.experts.4.w3.weight": "model-00001-of-00008.safetensors",
"model.layers.14.reasoning_moe.experts.5.w1.weight": "model-00001-of-00008.safetensors",
"model.layers.14.content_moe.experts.5.w1.weight": "model-00001-of-00008.safetensors",
"model.layers.14.reasoning_moe.experts.5.w2.weight": "model-00001-of-00008.safetensors",
"model.layers.14.content_moe.experts.5.w2.weight": "model-00001-of-00008.safetensors",
"model.layers.14.reasoning_moe.experts.5.w3.weight": "model-00001-of-00008.safetensors",
"model.layers.14.content_moe.experts.5.w3.weight": "model-00001-of-00008.safetensors",
"model.layers.14.reasoning_moe.experts.6.w1.weight": "model-00001-of-00008.safetensors",
"model.layers.14.content_moe.experts.6.w1.weight": "model-00001-of-00008.safetensors",
"model.layers.14.reasoning_moe.experts.6.w2.weight": "model-00001-of-00008.safetensors",
"model.layers.14.content_moe.experts.6.w2.weight": "model-00001-of-00008.safetensors",
"model.layers.14.reasoning_moe.experts.6.w3.weight": "model-00001-of-00008.safetensors",
"model.layers.14.content_moe.experts.6.w3.weight": "model-00001-of-00008.safetensors",
"model.layers.14.reasoning_moe.experts.7.w1.weight": "model-00001-of-00008.safetensors",
"model.layers.14.content_moe.experts.7.w1.weight": "model-00001-of-00008.safetensors",
"model.layers.14.reasoning_moe.experts.7.w2.weight": "model-00001-of-00008.safetensors",
"model.layers.14.content_moe.experts.7.w2.weight": "model-00001-of-00008.safetensors",
"model.layers.14.reasoning_moe.experts.7.w3.weight": "model-00001-of-00008.safetensors",
"model.layers.14.content_moe.experts.7.w3.weight": "model-00001-of-00008.safetensors",
"model.layers.14.reasoning_moe.gate.weight": "model-00001-of-00008.safetensors",
"model.layers.14.content_moe.gate.weight": "model-00001-of-00008.safetensors",
"model.layers.14.input_reasoning_layernorm.bias": "model-00001-of-00008.safetensors",
"model.layers.14.input_content_layernorm.bias": "model-00001-of-00008.safetensors",
"model.layers.14.input_reasoning_layernorm.weight": "model-00001-of-00008.safetensors",
"model.layers.14.input_content_layernorm.weight": "model-00001-of-00008.safetensors",
"model.layers.14.post_attention_reasoning_layernorm.bias": "model-00001-of-00008.safetensors",
"model.layers.14.post_attention_content_layernorm.bias": "model-00001-of-00008.safetensors",
"model.layers.14.post_attention_reasoning_layernorm.weight": "model-00001-of-00008.safetensors",
"model.layers.14.post_attention_content_layernorm.weight": "model-00001-of-00008.safetensors",
"model.layers.14.reasoning_self_attn.k_proj.bias": "model-00001-of-00008.safetensors",
"model.layers.14.content_self_attn.k_proj.bias": "model-00001-of-00008.safetensors",
"model.layers.14.reasoning_self_attn.k_proj.weight": "model-00001-of-00008.safetensors",
"model.layers.14.content_self_attn.k_proj.weight": "model-00001-of-00008.safetensors",
"model.layers.14.reasoning_self_attn.o_proj.bias": "model-00001-of-00008.safetensors",
"model.layers.14.content_self_attn.o_proj.bias": "model-00001-of-00008.safetensors",
"model.layers.14.reasoning_self_attn.o_proj.weight": "model-00001-of-00008.safetensors",
"model.layers.14.content_self_attn.o_proj.weight": "model-00001-of-00008.safetensors",
"model.layers.14.reasoning_self_attn.q_proj.bias": "model-00001-of-00008.safetensors",
"model.layers.14.content_self_attn.q_proj.bias": "model-00001-of-00008.safetensors",
"model.layers.14.reasoning_self_attn.q_proj.weight": "model-00001-of-00008.safetensors",
"model.layers.14.content_self_attn.q_proj.weight": "model-00001-of-00008.safetensors",
"model.layers.14.reasoning_self_attn.v_proj.bias": "model-00001-of-00008.safetensors",
"model.layers.14.content_self_attn.v_proj.bias": "model-00001-of-00008.safetensors",
"model.layers.14.reasoning_self_attn.v_proj.weight": "model-00001-of-00008.safetensors",
"model.layers.14.content_self_attn.v_proj.weight": "model-00001-of-00008.safetensors",
"model.layers.15.reasoning_moe.experts.0.w1.weight": "model-00001-of-00008.safetensors",
"model.layers.15.content_moe.experts.0.w1.weight": "model-00001-of-00008.safetensors",
"model.layers.15.reasoning_moe.experts.0.w2.weight": "model-00001-of-00008.safetensors",
"model.layers.15.content_moe.experts.0.w2.weight": "model-00001-of-00008.safetensors",
"model.layers.15.reasoning_moe.experts.0.w3.weight": "model-00001-of-00008.safetensors",
"model.layers.15.content_moe.experts.0.w3.weight": "model-00001-of-00008.safetensors",
"model.layers.15.reasoning_moe.experts.1.w1.weight": "model-00001-of-00008.safetensors",
"model.layers.15.content_moe.experts.1.w1.weight": "model-00001-of-00008.safetensors",
"model.layers.15.reasoning_moe.experts.1.w2.weight": "model-00001-of-00008.safetensors",
"model.layers.15.content_moe.experts.1.w2.weight": "model-00001-of-00008.safetensors",
"model.layers.15.reasoning_moe.experts.1.w3.weight": "model-00001-of-00008.safetensors",
"model.layers.15.content_moe.experts.1.w3.weight": "model-00001-of-00008.safetensors",
"model.layers.15.reasoning_moe.experts.2.w1.weight": "model-00001-of-00008.safetensors",
"model.layers.15.content_moe.experts.2.w1.weight": "model-00001-of-00008.safetensors",
"model.layers.15.reasoning_moe.experts.2.w2.weight": "model-00001-of-00008.safetensors",
"model.layers.15.content_moe.experts.2.w2.weight": "model-00001-of-00008.safetensors",
"model.layers.15.reasoning_moe.experts.2.w3.weight": "model-00001-of-00008.safetensors",
"model.layers.15.content_moe.experts.2.w3.weight": "model-00001-of-00008.safetensors",
"model.layers.15.reasoning_moe.experts.3.w1.weight": "model-00001-of-00008.safetensors",
"model.layers.15.content_moe.experts.3.w1.weight": "model-00001-of-00008.safetensors",
"model.layers.15.reasoning_moe.experts.3.w2.weight": "model-00001-of-00008.safetensors",
"model.layers.15.content_moe.experts.3.w2.weight": "model-00001-of-00008.safetensors",
"model.layers.15.reasoning_moe.experts.3.w3.weight": "model-00001-of-00008.safetensors",
"model.layers.15.content_moe.experts.3.w3.weight": "model-00001-of-00008.safetensors",
"model.layers.15.reasoning_moe.experts.4.w1.weight": "model-00001-of-00008.safetensors",
"model.layers.15.content_moe.experts.4.w1.weight": "model-00001-of-00008.safetensors",
"model.layers.15.reasoning_moe.experts.4.w2.weight": "model-00001-of-00008.safetensors",
"model.layers.15.content_moe.experts.4.w2.weight": "model-00001-of-00008.safetensors",
"model.layers.15.reasoning_moe.experts.4.w3.weight": "model-00001-of-00008.safetensors",
"model.layers.15.content_moe.experts.4.w3.weight": "model-00001-of-00008.safetensors",
"model.layers.15.reasoning_moe.experts.5.w1.weight": "model-00001-of-00008.safetensors",
"model.layers.15.content_moe.experts.5.w1.weight": "model-00001-of-00008.safetensors",
"model.layers.15.reasoning_moe.experts.5.w2.weight": "model-00001-of-00008.safetensors",
"model.layers.15.content_moe.experts.5.w2.weight": "model-00001-of-00008.safetensors",
"model.layers.15.reasoning_moe.experts.5.w3.weight": "model-00001-of-00008.safetensors",
"model.layers.15.content_moe.experts.5.w3.weight": "model-00001-of-00008.safetensors",
"model.layers.15.reasoning_moe.experts.6.w1.weight": "model-00001-of-00008.safetensors",
"model.layers.15.content_moe.experts.6.w1.weight": "model-00001-of-00008.safetensors",
"model.layers.15.reasoning_moe.experts.6.w2.weight": "model-00001-of-00008.safetensors",
"model.layers.15.content_moe.experts.6.w2.weight": "model-00001-of-00008.safetensors",
"model.layers.15.reasoning_moe.experts.6.w3.weight": "model-00001-of-00008.safetensors",
"model.layers.15.content_moe.experts.6.w3.weight": "model-00001-of-00008.safetensors",
"model.layers.15.reasoning_moe.experts.7.w1.weight": "model-00001-of-00008.safetensors",
"model.layers.15.content_moe.experts.7.w1.weight": "model-00001-of-00008.safetensors",
"model.layers.15.reasoning_moe.experts.7.w2.weight": "model-00002-of-00008.safetensors",
"model.layers.15.content_moe.experts.7.w2.weight": "model-00002-of-00008.safetensors",
"model.layers.15.reasoning_moe.experts.7.w3.weight": "model-00002-of-00008.safetensors",
"model.layers.15.content_moe.experts.7.w3.weight": "model-00002-of-00008.safetensors",
"model.layers.15.reasoning_moe.gate.weight": "model-00002-of-00008.safetensors",
"model.layers.15.content_moe.gate.weight": "model-00002-of-00008.safetensors",
"model.layers.15.input_reasoning_layernorm.bias": "model-00002-of-00008.safetensors",
"model.layers.15.input_content_layernorm.bias": "model-00002-of-00008.safetensors",
"model.layers.15.input_reasoning_layernorm.weight": "model-00002-of-00008.safetensors",
"model.layers.15.input_content_layernorm.weight": "model-00002-of-00008.safetensors",
"model.layers.15.post_attention_reasoning_layernorm.bias": "model-00002-of-00008.safetensors",
"model.layers.15.post_attention_content_layernorm.bias": "model-00002-of-00008.safetensors",
"model.layers.15.post_attention_reasoning_layernorm.weight": "model-00002-of-00008.safetensors",
"model.layers.15.post_attention_content_layernorm.weight": "model-00002-of-00008.safetensors",
"model.layers.15.reasoning_self_attn.k_proj.bias": "model-00002-of-00008.safetensors",
"model.layers.15.content_self_attn.k_proj.bias": "model-00002-of-00008.safetensors",
"model.layers.15.reasoning_self_attn.k_proj.weight": "model-00002-of-00008.safetensors",
"model.layers.15.content_self_attn.k_proj.weight": "model-00002-of-00008.safetensors",
"model.layers.15.reasoning_self_attn.o_proj.bias": "model-00002-of-00008.safetensors",
"model.layers.15.content_self_attn.o_proj.bias": "model-00002-of-00008.safetensors",
"model.layers.15.reasoning_self_attn.o_proj.weight": "model-00002-of-00008.safetensors",
"model.layers.15.content_self_attn.o_proj.weight": "model-00002-of-00008.safetensors",
"model.layers.15.reasoning_self_attn.q_proj.bias": "model-00002-of-00008.safetensors",
"model.layers.15.content_self_attn.q_proj.bias": "model-00002-of-00008.safetensors",
"model.layers.15.reasoning_self_attn.q_proj.weight": "model-00002-of-00008.safetensors",
"model.layers.15.content_self_attn.q_proj.weight": "model-00002-of-00008.safetensors",
"model.layers.15.reasoning_self_attn.v_proj.bias": "model-00002-of-00008.safetensors",
"model.layers.15.content_self_attn.v_proj.bias": "model-00002-of-00008.safetensors",
"model.layers.15.reasoning_self_attn.v_proj.weight": "model-00002-of-00008.safetensors",
"model.layers.15.content_self_attn.v_proj.weight": "model-00002-of-00008.safetensors",
"model.layers.16.reasoning_moe.experts.0.w1.weight": "model-00002-of-00008.safetensors",
"model.layers.16.content_moe.experts.0.w1.weight": "model-00002-of-00008.safetensors",
"model.layers.16.reasoning_moe.experts.0.w2.weight": "model-00002-of-00008.safetensors",
"model.layers.16.content_moe.experts.0.w2.weight": "model-00002-of-00008.safetensors",
"model.layers.16.reasoning_moe.experts.0.w3.weight": "model-00002-of-00008.safetensors",
"model.layers.16.content_moe.experts.0.w3.weight": "model-00002-of-00008.safetensors",
"model.layers.16.reasoning_moe.experts.1.w1.weight": "model-00002-of-00008.safetensors",
"model.layers.16.content_moe.experts.1.w1.weight": "model-00002-of-00008.safetensors",
"model.layers.16.reasoning_moe.experts.1.w2.weight": "model-00002-of-00008.safetensors",
"model.layers.16.content_moe.experts.1.w2.weight": "model-00002-of-00008.safetensors",
"model.layers.16.reasoning_moe.experts.1.w3.weight": "model-00002-of-00008.safetensors",
"model.layers.16.content_moe.experts.1.w3.weight": "model-00002-of-00008.safetensors",
"model.layers.16.reasoning_moe.experts.2.w1.weight": "model-00002-of-00008.safetensors",
"model.layers.16.content_moe.experts.2.w1.weight": "model-00002-of-00008.safetensors",
"model.layers.16.reasoning_moe.experts.2.w2.weight": "model-00002-of-00008.safetensors",
"model.layers.16.content_moe.experts.2.w2.weight": "model-00002-of-00008.safetensors",
"model.layers.16.reasoning_moe.experts.2.w3.weight": "model-00002-of-00008.safetensors",
"model.layers.16.content_moe.experts.2.w3.weight": "model-00002-of-00008.safetensors",
"model.layers.16.reasoning_moe.experts.3.w1.weight": "model-00002-of-00008.safetensors",
"model.layers.16.content_moe.experts.3.w1.weight": "model-00002-of-00008.safetensors",
"model.layers.16.reasoning_moe.experts.3.w2.weight": "model-00002-of-00008.safetensors",
"model.layers.16.content_moe.experts.3.w2.weight": "model-00002-of-00008.safetensors",
"model.layers.16.reasoning_moe.experts.3.w3.weight": "model-00002-of-00008.safetensors",
"model.layers.16.content_moe.experts.3.w3.weight": "model-00002-of-00008.safetensors",
"model.layers.16.reasoning_moe.experts.4.w1.weight": "model-00002-of-00008.safetensors",
"model.layers.16.content_moe.experts.4.w1.weight": "model-00002-of-00008.safetensors",
"model.layers.16.reasoning_moe.experts.4.w2.weight": "model-00002-of-00008.safetensors",
"model.layers.16.content_moe.experts.4.w2.weight": "model-00002-of-00008.safetensors",
"model.layers.16.reasoning_moe.experts.4.w3.weight": "model-00002-of-00008.safetensors",
"model.layers.16.content_moe.experts.4.w3.weight": "model-00002-of-00008.safetensors",
"model.layers.16.reasoning_moe.experts.5.w1.weight": "model-00002-of-00008.safetensors",
"model.layers.16.content_moe.experts.5.w1.weight": "model-00002-of-00008.safetensors",
"model.layers.16.reasoning_moe.experts.5.w2.weight": "model-00002-of-00008.safetensors",
"model.layers.16.content_moe.experts.5.w2.weight": "model-00002-of-00008.safetensors",
"model.layers.16.reasoning_moe.experts.5.w3.weight": "model-00002-of-00008.safetensors",
"model.layers.16.content_moe.experts.5.w3.weight": "model-00002-of-00008.safetensors",
"model.layers.16.reasoning_moe.experts.6.w1.weight": "model-00002-of-00008.safetensors",
"model.layers.16.content_moe.experts.6.w1.weight": "model-00002-of-00008.safetensors",
"model.layers.16.reasoning_moe.experts.6.w2.weight": "model-00002-of-00008.safetensors",
"model.layers.16.content_moe.experts.6.w2.weight": "model-00002-of-00008.safetensors",
"model.layers.16.reasoning_moe.experts.6.w3.weight": "model-00002-of-00008.safetensors",
"model.layers.16.content_moe.experts.6.w3.weight": "model-00002-of-00008.safetensors",
"model.layers.16.reasoning_moe.experts.7.w1.weight": "model-00002-of-00008.safetensors",
"model.layers.16.content_moe.experts.7.w1.weight": "model-00002-of-00008.safetensors",
"model.layers.16.reasoning_moe.experts.7.w2.weight": "model-00002-of-00008.safetensors",
"model.layers.16.content_moe.experts.7.w2.weight": "model-00002-of-00008.safetensors",
"model.layers.16.reasoning_moe.experts.7.w3.weight": "model-00002-of-00008.safetensors",
"model.layers.16.content_moe.experts.7.w3.weight": "model-00002-of-00008.safetensors",
"model.layers.16.reasoning_moe.gate.weight": "model-00002-of-00008.safetensors",
"model.layers.16.content_moe.gate.weight": "model-00002-of-00008.safetensors",
"model.layers.16.input_reasoning_layernorm.bias": "model-00002-of-00008.safetensors",
"model.layers.16.input_content_layernorm.bias": "model-00002-of-00008.safetensors",
"model.layers.16.input_reasoning_layernorm.weight": "model-00002-of-00008.safetensors",
"model.layers.16.input_content_layernorm.weight": "model-00002-of-00008.safetensors",
"model.layers.16.post_attention_reasoning_layernorm.bias": "model-00002-of-00008.safetensors",
"model.layers.16.post_attention_content_layernorm.bias": "model-00002-of-00008.safetensors",
"model.layers.16.post_attention_reasoning_layernorm.weight": "model-00002-of-00008.safetensors",
"model.layers.16.post_attention_content_layernorm.weight": "model-00002-of-00008.safetensors",
"model.layers.16.reasoning_self_attn.k_proj.bias": "model-00002-of-00008.safetensors",
"model.layers.16.content_self_attn.k_proj.bias": "model-00002-of-00008.safetensors",
"model.layers.16.reasoning_self_attn.k_proj.weight": "model-00002-of-00008.safetensors",
"model.layers.16.content_self_attn.k_proj.weight": "model-00002-of-00008.safetensors",
"model.layers.16.reasoning_self_attn.o_proj.bias": "model-00002-of-00008.safetensors",
"model.layers.16.content_self_attn.o_proj.bias": "model-00002-of-00008.safetensors",
"model.layers.16.reasoning_self_attn.o_proj.weight": "model-00002-of-00008.safetensors",
"model.layers.16.content_self_attn.o_proj.weight": "model-00002-of-00008.safetensors",
"model.layers.16.reasoning_self_attn.q_proj.bias": "model-00002-of-00008.safetensors",
"model.layers.16.content_self_attn.q_proj.bias": "model-00002-of-00008.safetensors",
"model.layers.16.reasoning_self_attn.q_proj.weight": "model-00002-of-00008.safetensors",
"model.layers.16.content_self_attn.q_proj.weight": "model-00002-of-00008.safetensors",
"model.layers.16.reasoning_self_attn.v_proj.bias": "model-00002-of-00008.safetensors",
"model.layers.16.content_self_attn.v_proj.bias": "model-00002-of-00008.safetensors",
"model.layers.16.reasoning_self_attn.v_proj.weight": "model-00002-of-00008.safetensors",
"model.layers.16.content_self_attn.v_proj.weight": "model-00002-of-00008.safetensors",
"model.layers.17.reasoning_moe.experts.0.w1.weight": "model-00002-of-00008.safetensors",
"model.layers.17.content_moe.experts.0.w1.weight": "model-00002-of-00008.safetensors",
"model.layers.17.reasoning_moe.experts.0.w2.weight": "model-00002-of-00008.safetensors",
"model.layers.17.content_moe.experts.0.w2.weight": "model-00002-of-00008.safetensors",
"model.layers.17.reasoning_moe.experts.0.w3.weight": "model-00002-of-00008.safetensors",
"model.layers.17.content_moe.experts.0.w3.weight": "model-00002-of-00008.safetensors",
"model.layers.17.reasoning_moe.experts.1.w1.weight": "model-00002-of-00008.safetensors",
"model.layers.17.content_moe.experts.1.w1.weight": "model-00002-of-00008.safetensors",
"model.layers.17.reasoning_moe.experts.1.w2.weight": "model-00002-of-00008.safetensors",
"model.layers.17.content_moe.experts.1.w2.weight": "model-00002-of-00008.safetensors",
"model.layers.17.reasoning_moe.experts.1.w3.weight": "model-00002-of-00008.safetensors",
"model.layers.17.content_moe.experts.1.w3.weight": "model-00002-of-00008.safetensors",
"model.layers.17.reasoning_moe.experts.2.w1.weight": "model-00002-of-00008.safetensors",
"model.layers.17.content_moe.experts.2.w1.weight": "model-00002-of-00008.safetensors",
"model.layers.17.reasoning_moe.experts.2.w2.weight": "model-00002-of-00008.safetensors",
"model.layers.17.content_moe.experts.2.w2.weight": "model-00002-of-00008.safetensors",
"model.layers.17.reasoning_moe.experts.2.w3.weight": "model-00002-of-00008.safetensors",
"model.layers.17.content_moe.experts.2.w3.weight": "model-00002-of-00008.safetensors",
"model.layers.17.reasoning_moe.experts.3.w1.weight": "model-00002-of-00008.safetensors",
"model.layers.17.content_moe.experts.3.w1.weight": "model-00002-of-00008.safetensors",
"model.layers.17.reasoning_moe.experts.3.w2.weight": "model-00002-of-00008.safetensors",
"model.layers.17.content_moe.experts.3.w2.weight": "model-00002-of-00008.safetensors",
"model.layers.17.reasoning_moe.experts.3.w3.weight": "model-00002-of-00008.safetensors",
"model.layers.17.content_moe.experts.3.w3.weight": "model-00002-of-00008.safetensors",
"model.layers.17.reasoning_moe.experts.4.w1.weight": "model-00002-of-00008.safetensors",
"model.layers.17.content_moe.experts.4.w1.weight": "model-00002-of-00008.safetensors",
"model.layers.17.reasoning_moe.experts.4.w2.weight": "model-00002-of-00008.safetensors",
"model.layers.17.content_moe.experts.4.w2.weight": "model-00002-of-00008.safetensors",
"model.layers.17.reasoning_moe.experts.4.w3.weight": "model-00002-of-00008.safetensors",
"model.layers.17.content_moe.experts.4.w3.weight": "model-00002-of-00008.safetensors",
"model.layers.17.reasoning_moe.experts.5.w1.weight": "model-00002-of-00008.safetensors",
"model.layers.17.content_moe.experts.5.w1.weight": "model-00002-of-00008.safetensors",
"model.layers.17.reasoning_moe.experts.5.w2.weight": "model-00002-of-00008.safetensors",
"model.layers.17.content_moe.experts.5.w2.weight": "model-00002-of-00008.safetensors",
"model.layers.17.reasoning_moe.experts.5.w3.weight": "model-00002-of-00008.safetensors",
"model.layers.17.content_moe.experts.5.w3.weight": "model-00002-of-00008.safetensors",
"model.layers.17.reasoning_moe.experts.6.w1.weight": "model-00002-of-00008.safetensors",
"model.layers.17.content_moe.experts.6.w1.weight": "model-00002-of-00008.safetensors",
"model.layers.17.reasoning_moe.experts.6.w2.weight": "model-00002-of-00008.safetensors",
"model.layers.17.content_moe.experts.6.w2.weight": "model-00002-of-00008.safetensors",
"model.layers.17.reasoning_moe.experts.6.w3.weight": "model-00002-of-00008.safetensors",
"model.layers.17.content_moe.experts.6.w3.weight": "model-00002-of-00008.safetensors",
"model.layers.17.reasoning_moe.experts.7.w1.weight": "model-00002-of-00008.safetensors",
"model.layers.17.content_moe.experts.7.w1.weight": "model-00002-of-00008.safetensors",
"model.layers.17.reasoning_moe.experts.7.w2.weight": "model-00002-of-00008.safetensors",
"model.layers.17.content_moe.experts.7.w2.weight": "model-00002-of-00008.safetensors",
"model.layers.17.reasoning_moe.experts.7.w3.weight": "model-00002-of-00008.safetensors",
"model.layers.17.content_moe.experts.7.w3.weight": "model-00002-of-00008.safetensors",
"model.layers.17.reasoning_moe.gate.weight": "model-00002-of-00008.safetensors",
"model.layers.17.content_moe.gate.weight": "model-00002-of-00008.safetensors",
"model.layers.17.input_reasoning_layernorm.bias": "model-00002-of-00008.safetensors",
"model.layers.17.input_content_layernorm.bias": "model-00002-of-00008.safetensors",
"model.layers.17.input_reasoning_layernorm.weight": "model-00002-of-00008.safetensors",
"model.layers.17.input_content_layernorm.weight": "model-00002-of-00008.safetensors",
"model.layers.17.post_attention_reasoning_layernorm.bias": "model-00002-of-00008.safetensors",
"model.layers.17.post_attention_content_layernorm.bias": "model-00002-of-00008.safetensors",
"model.layers.17.post_attention_reasoning_layernorm.weight": "model-00002-of-00008.safetensors",
"model.layers.17.post_attention_content_layernorm.weight": "model-00002-of-00008.safetensors",
"model.layers.17.reasoning_self_attn.k_proj.bias": "model-00002-of-00008.safetensors",
"model.layers.17.content_self_attn.k_proj.bias": "model-00002-of-00008.safetensors",
"model.layers.17.reasoning_self_attn.k_proj.weight": "model-00002-of-00008.safetensors",
"model.layers.17.content_self_attn.k_proj.weight": "model-00002-of-00008.safetensors",
"model.layers.17.reasoning_self_attn.o_proj.bias": "model-00002-of-00008.safetensors",
"model.layers.17.content_self_attn.o_proj.bias": "model-00002-of-00008.safetensors",
"model.layers.17.reasoning_self_attn.o_proj.weight": "model-00002-of-00008.safetensors",
"model.layers.17.content_self_attn.o_proj.weight": "model-00002-of-00008.safetensors",
"model.layers.17.reasoning_self_attn.q_proj.bias": "model-00002-of-00008.safetensors",
"model.layers.17.content_self_attn.q_proj.bias": "model-00002-of-00008.safetensors",
"model.layers.17.reasoning_self_attn.q_proj.weight": "model-00002-of-00008.safetensors",
"model.layers.17.content_self_attn.q_proj.weight": "model-00002-of-00008.safetensors",
"model.layers.17.reasoning_self_attn.v_proj.bias": "model-00002-of-00008.safetensors",
"model.layers.17.content_self_attn.v_proj.bias": "model-00002-of-00008.safetensors",
"model.layers.17.reasoning_self_attn.v_proj.weight": "model-00002-of-00008.safetensors",
"model.layers.17.content_self_attn.v_proj.weight": "model-00002-of-00008.safetensors",
"model.layers.18.reasoning_moe.experts.0.w1.weight": "model-00002-of-00008.safetensors",
"model.layers.18.content_moe.experts.0.w1.weight": "model-00002-of-00008.safetensors",
"model.layers.18.reasoning_moe.experts.0.w2.weight": "model-00002-of-00008.safetensors",
"model.layers.18.content_moe.experts.0.w2.weight": "model-00002-of-00008.safetensors",
"model.layers.18.reasoning_moe.experts.0.w3.weight": "model-00002-of-00008.safetensors",
"model.layers.18.content_moe.experts.0.w3.weight": "model-00002-of-00008.safetensors",
"model.layers.18.reasoning_moe.experts.1.w1.weight": "model-00002-of-00008.safetensors",
"model.layers.18.content_moe.experts.1.w1.weight": "model-00002-of-00008.safetensors",
"model.layers.18.reasoning_moe.experts.1.w2.weight": "model-00002-of-00008.safetensors",
"model.layers.18.content_moe.experts.1.w2.weight": "model-00002-of-00008.safetensors",
"model.layers.18.reasoning_moe.experts.1.w3.weight": "model-00002-of-00008.safetensors",
"model.layers.18.content_moe.experts.1.w3.weight": "model-00002-of-00008.safetensors",
"model.layers.18.reasoning_moe.experts.2.w1.weight": "model-00002-of-00008.safetensors",
"model.layers.18.content_moe.experts.2.w1.weight": "model-00002-of-00008.safetensors",
"model.layers.18.reasoning_moe.experts.2.w2.weight": "model-00002-of-00008.safetensors",
"model.layers.18.content_moe.experts.2.w2.weight": "model-00002-of-00008.safetensors",
"model.layers.18.reasoning_moe.experts.2.w3.weight": "model-00002-of-00008.safetensors",
"model.layers.18.content_moe.experts.2.w3.weight": "model-00002-of-00008.safetensors",
"model.layers.18.reasoning_moe.experts.3.w1.weight": "model-00002-of-00008.safetensors",
"model.layers.18.content_moe.experts.3.w1.weight": "model-00002-of-00008.safetensors",
"model.layers.18.reasoning_moe.experts.3.w2.weight": "model-00002-of-00008.safetensors",
"model.layers.18.content_moe.experts.3.w2.weight": "model-00002-of-00008.safetensors",
"model.layers.18.reasoning_moe.experts.3.w3.weight": "model-00002-of-00008.safetensors",
"model.layers.18.content_moe.experts.3.w3.weight": "model-00002-of-00008.safetensors",
"model.layers.18.reasoning_moe.experts.4.w1.weight": "model-00002-of-00008.safetensors",
"model.layers.18.content_moe.experts.4.w1.weight": "model-00002-of-00008.safetensors",
"model.layers.18.reasoning_moe.experts.4.w2.weight": "model-00002-of-00008.safetensors",
"model.layers.18.content_moe.experts.4.w2.weight": "model-00002-of-00008.safetensors",
"model.layers.18.reasoning_moe.experts.4.w3.weight": "model-00002-of-00008.safetensors",
"model.layers.18.content_moe.experts.4.w3.weight": "model-00002-of-00008.safetensors",
"model.layers.18.reasoning_moe.experts.5.w1.weight": "model-00002-of-00008.safetensors",
"model.layers.18.content_moe.experts.5.w1.weight": "model-00002-of-00008.safetensors",
"model.layers.18.reasoning_moe.experts.5.w2.weight": "model-00002-of-00008.safetensors",
"model.layers.18.content_moe.experts.5.w2.weight": "model-00002-of-00008.safetensors",
"model.layers.18.reasoning_moe.experts.5.w3.weight": "model-00002-of-00008.safetensors",
"model.layers.18.content_moe.experts.5.w3.weight": "model-00002-of-00008.safetensors",
"model.layers.18.reasoning_moe.experts.6.w1.weight": "model-00002-of-00008.safetensors",
"model.layers.18.content_moe.experts.6.w1.weight": "model-00002-of-00008.safetensors",
"model.layers.18.reasoning_moe.experts.6.w2.weight": "model-00002-of-00008.safetensors",
"model.layers.18.content_moe.experts.6.w2.weight": "model-00002-of-00008.safetensors",
"model.layers.18.reasoning_moe.experts.6.w3.weight": "model-00002-of-00008.safetensors",
"model.layers.18.content_moe.experts.6.w3.weight": "model-00002-of-00008.safetensors",
"model.layers.18.reasoning_moe.experts.7.w1.weight": "model-00002-of-00008.safetensors",
"model.layers.18.content_moe.experts.7.w1.weight": "model-00002-of-00008.safetensors",
"model.layers.18.reasoning_moe.experts.7.w2.weight": "model-00002-of-00008.safetensors",
"model.layers.18.content_moe.experts.7.w2.weight": "model-00002-of-00008.safetensors",
"model.layers.18.reasoning_moe.experts.7.w3.weight": "model-00002-of-00008.safetensors",
"model.layers.18.content_moe.experts.7.w3.weight": "model-00002-of-00008.safetensors",
"model.layers.18.reasoning_moe.gate.weight": "model-00002-of-00008.safetensors",
"model.layers.18.content_moe.gate.weight": "model-00002-of-00008.safetensors",
"model.layers.18.input_reasoning_layernorm.bias": "model-00002-of-00008.safetensors",
"model.layers.18.input_content_layernorm.bias": "model-00002-of-00008.safetensors",
"model.layers.18.input_reasoning_layernorm.weight": "model-00002-of-00008.safetensors",
"model.layers.18.input_content_layernorm.weight": "model-00002-of-00008.safetensors",
"model.layers.18.post_attention_reasoning_layernorm.bias": "model-00002-of-00008.safetensors",
"model.layers.18.post_attention_content_layernorm.bias": "model-00002-of-00008.safetensors",
"model.layers.18.post_attention_reasoning_layernorm.weight": "model-00002-of-00008.safetensors",
"model.layers.18.post_attention_content_layernorm.weight": "model-00002-of-00008.safetensors",
"model.layers.18.reasoning_self_attn.k_proj.bias": "model-00002-of-00008.safetensors",
"model.layers.18.content_self_attn.k_proj.bias": "model-00002-of-00008.safetensors",
"model.layers.18.reasoning_self_attn.k_proj.weight": "model-00002-of-00008.safetensors",
"model.layers.18.content_self_attn.k_proj.weight": "model-00002-of-00008.safetensors",
"model.layers.18.reasoning_self_attn.o_proj.bias": "model-00002-of-00008.safetensors",
"model.layers.18.content_self_attn.o_proj.bias": "model-00002-of-00008.safetensors",
"model.layers.18.reasoning_self_attn.o_proj.weight": "model-00002-of-00008.safetensors",
"model.layers.18.content_self_attn.o_proj.weight": "model-00002-of-00008.safetensors",
"model.layers.18.reasoning_self_attn.q_proj.bias": "model-00002-of-00008.safetensors",
"model.layers.18.content_self_attn.q_proj.bias": "model-00002-of-00008.safetensors",
"model.layers.18.reasoning_self_attn.q_proj.weight": "model-00002-of-00008.safetensors",
"model.layers.18.content_self_attn.q_proj.weight": "model-00002-of-00008.safetensors",
"model.layers.18.reasoning_self_attn.v_proj.bias": "model-00002-of-00008.safetensors",
"model.layers.18.content_self_attn.v_proj.bias": "model-00002-of-00008.safetensors",
"model.layers.18.reasoning_self_attn.v_proj.weight": "model-00002-of-00008.safetensors",
"model.layers.18.content_self_attn.v_proj.weight": "model-00002-of-00008.safetensors",
"model.layers.19.reasoning_moe.experts.0.w1.weight": "model-00002-of-00008.safetensors",
"model.layers.19.content_moe.experts.0.w1.weight": "model-00002-of-00008.safetensors",
"model.layers.19.reasoning_moe.experts.0.w2.weight": "model-00002-of-00008.safetensors",
"model.layers.19.content_moe.experts.0.w2.weight": "model-00002-of-00008.safetensors",
"model.layers.19.reasoning_moe.experts.0.w3.weight": "model-00002-of-00008.safetensors",
"model.layers.19.content_moe.experts.0.w3.weight": "model-00002-of-00008.safetensors",
"model.layers.19.reasoning_moe.experts.1.w1.weight": "model-00002-of-00008.safetensors",
"model.layers.19.content_moe.experts.1.w1.weight": "model-00002-of-00008.safetensors",
"model.layers.19.reasoning_moe.experts.1.w2.weight": "model-00002-of-00008.safetensors",
"model.layers.19.content_moe.experts.1.w2.weight": "model-00002-of-00008.safetensors",
"model.layers.19.reasoning_moe.experts.1.w3.weight": "model-00002-of-00008.safetensors",
"model.layers.19.content_moe.experts.1.w3.weight": "model-00002-of-00008.safetensors",
"model.layers.19.reasoning_moe.experts.2.w1.weight": "model-00002-of-00008.safetensors",
"model.layers.19.content_moe.experts.2.w1.weight": "model-00002-of-00008.safetensors",
"model.layers.19.reasoning_moe.experts.2.w2.weight": "model-00002-of-00008.safetensors",
"model.layers.19.content_moe.experts.2.w2.weight": "model-00002-of-00008.safetensors",
"model.layers.19.reasoning_moe.experts.2.w3.weight": "model-00002-of-00008.safetensors",
"model.layers.19.content_moe.experts.2.w3.weight": "model-00002-of-00008.safetensors",
"model.layers.19.reasoning_moe.experts.3.w1.weight": "model-00002-of-00008.safetensors",
"model.layers.19.content_moe.experts.3.w1.weight": "model-00002-of-00008.safetensors",
"model.layers.19.reasoning_moe.experts.3.w2.weight": "model-00002-of-00008.safetensors",
"model.layers.19.content_moe.experts.3.w2.weight": "model-00002-of-00008.safetensors",
"model.layers.19.reasoning_moe.experts.3.w3.weight": "model-00002-of-00008.safetensors",
"model.layers.19.content_moe.experts.3.w3.weight": "model-00002-of-00008.safetensors",
"model.layers.19.reasoning_moe.experts.4.w1.weight": "model-00002-of-00008.safetensors",
"model.layers.19.content_moe.experts.4.w1.weight": "model-00002-of-00008.safetensors",
"model.layers.19.reasoning_moe.experts.4.w2.weight": "model-00002-of-00008.safetensors",
"model.layers.19.content_moe.experts.4.w2.weight": "model-00002-of-00008.safetensors",
"model.layers.19.reasoning_moe.experts.4.w3.weight": "model-00002-of-00008.safetensors",
"model.layers.19.content_moe.experts.4.w3.weight": "model-00002-of-00008.safetensors",
"model.layers.19.reasoning_moe.experts.5.w1.weight": "model-00002-of-00008.safetensors",
"model.layers.19.content_moe.experts.5.w1.weight": "model-00002-of-00008.safetensors",
"model.layers.19.reasoning_moe.experts.5.w2.weight": "model-00002-of-00008.safetensors",
"model.layers.19.content_moe.experts.5.w2.weight": "model-00002-of-00008.safetensors",
"model.layers.19.reasoning_moe.experts.5.w3.weight": "model-00002-of-00008.safetensors",
"model.layers.19.content_moe.experts.5.w3.weight": "model-00002-of-00008.safetensors",
"model.layers.19.reasoning_moe.experts.6.w1.weight": "model-00002-of-00008.safetensors",
"model.layers.19.content_moe.experts.6.w1.weight": "model-00002-of-00008.safetensors",
"model.layers.19.reasoning_moe.experts.6.w2.weight": "model-00002-of-00008.safetensors",
"model.layers.19.content_moe.experts.6.w2.weight": "model-00002-of-00008.safetensors",
"model.layers.19.reasoning_moe.experts.6.w3.weight": "model-00002-of-00008.safetensors",
"model.layers.19.content_moe.experts.6.w3.weight": "model-00002-of-00008.safetensors",
"model.layers.19.reasoning_moe.experts.7.w1.weight": "model-00002-of-00008.safetensors",
"model.layers.19.content_moe.experts.7.w1.weight": "model-00002-of-00008.safetensors",
"model.layers.19.reasoning_moe.experts.7.w2.weight": "model-00002-of-00008.safetensors",
"model.layers.19.content_moe.experts.7.w2.weight": "model-00002-of-00008.safetensors",
"model.layers.19.reasoning_moe.experts.7.w3.weight": "model-00002-of-00008.safetensors",
"model.layers.19.content_moe.experts.7.w3.weight": "model-00002-of-00008.safetensors",
"model.layers.19.reasoning_moe.gate.weight": "model-00002-of-00008.safetensors",
"model.layers.19.content_moe.gate.weight": "model-00002-of-00008.safetensors",
"model.layers.19.input_reasoning_layernorm.bias": "model-00002-of-00008.safetensors",
"model.layers.19.input_content_layernorm.bias": "model-00002-of-00008.safetensors",
"model.layers.19.input_reasoning_layernorm.weight": "model-00002-of-00008.safetensors",
"model.layers.19.input_content_layernorm.weight": "model-00002-of-00008.safetensors",
"model.layers.19.post_attention_reasoning_layernorm.bias": "model-00002-of-00008.safetensors",
"model.layers.19.post_attention_content_layernorm.bias": "model-00002-of-00008.safetensors",
"model.layers.19.post_attention_reasoning_layernorm.weight": "model-00002-of-00008.safetensors",
"model.layers.19.post_attention_content_layernorm.weight": "model-00002-of-00008.safetensors",
"model.layers.19.reasoning_self_attn.k_proj.bias": "model-00002-of-00008.safetensors",
"model.layers.19.content_self_attn.k_proj.bias": "model-00002-of-00008.safetensors",
"model.layers.19.reasoning_self_attn.k_proj.weight": "model-00002-of-00008.safetensors",
"model.layers.19.content_self_attn.k_proj.weight": "model-00002-of-00008.safetensors",
"model.layers.19.reasoning_self_attn.o_proj.bias": "model-00002-of-00008.safetensors",
"model.layers.19.content_self_attn.o_proj.bias": "model-00002-of-00008.safetensors",
"model.layers.19.reasoning_self_attn.o_proj.weight": "model-00002-of-00008.safetensors",
"model.layers.19.content_self_attn.o_proj.weight": "model-00002-of-00008.safetensors",
"model.layers.19.reasoning_self_attn.q_proj.bias": "model-00002-of-00008.safetensors",
"model.layers.19.content_self_attn.q_proj.bias": "model-00002-of-00008.safetensors",
"model.layers.19.reasoning_self_attn.q_proj.weight": "model-00003-of-00008.safetensors",
"model.layers.19.content_self_attn.q_proj.weight": "model-00003-of-00008.safetensors",
"model.layers.19.reasoning_self_attn.v_proj.bias": "model-00003-of-00008.safetensors",
"model.layers.19.content_self_attn.v_proj.bias": "model-00003-of-00008.safetensors",
"model.layers.19.reasoning_self_attn.v_proj.weight": "model-00003-of-00008.safetensors",
"model.layers.19.content_self_attn.v_proj.weight": "model-00003-of-00008.safetensors",
"model.layers.2.reasoning_moe.experts.0.w1.weight": "model-00003-of-00008.safetensors",
"model.layers.2.content_moe.experts.0.w1.weight": "model-00003-of-00008.safetensors",
"model.layers.2.reasoning_moe.experts.0.w2.weight": "model-00003-of-00008.safetensors",
"model.layers.2.content_moe.experts.0.w2.weight": "model-00003-of-00008.safetensors",
"model.layers.2.reasoning_moe.experts.0.w3.weight": "model-00003-of-00008.safetensors",
"model.layers.2.content_moe.experts.0.w3.weight": "model-00003-of-00008.safetensors",
"model.layers.2.reasoning_moe.experts.1.w1.weight": "model-00003-of-00008.safetensors",
"model.layers.2.content_moe.experts.1.w1.weight": "model-00003-of-00008.safetensors",
"model.layers.2.reasoning_moe.experts.1.w2.weight": "model-00003-of-00008.safetensors",
"model.layers.2.content_moe.experts.1.w2.weight": "model-00003-of-00008.safetensors",
"model.layers.2.reasoning_moe.experts.1.w3.weight": "model-00003-of-00008.safetensors",
"model.layers.2.content_moe.experts.1.w3.weight": "model-00003-of-00008.safetensors",
"model.layers.2.reasoning_moe.experts.2.w1.weight": "model-00003-of-00008.safetensors",
"model.layers.2.content_moe.experts.2.w1.weight": "model-00003-of-00008.safetensors",
"model.layers.2.reasoning_moe.experts.2.w2.weight": "model-00003-of-00008.safetensors",
"model.layers.2.content_moe.experts.2.w2.weight": "model-00003-of-00008.safetensors",
"model.layers.2.reasoning_moe.experts.2.w3.weight": "model-00003-of-00008.safetensors",
"model.layers.2.content_moe.experts.2.w3.weight": "model-00003-of-00008.safetensors",
"model.layers.2.reasoning_moe.experts.3.w1.weight": "model-00003-of-00008.safetensors",
"model.layers.2.content_moe.experts.3.w1.weight": "model-00003-of-00008.safetensors",
"model.layers.2.reasoning_moe.experts.3.w2.weight": "model-00003-of-00008.safetensors",
"model.layers.2.content_moe.experts.3.w2.weight": "model-00003-of-00008.safetensors",
"model.layers.2.reasoning_moe.experts.3.w3.weight": "model-00003-of-00008.safetensors",
"model.layers.2.content_moe.experts.3.w3.weight": "model-00003-of-00008.safetensors",
"model.layers.2.reasoning_moe.experts.4.w1.weight": "model-00003-of-00008.safetensors",
"model.layers.2.content_moe.experts.4.w1.weight": "model-00003-of-00008.safetensors",
"model.layers.2.reasoning_moe.experts.4.w2.weight": "model-00003-of-00008.safetensors",
"model.layers.2.content_moe.experts.4.w2.weight": "model-00003-of-00008.safetensors",
"model.layers.2.reasoning_moe.experts.4.w3.weight": "model-00003-of-00008.safetensors",
"model.layers.2.content_moe.experts.4.w3.weight": "model-00003-of-00008.safetensors",
"model.layers.2.reasoning_moe.experts.5.w1.weight": "model-00003-of-00008.safetensors",
"model.layers.2.content_moe.experts.5.w1.weight": "model-00003-of-00008.safetensors",
"model.layers.2.reasoning_moe.experts.5.w2.weight": "model-00003-of-00008.safetensors",
"model.layers.2.content_moe.experts.5.w2.weight": "model-00003-of-00008.safetensors",
"model.layers.2.reasoning_moe.experts.5.w3.weight": "model-00003-of-00008.safetensors",
"model.layers.2.content_moe.experts.5.w3.weight": "model-00003-of-00008.safetensors",
"model.layers.2.reasoning_moe.experts.6.w1.weight": "model-00003-of-00008.safetensors",
"model.layers.2.content_moe.experts.6.w1.weight": "model-00003-of-00008.safetensors",
"model.layers.2.reasoning_moe.experts.6.w2.weight": "model-00003-of-00008.safetensors",
"model.layers.2.content_moe.experts.6.w2.weight": "model-00003-of-00008.safetensors",
"model.layers.2.reasoning_moe.experts.6.w3.weight": "model-00003-of-00008.safetensors",
"model.layers.2.content_moe.experts.6.w3.weight": "model-00003-of-00008.safetensors",
"model.layers.2.reasoning_moe.experts.7.w1.weight": "model-00003-of-00008.safetensors",
"model.layers.2.content_moe.experts.7.w1.weight": "model-00003-of-00008.safetensors",
"model.layers.2.reasoning_moe.experts.7.w2.weight": "model-00003-of-00008.safetensors",
"model.layers.2.content_moe.experts.7.w2.weight": "model-00003-of-00008.safetensors",
"model.layers.2.reasoning_moe.experts.7.w3.weight": "model-00003-of-00008.safetensors",
"model.layers.2.content_moe.experts.7.w3.weight": "model-00003-of-00008.safetensors",
"model.layers.2.reasoning_moe.gate.weight": "model-00003-of-00008.safetensors",
"model.layers.2.content_moe.gate.weight": "model-00003-of-00008.safetensors",
"model.layers.2.input_reasoning_layernorm.bias": "model-00003-of-00008.safetensors",
"model.layers.2.input_content_layernorm.bias": "model-00003-of-00008.safetensors",
"model.layers.2.input_reasoning_layernorm.weight": "model-00003-of-00008.safetensors",
"model.layers.2.input_content_layernorm.weight": "model-00003-of-00008.safetensors",
"model.layers.2.post_attention_reasoning_layernorm.bias": "model-00003-of-00008.safetensors",
"model.layers.2.post_attention_content_layernorm.bias": "model-00003-of-00008.safetensors",
"model.layers.2.post_attention_reasoning_layernorm.weight": "model-00003-of-00008.safetensors",
"model.layers.2.post_attention_content_layernorm.weight": "model-00003-of-00008.safetensors",
"model.layers.2.reasoning_self_attn.k_proj.bias": "model-00003-of-00008.safetensors",
"model.layers.2.content_self_attn.k_proj.bias": "model-00003-of-00008.safetensors",
"model.layers.2.reasoning_self_attn.k_proj.weight": "model-00003-of-00008.safetensors",
"model.layers.2.content_self_attn.k_proj.weight": "model-00003-of-00008.safetensors",
"model.layers.2.reasoning_self_attn.o_proj.bias": "model-00003-of-00008.safetensors",
"model.layers.2.content_self_attn.o_proj.bias": "model-00003-of-00008.safetensors",
"model.layers.2.reasoning_self_attn.o_proj.weight": "model-00003-of-00008.safetensors",
"model.layers.2.content_self_attn.o_proj.weight": "model-00003-of-00008.safetensors",
"model.layers.2.reasoning_self_attn.q_proj.bias": "model-00003-of-00008.safetensors",
"model.layers.2.content_self_attn.q_proj.bias": "model-00003-of-00008.safetensors",
"model.layers.2.reasoning_self_attn.q_proj.weight": "model-00003-of-00008.safetensors",
"model.layers.2.content_self_attn.q_proj.weight": "model-00003-of-00008.safetensors",
"model.layers.2.reasoning_self_attn.v_proj.bias": "model-00003-of-00008.safetensors",
"model.layers.2.content_self_attn.v_proj.bias": "model-00003-of-00008.safetensors",
"model.layers.2.reasoning_self_attn.v_proj.weight": "model-00003-of-00008.safetensors",
"model.layers.2.content_self_attn.v_proj.weight": "model-00003-of-00008.safetensors",
"model.layers.20.reasoning_moe.experts.0.w1.weight": "model-00003-of-00008.safetensors",
"model.layers.20.content_moe.experts.0.w1.weight": "model-00003-of-00008.safetensors",
"model.layers.20.reasoning_moe.experts.0.w2.weight": "model-00003-of-00008.safetensors",
"model.layers.20.content_moe.experts.0.w2.weight": "model-00003-of-00008.safetensors",
"model.layers.20.reasoning_moe.experts.0.w3.weight": "model-00003-of-00008.safetensors",
"model.layers.20.content_moe.experts.0.w3.weight": "model-00003-of-00008.safetensors",
"model.layers.20.reasoning_moe.experts.1.w1.weight": "model-00003-of-00008.safetensors",
"model.layers.20.content_moe.experts.1.w1.weight": "model-00003-of-00008.safetensors",
"model.layers.20.reasoning_moe.experts.1.w2.weight": "model-00003-of-00008.safetensors",
"model.layers.20.content_moe.experts.1.w2.weight": "model-00003-of-00008.safetensors",
"model.layers.20.reasoning_moe.experts.1.w3.weight": "model-00003-of-00008.safetensors",
"model.layers.20.content_moe.experts.1.w3.weight": "model-00003-of-00008.safetensors",
"model.layers.20.reasoning_moe.experts.2.w1.weight": "model-00003-of-00008.safetensors",
"model.layers.20.content_moe.experts.2.w1.weight": "model-00003-of-00008.safetensors",
"model.layers.20.reasoning_moe.experts.2.w2.weight": "model-00003-of-00008.safetensors",
"model.layers.20.content_moe.experts.2.w2.weight": "model-00003-of-00008.safetensors",
"model.layers.20.reasoning_moe.experts.2.w3.weight": "model-00003-of-00008.safetensors",
"model.layers.20.content_moe.experts.2.w3.weight": "model-00003-of-00008.safetensors",
"model.layers.20.reasoning_moe.experts.3.w1.weight": "model-00003-of-00008.safetensors",
"model.layers.20.content_moe.experts.3.w1.weight": "model-00003-of-00008.safetensors",
"model.layers.20.reasoning_moe.experts.3.w2.weight": "model-00003-of-00008.safetensors",
"model.layers.20.content_moe.experts.3.w2.weight": "model-00003-of-00008.safetensors",
"model.layers.20.reasoning_moe.experts.3.w3.weight": "model-00003-of-00008.safetensors",
"model.layers.20.content_moe.experts.3.w3.weight": "model-00003-of-00008.safetensors",
"model.layers.20.reasoning_moe.experts.4.w1.weight": "model-00003-of-00008.safetensors",
"model.layers.20.content_moe.experts.4.w1.weight": "model-00003-of-00008.safetensors",
"model.layers.20.reasoning_moe.experts.4.w2.weight": "model-00003-of-00008.safetensors",
"model.layers.20.content_moe.experts.4.w2.weight": "model-00003-of-00008.safetensors",
"model.layers.20.reasoning_moe.experts.4.w3.weight": "model-00003-of-00008.safetensors",
"model.layers.20.content_moe.experts.4.w3.weight": "model-00003-of-00008.safetensors",
"model.layers.20.reasoning_moe.experts.5.w1.weight": "model-00003-of-00008.safetensors",
"model.layers.20.content_moe.experts.5.w1.weight": "model-00003-of-00008.safetensors",
"model.layers.20.reasoning_moe.experts.5.w2.weight": "model-00003-of-00008.safetensors",
"model.layers.20.content_moe.experts.5.w2.weight": "model-00003-of-00008.safetensors",
"model.layers.20.reasoning_moe.experts.5.w3.weight": "model-00003-of-00008.safetensors",
"model.layers.20.content_moe.experts.5.w3.weight": "model-00003-of-00008.safetensors",
"model.layers.20.reasoning_moe.experts.6.w1.weight": "model-00003-of-00008.safetensors",
"model.layers.20.content_moe.experts.6.w1.weight": "model-00003-of-00008.safetensors",
"model.layers.20.reasoning_moe.experts.6.w2.weight": "model-00003-of-00008.safetensors",
"model.layers.20.content_moe.experts.6.w2.weight": "model-00003-of-00008.safetensors",
"model.layers.20.reasoning_moe.experts.6.w3.weight": "model-00003-of-00008.safetensors",
"model.layers.20.content_moe.experts.6.w3.weight": "model-00003-of-00008.safetensors",
"model.layers.20.reasoning_moe.experts.7.w1.weight": "model-00003-of-00008.safetensors",
"model.layers.20.content_moe.experts.7.w1.weight": "model-00003-of-00008.safetensors",
"model.layers.20.reasoning_moe.experts.7.w2.weight": "model-00003-of-00008.safetensors",
"model.layers.20.content_moe.experts.7.w2.weight": "model-00003-of-00008.safetensors",
"model.layers.20.reasoning_moe.experts.7.w3.weight": "model-00003-of-00008.safetensors",
"model.layers.20.content_moe.experts.7.w3.weight": "model-00003-of-00008.safetensors",
"model.layers.20.reasoning_moe.gate.weight": "model-00003-of-00008.safetensors",
"model.layers.20.content_moe.gate.weight": "model-00003-of-00008.safetensors",
"model.layers.20.input_reasoning_layernorm.bias": "model-00003-of-00008.safetensors",
"model.layers.20.input_content_layernorm.bias": "model-00003-of-00008.safetensors",
"model.layers.20.input_reasoning_layernorm.weight": "model-00003-of-00008.safetensors",
"model.layers.20.input_content_layernorm.weight": "model-00003-of-00008.safetensors",
"model.layers.20.post_attention_reasoning_layernorm.bias": "model-00003-of-00008.safetensors",
"model.layers.20.post_attention_content_layernorm.bias": "model-00003-of-00008.safetensors",
"model.layers.20.post_attention_reasoning_layernorm.weight": "model-00003-of-00008.safetensors",
"model.layers.20.post_attention_content_layernorm.weight": "model-00003-of-00008.safetensors",
"model.layers.20.reasoning_self_attn.k_proj.bias": "model-00003-of-00008.safetensors",
"model.layers.20.content_self_attn.k_proj.bias": "model-00003-of-00008.safetensors",
"model.layers.20.reasoning_self_attn.k_proj.weight": "model-00003-of-00008.safetensors",
"model.layers.20.content_self_attn.k_proj.weight": "model-00003-of-00008.safetensors",
"model.layers.20.reasoning_self_attn.o_proj.bias": "model-00003-of-00008.safetensors",
"model.layers.20.content_self_attn.o_proj.bias": "model-00003-of-00008.safetensors",
"model.layers.20.reasoning_self_attn.o_proj.weight": "model-00003-of-00008.safetensors",
"model.layers.20.content_self_attn.o_proj.weight": "model-00003-of-00008.safetensors",
"model.layers.20.reasoning_self_attn.q_proj.bias": "model-00003-of-00008.safetensors",
"model.layers.20.content_self_attn.q_proj.bias": "model-00003-of-00008.safetensors",
"model.layers.20.reasoning_self_attn.q_proj.weight": "model-00003-of-00008.safetensors",
"model.layers.20.content_self_attn.q_proj.weight": "model-00003-of-00008.safetensors",
"model.layers.20.reasoning_self_attn.v_proj.bias": "model-00003-of-00008.safetensors",
"model.layers.20.content_self_attn.v_proj.bias": "model-00003-of-00008.safetensors",
"model.layers.20.reasoning_self_attn.v_proj.weight": "model-00003-of-00008.safetensors",
"model.layers.20.content_self_attn.v_proj.weight": "model-00003-of-00008.safetensors",
"model.layers.21.reasoning_moe.experts.0.w1.weight": "model-00003-of-00008.safetensors",
"model.layers.21.content_moe.experts.0.w1.weight": "model-00003-of-00008.safetensors",
"model.layers.21.reasoning_moe.experts.0.w2.weight": "model-00003-of-00008.safetensors",
"model.layers.21.content_moe.experts.0.w2.weight": "model-00003-of-00008.safetensors",
"model.layers.21.reasoning_moe.experts.0.w3.weight": "model-00003-of-00008.safetensors",
"model.layers.21.content_moe.experts.0.w3.weight": "model-00003-of-00008.safetensors",
"model.layers.21.reasoning_moe.experts.1.w1.weight": "model-00003-of-00008.safetensors",
"model.layers.21.content_moe.experts.1.w1.weight": "model-00003-of-00008.safetensors",
"model.layers.21.reasoning_moe.experts.1.w2.weight": "model-00003-of-00008.safetensors",
"model.layers.21.content_moe.experts.1.w2.weight": "model-00003-of-00008.safetensors",
"model.layers.21.reasoning_moe.experts.1.w3.weight": "model-00003-of-00008.safetensors",
"model.layers.21.content_moe.experts.1.w3.weight": "model-00003-of-00008.safetensors",
"model.layers.21.reasoning_moe.experts.2.w1.weight": "model-00003-of-00008.safetensors",
"model.layers.21.content_moe.experts.2.w1.weight": "model-00003-of-00008.safetensors",
"model.layers.21.reasoning_moe.experts.2.w2.weight": "model-00003-of-00008.safetensors",
"model.layers.21.content_moe.experts.2.w2.weight": "model-00003-of-00008.safetensors",
"model.layers.21.reasoning_moe.experts.2.w3.weight": "model-00003-of-00008.safetensors",
"model.layers.21.content_moe.experts.2.w3.weight": "model-00003-of-00008.safetensors",
"model.layers.21.reasoning_moe.experts.3.w1.weight": "model-00003-of-00008.safetensors",
"model.layers.21.content_moe.experts.3.w1.weight": "model-00003-of-00008.safetensors",
"model.layers.21.reasoning_moe.experts.3.w2.weight": "model-00003-of-00008.safetensors",
"model.layers.21.content_moe.experts.3.w2.weight": "model-00003-of-00008.safetensors",
"model.layers.21.reasoning_moe.experts.3.w3.weight": "model-00003-of-00008.safetensors",
"model.layers.21.content_moe.experts.3.w3.weight": "model-00003-of-00008.safetensors",
"model.layers.21.reasoning_moe.experts.4.w1.weight": "model-00003-of-00008.safetensors",
"model.layers.21.content_moe.experts.4.w1.weight": "model-00003-of-00008.safetensors",
"model.layers.21.reasoning_moe.experts.4.w2.weight": "model-00003-of-00008.safetensors",
"model.layers.21.content_moe.experts.4.w2.weight": "model-00003-of-00008.safetensors",
"model.layers.21.reasoning_moe.experts.4.w3.weight": "model-00003-of-00008.safetensors",
"model.layers.21.content_moe.experts.4.w3.weight": "model-00003-of-00008.safetensors",
"model.layers.21.reasoning_moe.experts.5.w1.weight": "model-00003-of-00008.safetensors",
"model.layers.21.content_moe.experts.5.w1.weight": "model-00003-of-00008.safetensors",
"model.layers.21.reasoning_moe.experts.5.w2.weight": "model-00003-of-00008.safetensors",
"model.layers.21.content_moe.experts.5.w2.weight": "model-00003-of-00008.safetensors",
"model.layers.21.reasoning_moe.experts.5.w3.weight": "model-00003-of-00008.safetensors",
"model.layers.21.content_moe.experts.5.w3.weight": "model-00003-of-00008.safetensors",
"model.layers.21.reasoning_moe.experts.6.w1.weight": "model-00003-of-00008.safetensors",
"model.layers.21.content_moe.experts.6.w1.weight": "model-00003-of-00008.safetensors",
"model.layers.21.reasoning_moe.experts.6.w2.weight": "model-00003-of-00008.safetensors",
"model.layers.21.content_moe.experts.6.w2.weight": "model-00003-of-00008.safetensors",
"model.layers.21.reasoning_moe.experts.6.w3.weight": "model-00003-of-00008.safetensors",
"model.layers.21.content_moe.experts.6.w3.weight": "model-00003-of-00008.safetensors",
"model.layers.21.reasoning_moe.experts.7.w1.weight": "model-00003-of-00008.safetensors",
"model.layers.21.content_moe.experts.7.w1.weight": "model-00003-of-00008.safetensors",
"model.layers.21.reasoning_moe.experts.7.w2.weight": "model-00003-of-00008.safetensors",
"model.layers.21.content_moe.experts.7.w2.weight": "model-00003-of-00008.safetensors",
"model.layers.21.reasoning_moe.experts.7.w3.weight": "model-00003-of-00008.safetensors",
"model.layers.21.content_moe.experts.7.w3.weight": "model-00003-of-00008.safetensors",
"model.layers.21.reasoning_moe.gate.weight": "model-00003-of-00008.safetensors",
"model.layers.21.content_moe.gate.weight": "model-00003-of-00008.safetensors",
"model.layers.21.input_reasoning_layernorm.bias": "model-00003-of-00008.safetensors",
"model.layers.21.input_content_layernorm.bias": "model-00003-of-00008.safetensors",
"model.layers.21.input_reasoning_layernorm.weight": "model-00003-of-00008.safetensors",
"model.layers.21.input_content_layernorm.weight": "model-00003-of-00008.safetensors",
"model.layers.21.post_attention_reasoning_layernorm.bias": "model-00003-of-00008.safetensors",
"model.layers.21.post_attention_content_layernorm.bias": "model-00003-of-00008.safetensors",
"model.layers.21.post_attention_reasoning_layernorm.weight": "model-00003-of-00008.safetensors",
"model.layers.21.post_attention_content_layernorm.weight": "model-00003-of-00008.safetensors",
"model.layers.21.reasoning_self_attn.k_proj.bias": "model-00003-of-00008.safetensors",
"model.layers.21.content_self_attn.k_proj.bias": "model-00003-of-00008.safetensors",
"model.layers.21.reasoning_self_attn.k_proj.weight": "model-00003-of-00008.safetensors",
"model.layers.21.content_self_attn.k_proj.weight": "model-00003-of-00008.safetensors",
"model.layers.21.reasoning_self_attn.o_proj.bias": "model-00003-of-00008.safetensors",
"model.layers.21.content_self_attn.o_proj.bias": "model-00003-of-00008.safetensors",
"model.layers.21.reasoning_self_attn.o_proj.weight": "model-00003-of-00008.safetensors",
"model.layers.21.content_self_attn.o_proj.weight": "model-00003-of-00008.safetensors",
"model.layers.21.reasoning_self_attn.q_proj.bias": "model-00003-of-00008.safetensors",
"model.layers.21.content_self_attn.q_proj.bias": "model-00003-of-00008.safetensors",
"model.layers.21.reasoning_self_attn.q_proj.weight": "model-00003-of-00008.safetensors",
"model.layers.21.content_self_attn.q_proj.weight": "model-00003-of-00008.safetensors",
"model.layers.21.reasoning_self_attn.v_proj.bias": "model-00003-of-00008.safetensors",
"model.layers.21.content_self_attn.v_proj.bias": "model-00003-of-00008.safetensors",
"model.layers.21.reasoning_self_attn.v_proj.weight": "model-00003-of-00008.safetensors",
"model.layers.21.content_self_attn.v_proj.weight": "model-00003-of-00008.safetensors",
"model.layers.22.reasoning_moe.experts.0.w1.weight": "model-00003-of-00008.safetensors",
"model.layers.22.content_moe.experts.0.w1.weight": "model-00003-of-00008.safetensors",
"model.layers.22.reasoning_moe.experts.0.w2.weight": "model-00003-of-00008.safetensors",
"model.layers.22.content_moe.experts.0.w2.weight": "model-00003-of-00008.safetensors",
"model.layers.22.reasoning_moe.experts.0.w3.weight": "model-00003-of-00008.safetensors",
"model.layers.22.content_moe.experts.0.w3.weight": "model-00003-of-00008.safetensors",
"model.layers.22.reasoning_moe.experts.1.w1.weight": "model-00003-of-00008.safetensors",
"model.layers.22.content_moe.experts.1.w1.weight": "model-00003-of-00008.safetensors",
"model.layers.22.reasoning_moe.experts.1.w2.weight": "model-00003-of-00008.safetensors",
"model.layers.22.content_moe.experts.1.w2.weight": "model-00003-of-00008.safetensors",
"model.layers.22.reasoning_moe.experts.1.w3.weight": "model-00003-of-00008.safetensors",
"model.layers.22.content_moe.experts.1.w3.weight": "model-00003-of-00008.safetensors",
"model.layers.22.reasoning_moe.experts.2.w1.weight": "model-00003-of-00008.safetensors",
"model.layers.22.content_moe.experts.2.w1.weight": "model-00003-of-00008.safetensors",
"model.layers.22.reasoning_moe.experts.2.w2.weight": "model-00003-of-00008.safetensors",
"model.layers.22.content_moe.experts.2.w2.weight": "model-00003-of-00008.safetensors",
"model.layers.22.reasoning_moe.experts.2.w3.weight": "model-00003-of-00008.safetensors",
"model.layers.22.content_moe.experts.2.w3.weight": "model-00003-of-00008.safetensors",
"model.layers.22.reasoning_moe.experts.3.w1.weight": "model-00003-of-00008.safetensors",
"model.layers.22.content_moe.experts.3.w1.weight": "model-00003-of-00008.safetensors",
"model.layers.22.reasoning_moe.experts.3.w2.weight": "model-00003-of-00008.safetensors",
"model.layers.22.content_moe.experts.3.w2.weight": "model-00003-of-00008.safetensors",
"model.layers.22.reasoning_moe.experts.3.w3.weight": "model-00003-of-00008.safetensors",
"model.layers.22.content_moe.experts.3.w3.weight": "model-00003-of-00008.safetensors",
"model.layers.22.reasoning_moe.experts.4.w1.weight": "model-00003-of-00008.safetensors",
"model.layers.22.content_moe.experts.4.w1.weight": "model-00003-of-00008.safetensors",
"model.layers.22.reasoning_moe.experts.4.w2.weight": "model-00003-of-00008.safetensors",
"model.layers.22.content_moe.experts.4.w2.weight": "model-00003-of-00008.safetensors",
"model.layers.22.reasoning_moe.experts.4.w3.weight": "model-00003-of-00008.safetensors",
"model.layers.22.content_moe.experts.4.w3.weight": "model-00003-of-00008.safetensors",
"model.layers.22.reasoning_moe.experts.5.w1.weight": "model-00003-of-00008.safetensors",
"model.layers.22.content_moe.experts.5.w1.weight": "model-00003-of-00008.safetensors",
"model.layers.22.reasoning_moe.experts.5.w2.weight": "model-00003-of-00008.safetensors",
"model.layers.22.content_moe.experts.5.w2.weight": "model-00003-of-00008.safetensors",
"model.layers.22.reasoning_moe.experts.5.w3.weight": "model-00003-of-00008.safetensors",
"model.layers.22.content_moe.experts.5.w3.weight": "model-00003-of-00008.safetensors",
"model.layers.22.reasoning_moe.experts.6.w1.weight": "model-00003-of-00008.safetensors",
"model.layers.22.content_moe.experts.6.w1.weight": "model-00003-of-00008.safetensors",
"model.layers.22.reasoning_moe.experts.6.w2.weight": "model-00003-of-00008.safetensors",
"model.layers.22.content_moe.experts.6.w2.weight": "model-00003-of-00008.safetensors",
"model.layers.22.reasoning_moe.experts.6.w3.weight": "model-00003-of-00008.safetensors",
"model.layers.22.content_moe.experts.6.w3.weight": "model-00003-of-00008.safetensors",
"model.layers.22.reasoning_moe.experts.7.w1.weight": "model-00003-of-00008.safetensors",
"model.layers.22.content_moe.experts.7.w1.weight": "model-00003-of-00008.safetensors",
"model.layers.22.reasoning_moe.experts.7.w2.weight": "model-00003-of-00008.safetensors",
"model.layers.22.content_moe.experts.7.w2.weight": "model-00003-of-00008.safetensors",
"model.layers.22.reasoning_moe.experts.7.w3.weight": "model-00003-of-00008.safetensors",
"model.layers.22.content_moe.experts.7.w3.weight": "model-00003-of-00008.safetensors",
"model.layers.22.reasoning_moe.gate.weight": "model-00003-of-00008.safetensors",
"model.layers.22.content_moe.gate.weight": "model-00003-of-00008.safetensors",
"model.layers.22.input_reasoning_layernorm.bias": "model-00003-of-00008.safetensors",
"model.layers.22.input_content_layernorm.bias": "model-00003-of-00008.safetensors",
"model.layers.22.input_reasoning_layernorm.weight": "model-00003-of-00008.safetensors",
"model.layers.22.input_content_layernorm.weight": "model-00003-of-00008.safetensors",
"model.layers.22.post_attention_reasoning_layernorm.bias": "model-00003-of-00008.safetensors",
"model.layers.22.post_attention_content_layernorm.bias": "model-00003-of-00008.safetensors",
"model.layers.22.post_attention_reasoning_layernorm.weight": "model-00003-of-00008.safetensors",
"model.layers.22.post_attention_content_layernorm.weight": "model-00003-of-00008.safetensors",
"model.layers.22.reasoning_self_attn.k_proj.bias": "model-00003-of-00008.safetensors",
"model.layers.22.content_self_attn.k_proj.bias": "model-00003-of-00008.safetensors",
"model.layers.22.reasoning_self_attn.k_proj.weight": "model-00003-of-00008.safetensors",
"model.layers.22.content_self_attn.k_proj.weight": "model-00003-of-00008.safetensors",
"model.layers.22.reasoning_self_attn.o_proj.bias": "model-00003-of-00008.safetensors",
"model.layers.22.content_self_attn.o_proj.bias": "model-00003-of-00008.safetensors",
"model.layers.22.reasoning_self_attn.o_proj.weight": "model-00003-of-00008.safetensors",
"model.layers.22.content_self_attn.o_proj.weight": "model-00003-of-00008.safetensors",
"model.layers.22.reasoning_self_attn.q_proj.bias": "model-00003-of-00008.safetensors",
"model.layers.22.content_self_attn.q_proj.bias": "model-00003-of-00008.safetensors",
"model.layers.22.reasoning_self_attn.q_proj.weight": "model-00003-of-00008.safetensors",
"model.layers.22.content_self_attn.q_proj.weight": "model-00003-of-00008.safetensors",
"model.layers.22.reasoning_self_attn.v_proj.bias": "model-00003-of-00008.safetensors",
"model.layers.22.content_self_attn.v_proj.bias": "model-00003-of-00008.safetensors",
"model.layers.22.reasoning_self_attn.v_proj.weight": "model-00003-of-00008.safetensors",
"model.layers.22.content_self_attn.v_proj.weight": "model-00003-of-00008.safetensors",
"model.layers.23.reasoning_moe.experts.0.w1.weight": "model-00003-of-00008.safetensors",
"model.layers.23.content_moe.experts.0.w1.weight": "model-00003-of-00008.safetensors",
"model.layers.23.reasoning_moe.experts.0.w2.weight": "model-00003-of-00008.safetensors",
"model.layers.23.content_moe.experts.0.w2.weight": "model-00003-of-00008.safetensors",
"model.layers.23.reasoning_moe.experts.0.w3.weight": "model-00004-of-00008.safetensors",
"model.layers.23.content_moe.experts.0.w3.weight": "model-00004-of-00008.safetensors",
"model.layers.23.reasoning_moe.experts.1.w1.weight": "model-00004-of-00008.safetensors",
"model.layers.23.content_moe.experts.1.w1.weight": "model-00004-of-00008.safetensors",
"model.layers.23.reasoning_moe.experts.1.w2.weight": "model-00004-of-00008.safetensors",
"model.layers.23.content_moe.experts.1.w2.weight": "model-00004-of-00008.safetensors",
"model.layers.23.reasoning_moe.experts.1.w3.weight": "model-00004-of-00008.safetensors",
"model.layers.23.content_moe.experts.1.w3.weight": "model-00004-of-00008.safetensors",
"model.layers.23.reasoning_moe.experts.2.w1.weight": "model-00004-of-00008.safetensors",
"model.layers.23.content_moe.experts.2.w1.weight": "model-00004-of-00008.safetensors",
"model.layers.23.reasoning_moe.experts.2.w2.weight": "model-00004-of-00008.safetensors",
"model.layers.23.content_moe.experts.2.w2.weight": "model-00004-of-00008.safetensors",
"model.layers.23.reasoning_moe.experts.2.w3.weight": "model-00004-of-00008.safetensors",
"model.layers.23.content_moe.experts.2.w3.weight": "model-00004-of-00008.safetensors",
"model.layers.23.reasoning_moe.experts.3.w1.weight": "model-00004-of-00008.safetensors",
"model.layers.23.content_moe.experts.3.w1.weight": "model-00004-of-00008.safetensors",
"model.layers.23.reasoning_moe.experts.3.w2.weight": "model-00004-of-00008.safetensors",
"model.layers.23.content_moe.experts.3.w2.weight": "model-00004-of-00008.safetensors",
"model.layers.23.reasoning_moe.experts.3.w3.weight": "model-00004-of-00008.safetensors",
"model.layers.23.content_moe.experts.3.w3.weight": "model-00004-of-00008.safetensors",
"model.layers.23.reasoning_moe.experts.4.w1.weight": "model-00004-of-00008.safetensors",
"model.layers.23.content_moe.experts.4.w1.weight": "model-00004-of-00008.safetensors",
"model.layers.23.reasoning_moe.experts.4.w2.weight": "model-00004-of-00008.safetensors",
"model.layers.23.content_moe.experts.4.w2.weight": "model-00004-of-00008.safetensors",
"model.layers.23.reasoning_moe.experts.4.w3.weight": "model-00004-of-00008.safetensors",
"model.layers.23.content_moe.experts.4.w3.weight": "model-00004-of-00008.safetensors",
"model.layers.23.reasoning_moe.experts.5.w1.weight": "model-00004-of-00008.safetensors",
"model.layers.23.content_moe.experts.5.w1.weight": "model-00004-of-00008.safetensors",
"model.layers.23.reasoning_moe.experts.5.w2.weight": "model-00004-of-00008.safetensors",
"model.layers.23.content_moe.experts.5.w2.weight": "model-00004-of-00008.safetensors",
"model.layers.23.reasoning_moe.experts.5.w3.weight": "model-00004-of-00008.safetensors",
"model.layers.23.content_moe.experts.5.w3.weight": "model-00004-of-00008.safetensors",
"model.layers.23.reasoning_moe.experts.6.w1.weight": "model-00004-of-00008.safetensors",
"model.layers.23.content_moe.experts.6.w1.weight": "model-00004-of-00008.safetensors",
"model.layers.23.reasoning_moe.experts.6.w2.weight": "model-00004-of-00008.safetensors",
"model.layers.23.content_moe.experts.6.w2.weight": "model-00004-of-00008.safetensors",
"model.layers.23.reasoning_moe.experts.6.w3.weight": "model-00004-of-00008.safetensors",
"model.layers.23.content_moe.experts.6.w3.weight": "model-00004-of-00008.safetensors",
"model.layers.23.reasoning_moe.experts.7.w1.weight": "model-00004-of-00008.safetensors",
"model.layers.23.content_moe.experts.7.w1.weight": "model-00004-of-00008.safetensors",
"model.layers.23.reasoning_moe.experts.7.w2.weight": "model-00004-of-00008.safetensors",
"model.layers.23.content_moe.experts.7.w2.weight": "model-00004-of-00008.safetensors",
"model.layers.23.reasoning_moe.experts.7.w3.weight": "model-00004-of-00008.safetensors",
"model.layers.23.content_moe.experts.7.w3.weight": "model-00004-of-00008.safetensors",
"model.layers.23.reasoning_moe.gate.weight": "model-00004-of-00008.safetensors",
"model.layers.23.content_moe.gate.weight": "model-00004-of-00008.safetensors",
"model.layers.23.input_reasoning_layernorm.bias": "model-00004-of-00008.safetensors",
"model.layers.23.input_content_layernorm.bias": "model-00004-of-00008.safetensors",
"model.layers.23.input_reasoning_layernorm.weight": "model-00004-of-00008.safetensors",
"model.layers.23.input_content_layernorm.weight": "model-00004-of-00008.safetensors",
"model.layers.23.post_attention_reasoning_layernorm.bias": "model-00004-of-00008.safetensors",
"model.layers.23.post_attention_content_layernorm.bias": "model-00004-of-00008.safetensors",
"model.layers.23.post_attention_reasoning_layernorm.weight": "model-00004-of-00008.safetensors",
"model.layers.23.post_attention_content_layernorm.weight": "model-00004-of-00008.safetensors",
"model.layers.23.reasoning_self_attn.k_proj.bias": "model-00004-of-00008.safetensors",
"model.layers.23.content_self_attn.k_proj.bias": "model-00004-of-00008.safetensors",
"model.layers.23.reasoning_self_attn.k_proj.weight": "model-00004-of-00008.safetensors",
"model.layers.23.content_self_attn.k_proj.weight": "model-00004-of-00008.safetensors",
"model.layers.23.reasoning_self_attn.o_proj.bias": "model-00004-of-00008.safetensors",
"model.layers.23.content_self_attn.o_proj.bias": "model-00004-of-00008.safetensors",
"model.layers.23.reasoning_self_attn.o_proj.weight": "model-00004-of-00008.safetensors",
"model.layers.23.content_self_attn.o_proj.weight": "model-00004-of-00008.safetensors",
"model.layers.23.reasoning_self_attn.q_proj.bias": "model-00004-of-00008.safetensors",
"model.layers.23.content_self_attn.q_proj.bias": "model-00004-of-00008.safetensors",
"model.layers.23.reasoning_self_attn.q_proj.weight": "model-00004-of-00008.safetensors",
"model.layers.23.content_self_attn.q_proj.weight": "model-00004-of-00008.safetensors",
"model.layers.23.reasoning_self_attn.v_proj.bias": "model-00004-of-00008.safetensors",
"model.layers.23.content_self_attn.v_proj.bias": "model-00004-of-00008.safetensors",
"model.layers.23.reasoning_self_attn.v_proj.weight": "model-00004-of-00008.safetensors",
"model.layers.23.content_self_attn.v_proj.weight": "model-00004-of-00008.safetensors",
"model.layers.24.reasoning_moe.experts.0.w1.weight": "model-00004-of-00008.safetensors",
"model.layers.24.content_moe.experts.0.w1.weight": "model-00004-of-00008.safetensors",
"model.layers.24.reasoning_moe.experts.0.w2.weight": "model-00004-of-00008.safetensors",
"model.layers.24.content_moe.experts.0.w2.weight": "model-00004-of-00008.safetensors",
"model.layers.24.reasoning_moe.experts.0.w3.weight": "model-00004-of-00008.safetensors",
"model.layers.24.content_moe.experts.0.w3.weight": "model-00004-of-00008.safetensors",
"model.layers.24.reasoning_moe.experts.1.w1.weight": "model-00004-of-00008.safetensors",
"model.layers.24.content_moe.experts.1.w1.weight": "model-00004-of-00008.safetensors",
"model.layers.24.reasoning_moe.experts.1.w2.weight": "model-00004-of-00008.safetensors",
"model.layers.24.content_moe.experts.1.w2.weight": "model-00004-of-00008.safetensors",
"model.layers.24.reasoning_moe.experts.1.w3.weight": "model-00004-of-00008.safetensors",
"model.layers.24.content_moe.experts.1.w3.weight": "model-00004-of-00008.safetensors",
"model.layers.24.reasoning_moe.experts.2.w1.weight": "model-00004-of-00008.safetensors",
"model.layers.24.content_moe.experts.2.w1.weight": "model-00004-of-00008.safetensors",
"model.layers.24.reasoning_moe.experts.2.w2.weight": "model-00004-of-00008.safetensors",
"model.layers.24.content_moe.experts.2.w2.weight": "model-00004-of-00008.safetensors",
"model.layers.24.reasoning_moe.experts.2.w3.weight": "model-00004-of-00008.safetensors",
"model.layers.24.content_moe.experts.2.w3.weight": "model-00004-of-00008.safetensors",
"model.layers.24.reasoning_moe.experts.3.w1.weight": "model-00004-of-00008.safetensors",
"model.layers.24.content_moe.experts.3.w1.weight": "model-00004-of-00008.safetensors",
"model.layers.24.reasoning_moe.experts.3.w2.weight": "model-00004-of-00008.safetensors",
"model.layers.24.content_moe.experts.3.w2.weight": "model-00004-of-00008.safetensors",
"model.layers.24.reasoning_moe.experts.3.w3.weight": "model-00004-of-00008.safetensors",
"model.layers.24.content_moe.experts.3.w3.weight": "model-00004-of-00008.safetensors",
"model.layers.24.reasoning_moe.experts.4.w1.weight": "model-00004-of-00008.safetensors",
"model.layers.24.content_moe.experts.4.w1.weight": "model-00004-of-00008.safetensors",
"model.layers.24.reasoning_moe.experts.4.w2.weight": "model-00004-of-00008.safetensors",
"model.layers.24.content_moe.experts.4.w2.weight": "model-00004-of-00008.safetensors",
"model.layers.24.reasoning_moe.experts.4.w3.weight": "model-00004-of-00008.safetensors",
"model.layers.24.content_moe.experts.4.w3.weight": "model-00004-of-00008.safetensors",
"model.layers.24.reasoning_moe.experts.5.w1.weight": "model-00004-of-00008.safetensors",
"model.layers.24.content_moe.experts.5.w1.weight": "model-00004-of-00008.safetensors",
"model.layers.24.reasoning_moe.experts.5.w2.weight": "model-00004-of-00008.safetensors",
"model.layers.24.content_moe.experts.5.w2.weight": "model-00004-of-00008.safetensors",
"model.layers.24.reasoning_moe.experts.5.w3.weight": "model-00004-of-00008.safetensors",
"model.layers.24.content_moe.experts.5.w3.weight": "model-00004-of-00008.safetensors",
"model.layers.24.reasoning_moe.experts.6.w1.weight": "model-00004-of-00008.safetensors",
"model.layers.24.content_moe.experts.6.w1.weight": "model-00004-of-00008.safetensors",
"model.layers.24.reasoning_moe.experts.6.w2.weight": "model-00004-of-00008.safetensors",
"model.layers.24.content_moe.experts.6.w2.weight": "model-00004-of-00008.safetensors",
"model.layers.24.reasoning_moe.experts.6.w3.weight": "model-00004-of-00008.safetensors",
"model.layers.24.content_moe.experts.6.w3.weight": "model-00004-of-00008.safetensors",
"model.layers.24.reasoning_moe.experts.7.w1.weight": "model-00004-of-00008.safetensors",
"model.layers.24.content_moe.experts.7.w1.weight": "model-00004-of-00008.safetensors",
"model.layers.24.reasoning_moe.experts.7.w2.weight": "model-00004-of-00008.safetensors",
"model.layers.24.content_moe.experts.7.w2.weight": "model-00004-of-00008.safetensors",
"model.layers.24.reasoning_moe.experts.7.w3.weight": "model-00004-of-00008.safetensors",
"model.layers.24.content_moe.experts.7.w3.weight": "model-00004-of-00008.safetensors",
"model.layers.24.reasoning_moe.gate.weight": "model-00004-of-00008.safetensors",
"model.layers.24.content_moe.gate.weight": "model-00004-of-00008.safetensors",
"model.layers.24.input_reasoning_layernorm.bias": "model-00004-of-00008.safetensors",
"model.layers.24.input_content_layernorm.bias": "model-00004-of-00008.safetensors",
"model.layers.24.input_reasoning_layernorm.weight": "model-00004-of-00008.safetensors",
"model.layers.24.input_content_layernorm.weight": "model-00004-of-00008.safetensors",
"model.layers.24.post_attention_reasoning_layernorm.bias": "model-00004-of-00008.safetensors",
"model.layers.24.post_attention_content_layernorm.bias": "model-00004-of-00008.safetensors",
"model.layers.24.post_attention_reasoning_layernorm.weight": "model-00004-of-00008.safetensors",
"model.layers.24.post_attention_content_layernorm.weight": "model-00004-of-00008.safetensors",
"model.layers.24.reasoning_self_attn.k_proj.bias": "model-00004-of-00008.safetensors",
"model.layers.24.content_self_attn.k_proj.bias": "model-00004-of-00008.safetensors",
"model.layers.24.reasoning_self_attn.k_proj.weight": "model-00004-of-00008.safetensors",
"model.layers.24.content_self_attn.k_proj.weight": "model-00004-of-00008.safetensors",
"model.layers.24.reasoning_self_attn.o_proj.bias": "model-00004-of-00008.safetensors",
"model.layers.24.content_self_attn.o_proj.bias": "model-00004-of-00008.safetensors",
"model.layers.24.reasoning_self_attn.o_proj.weight": "model-00004-of-00008.safetensors",
"model.layers.24.content_self_attn.o_proj.weight": "model-00004-of-00008.safetensors",
"model.layers.24.reasoning_self_attn.q_proj.bias": "model-00004-of-00008.safetensors",
"model.layers.24.content_self_attn.q_proj.bias": "model-00004-of-00008.safetensors",
"model.layers.24.reasoning_self_attn.q_proj.weight": "model-00004-of-00008.safetensors",
"model.layers.24.content_self_attn.q_proj.weight": "model-00004-of-00008.safetensors",
"model.layers.24.reasoning_self_attn.v_proj.bias": "model-00004-of-00008.safetensors",
"model.layers.24.content_self_attn.v_proj.bias": "model-00004-of-00008.safetensors",
"model.layers.24.reasoning_self_attn.v_proj.weight": "model-00004-of-00008.safetensors",
"model.layers.24.content_self_attn.v_proj.weight": "model-00004-of-00008.safetensors",
"model.layers.25.reasoning_moe.experts.0.w1.weight": "model-00004-of-00008.safetensors",
"model.layers.25.content_moe.experts.0.w1.weight": "model-00004-of-00008.safetensors",
"model.layers.25.reasoning_moe.experts.0.w2.weight": "model-00004-of-00008.safetensors",
"model.layers.25.content_moe.experts.0.w2.weight": "model-00004-of-00008.safetensors",
"model.layers.25.reasoning_moe.experts.0.w3.weight": "model-00004-of-00008.safetensors",
"model.layers.25.content_moe.experts.0.w3.weight": "model-00004-of-00008.safetensors",
"model.layers.25.reasoning_moe.experts.1.w1.weight": "model-00004-of-00008.safetensors",
"model.layers.25.content_moe.experts.1.w1.weight": "model-00004-of-00008.safetensors",
"model.layers.25.reasoning_moe.experts.1.w2.weight": "model-00004-of-00008.safetensors",
"model.layers.25.content_moe.experts.1.w2.weight": "model-00004-of-00008.safetensors",
"model.layers.25.reasoning_moe.experts.1.w3.weight": "model-00004-of-00008.safetensors",
"model.layers.25.content_moe.experts.1.w3.weight": "model-00004-of-00008.safetensors",
"model.layers.25.reasoning_moe.experts.2.w1.weight": "model-00004-of-00008.safetensors",
"model.layers.25.content_moe.experts.2.w1.weight": "model-00004-of-00008.safetensors",
"model.layers.25.reasoning_moe.experts.2.w2.weight": "model-00004-of-00008.safetensors",
"model.layers.25.content_moe.experts.2.w2.weight": "model-00004-of-00008.safetensors",
"model.layers.25.reasoning_moe.experts.2.w3.weight": "model-00004-of-00008.safetensors",
"model.layers.25.content_moe.experts.2.w3.weight": "model-00004-of-00008.safetensors",
"model.layers.25.reasoning_moe.experts.3.w1.weight": "model-00004-of-00008.safetensors",
"model.layers.25.content_moe.experts.3.w1.weight": "model-00004-of-00008.safetensors",
"model.layers.25.reasoning_moe.experts.3.w2.weight": "model-00004-of-00008.safetensors",
"model.layers.25.content_moe.experts.3.w2.weight": "model-00004-of-00008.safetensors",
"model.layers.25.reasoning_moe.experts.3.w3.weight": "model-00004-of-00008.safetensors",
"model.layers.25.content_moe.experts.3.w3.weight": "model-00004-of-00008.safetensors",
"model.layers.25.reasoning_moe.experts.4.w1.weight": "model-00004-of-00008.safetensors",
"model.layers.25.content_moe.experts.4.w1.weight": "model-00004-of-00008.safetensors",
"model.layers.25.reasoning_moe.experts.4.w2.weight": "model-00004-of-00008.safetensors",
"model.layers.25.content_moe.experts.4.w2.weight": "model-00004-of-00008.safetensors",
"model.layers.25.reasoning_moe.experts.4.w3.weight": "model-00004-of-00008.safetensors",
"model.layers.25.content_moe.experts.4.w3.weight": "model-00004-of-00008.safetensors",
"model.layers.25.reasoning_moe.experts.5.w1.weight": "model-00004-of-00008.safetensors",
"model.layers.25.content_moe.experts.5.w1.weight": "model-00004-of-00008.safetensors",
"model.layers.25.reasoning_moe.experts.5.w2.weight": "model-00004-of-00008.safetensors",
"model.layers.25.content_moe.experts.5.w2.weight": "model-00004-of-00008.safetensors",
"model.layers.25.reasoning_moe.experts.5.w3.weight": "model-00004-of-00008.safetensors",
"model.layers.25.content_moe.experts.5.w3.weight": "model-00004-of-00008.safetensors",
"model.layers.25.reasoning_moe.experts.6.w1.weight": "model-00004-of-00008.safetensors",
"model.layers.25.content_moe.experts.6.w1.weight": "model-00004-of-00008.safetensors",
"model.layers.25.reasoning_moe.experts.6.w2.weight": "model-00004-of-00008.safetensors",
"model.layers.25.content_moe.experts.6.w2.weight": "model-00004-of-00008.safetensors",
"model.layers.25.reasoning_moe.experts.6.w3.weight": "model-00004-of-00008.safetensors",
"model.layers.25.content_moe.experts.6.w3.weight": "model-00004-of-00008.safetensors",
"model.layers.25.reasoning_moe.experts.7.w1.weight": "model-00004-of-00008.safetensors",
"model.layers.25.content_moe.experts.7.w1.weight": "model-00004-of-00008.safetensors",
"model.layers.25.reasoning_moe.experts.7.w2.weight": "model-00004-of-00008.safetensors",
"model.layers.25.content_moe.experts.7.w2.weight": "model-00004-of-00008.safetensors",
"model.layers.25.reasoning_moe.experts.7.w3.weight": "model-00004-of-00008.safetensors",
"model.layers.25.content_moe.experts.7.w3.weight": "model-00004-of-00008.safetensors",
"model.layers.25.reasoning_moe.gate.weight": "model-00004-of-00008.safetensors",
"model.layers.25.content_moe.gate.weight": "model-00004-of-00008.safetensors",
"model.layers.25.input_reasoning_layernorm.bias": "model-00004-of-00008.safetensors",
"model.layers.25.input_content_layernorm.bias": "model-00004-of-00008.safetensors",
"model.layers.25.input_reasoning_layernorm.weight": "model-00004-of-00008.safetensors",
"model.layers.25.input_content_layernorm.weight": "model-00004-of-00008.safetensors",
"model.layers.25.post_attention_reasoning_layernorm.bias": "model-00004-of-00008.safetensors",
"model.layers.25.post_attention_content_layernorm.bias": "model-00004-of-00008.safetensors",
"model.layers.25.post_attention_reasoning_layernorm.weight": "model-00004-of-00008.safetensors",
"model.layers.25.post_attention_content_layernorm.weight": "model-00004-of-00008.safetensors",
"model.layers.25.reasoning_self_attn.k_proj.bias": "model-00004-of-00008.safetensors",
"model.layers.25.content_self_attn.k_proj.bias": "model-00004-of-00008.safetensors",
"model.layers.25.reasoning_self_attn.k_proj.weight": "model-00004-of-00008.safetensors",
"model.layers.25.content_self_attn.k_proj.weight": "model-00004-of-00008.safetensors",
"model.layers.25.reasoning_self_attn.o_proj.bias": "model-00004-of-00008.safetensors",
"model.layers.25.content_self_attn.o_proj.bias": "model-00004-of-00008.safetensors",
"model.layers.25.reasoning_self_attn.o_proj.weight": "model-00004-of-00008.safetensors",
"model.layers.25.content_self_attn.o_proj.weight": "model-00004-of-00008.safetensors",
"model.layers.25.reasoning_self_attn.q_proj.bias": "model-00004-of-00008.safetensors",
"model.layers.25.content_self_attn.q_proj.bias": "model-00004-of-00008.safetensors",
"model.layers.25.reasoning_self_attn.q_proj.weight": "model-00004-of-00008.safetensors",
"model.layers.25.content_self_attn.q_proj.weight": "model-00004-of-00008.safetensors",
"model.layers.25.reasoning_self_attn.v_proj.bias": "model-00004-of-00008.safetensors",
"model.layers.25.content_self_attn.v_proj.bias": "model-00004-of-00008.safetensors",
"model.layers.25.reasoning_self_attn.v_proj.weight": "model-00004-of-00008.safetensors",
"model.layers.25.content_self_attn.v_proj.weight": "model-00004-of-00008.safetensors",
"model.layers.26.reasoning_moe.experts.0.w1.weight": "model-00004-of-00008.safetensors",
"model.layers.26.content_moe.experts.0.w1.weight": "model-00004-of-00008.safetensors",
"model.layers.26.reasoning_moe.experts.0.w2.weight": "model-00004-of-00008.safetensors",
"model.layers.26.content_moe.experts.0.w2.weight": "model-00004-of-00008.safetensors",
"model.layers.26.reasoning_moe.experts.0.w3.weight": "model-00004-of-00008.safetensors",
"model.layers.26.content_moe.experts.0.w3.weight": "model-00004-of-00008.safetensors",
"model.layers.26.reasoning_moe.experts.1.w1.weight": "model-00004-of-00008.safetensors",
"model.layers.26.content_moe.experts.1.w1.weight": "model-00004-of-00008.safetensors",
"model.layers.26.reasoning_moe.experts.1.w2.weight": "model-00004-of-00008.safetensors",
"model.layers.26.content_moe.experts.1.w2.weight": "model-00004-of-00008.safetensors",
"model.layers.26.reasoning_moe.experts.1.w3.weight": "model-00004-of-00008.safetensors",
"model.layers.26.content_moe.experts.1.w3.weight": "model-00004-of-00008.safetensors",
"model.layers.26.reasoning_moe.experts.2.w1.weight": "model-00004-of-00008.safetensors",
"model.layers.26.content_moe.experts.2.w1.weight": "model-00004-of-00008.safetensors",
"model.layers.26.reasoning_moe.experts.2.w2.weight": "model-00004-of-00008.safetensors",
"model.layers.26.content_moe.experts.2.w2.weight": "model-00004-of-00008.safetensors",
"model.layers.26.reasoning_moe.experts.2.w3.weight": "model-00004-of-00008.safetensors",
"model.layers.26.content_moe.experts.2.w3.weight": "model-00004-of-00008.safetensors",
"model.layers.26.reasoning_moe.experts.3.w1.weight": "model-00004-of-00008.safetensors",
"model.layers.26.content_moe.experts.3.w1.weight": "model-00004-of-00008.safetensors",
"model.layers.26.reasoning_moe.experts.3.w2.weight": "model-00004-of-00008.safetensors",
"model.layers.26.content_moe.experts.3.w2.weight": "model-00004-of-00008.safetensors",
"model.layers.26.reasoning_moe.experts.3.w3.weight": "model-00004-of-00008.safetensors",
"model.layers.26.content_moe.experts.3.w3.weight": "model-00004-of-00008.safetensors",
"model.layers.26.reasoning_moe.experts.4.w1.weight": "model-00004-of-00008.safetensors",
"model.layers.26.content_moe.experts.4.w1.weight": "model-00004-of-00008.safetensors",
"model.layers.26.reasoning_moe.experts.4.w2.weight": "model-00004-of-00008.safetensors",
"model.layers.26.content_moe.experts.4.w2.weight": "model-00004-of-00008.safetensors",
"model.layers.26.reasoning_moe.experts.4.w3.weight": "model-00004-of-00008.safetensors",
"model.layers.26.content_moe.experts.4.w3.weight": "model-00004-of-00008.safetensors",
"model.layers.26.reasoning_moe.experts.5.w1.weight": "model-00004-of-00008.safetensors",
"model.layers.26.content_moe.experts.5.w1.weight": "model-00004-of-00008.safetensors",
"model.layers.26.reasoning_moe.experts.5.w2.weight": "model-00004-of-00008.safetensors",
"model.layers.26.content_moe.experts.5.w2.weight": "model-00004-of-00008.safetensors",
"model.layers.26.reasoning_moe.experts.5.w3.weight": "model-00004-of-00008.safetensors",
"model.layers.26.content_moe.experts.5.w3.weight": "model-00004-of-00008.safetensors",
"model.layers.26.reasoning_moe.experts.6.w1.weight": "model-00004-of-00008.safetensors",
"model.layers.26.content_moe.experts.6.w1.weight": "model-00004-of-00008.safetensors",
"model.layers.26.reasoning_moe.experts.6.w2.weight": "model-00004-of-00008.safetensors",
"model.layers.26.content_moe.experts.6.w2.weight": "model-00004-of-00008.safetensors",
"model.layers.26.reasoning_moe.experts.6.w3.weight": "model-00004-of-00008.safetensors",
"model.layers.26.content_moe.experts.6.w3.weight": "model-00004-of-00008.safetensors",
"model.layers.26.reasoning_moe.experts.7.w1.weight": "model-00004-of-00008.safetensors",
"model.layers.26.content_moe.experts.7.w1.weight": "model-00004-of-00008.safetensors",
"model.layers.26.reasoning_moe.experts.7.w2.weight": "model-00004-of-00008.safetensors",
"model.layers.26.content_moe.experts.7.w2.weight": "model-00004-of-00008.safetensors",
"model.layers.26.reasoning_moe.experts.7.w3.weight": "model-00004-of-00008.safetensors",
"model.layers.26.content_moe.experts.7.w3.weight": "model-00004-of-00008.safetensors",
"model.layers.26.reasoning_moe.gate.weight": "model-00004-of-00008.safetensors",
"model.layers.26.content_moe.gate.weight": "model-00004-of-00008.safetensors",
"model.layers.26.input_reasoning_layernorm.bias": "model-00004-of-00008.safetensors",
"model.layers.26.input_content_layernorm.bias": "model-00004-of-00008.safetensors",
"model.layers.26.input_reasoning_layernorm.weight": "model-00004-of-00008.safetensors",
"model.layers.26.input_content_layernorm.weight": "model-00004-of-00008.safetensors",
"model.layers.26.post_attention_reasoning_layernorm.bias": "model-00004-of-00008.safetensors",
"model.layers.26.post_attention_content_layernorm.bias": "model-00004-of-00008.safetensors",
"model.layers.26.post_attention_reasoning_layernorm.weight": "model-00004-of-00008.safetensors",
"model.layers.26.post_attention_content_layernorm.weight": "model-00004-of-00008.safetensors",
"model.layers.26.reasoning_self_attn.k_proj.bias": "model-00004-of-00008.safetensors",
"model.layers.26.content_self_attn.k_proj.bias": "model-00004-of-00008.safetensors",
"model.layers.26.reasoning_self_attn.k_proj.weight": "model-00004-of-00008.safetensors",
"model.layers.26.content_self_attn.k_proj.weight": "model-00004-of-00008.safetensors",
"model.layers.26.reasoning_self_attn.o_proj.bias": "model-00004-of-00008.safetensors",
"model.layers.26.content_self_attn.o_proj.bias": "model-00004-of-00008.safetensors",
"model.layers.26.reasoning_self_attn.o_proj.weight": "model-00004-of-00008.safetensors",
"model.layers.26.content_self_attn.o_proj.weight": "model-00004-of-00008.safetensors",
"model.layers.26.reasoning_self_attn.q_proj.bias": "model-00004-of-00008.safetensors",
"model.layers.26.content_self_attn.q_proj.bias": "model-00004-of-00008.safetensors",
"model.layers.26.reasoning_self_attn.q_proj.weight": "model-00004-of-00008.safetensors",
"model.layers.26.content_self_attn.q_proj.weight": "model-00004-of-00008.safetensors",
"model.layers.26.reasoning_self_attn.v_proj.bias": "model-00004-of-00008.safetensors",
"model.layers.26.content_self_attn.v_proj.bias": "model-00004-of-00008.safetensors",
"model.layers.26.reasoning_self_attn.v_proj.weight": "model-00004-of-00008.safetensors",
"model.layers.26.content_self_attn.v_proj.weight": "model-00004-of-00008.safetensors",
"model.layers.27.reasoning_moe.experts.0.w1.weight": "model-00004-of-00008.safetensors",
"model.layers.27.content_moe.experts.0.w1.weight": "model-00004-of-00008.safetensors",
"model.layers.27.reasoning_moe.experts.0.w2.weight": "model-00004-of-00008.safetensors",
"model.layers.27.content_moe.experts.0.w2.weight": "model-00004-of-00008.safetensors",
"model.layers.27.reasoning_moe.experts.0.w3.weight": "model-00004-of-00008.safetensors",
"model.layers.27.content_moe.experts.0.w3.weight": "model-00004-of-00008.safetensors",
"model.layers.27.reasoning_moe.experts.1.w1.weight": "model-00004-of-00008.safetensors",
"model.layers.27.content_moe.experts.1.w1.weight": "model-00004-of-00008.safetensors",
"model.layers.27.reasoning_moe.experts.1.w2.weight": "model-00004-of-00008.safetensors",
"model.layers.27.content_moe.experts.1.w2.weight": "model-00005-of-00008.safetensors",
"model.layers.27.reasoning_moe.experts.1.w3.weight": "model-00005-of-00008.safetensors",
"model.layers.27.content_moe.experts.1.w3.weight": "model-00005-of-00008.safetensors",
"model.layers.27.reasoning_moe.experts.2.w1.weight": "model-00005-of-00008.safetensors",
"model.layers.27.content_moe.experts.2.w1.weight": "model-00005-of-00008.safetensors",
"model.layers.27.reasoning_moe.experts.2.w2.weight": "model-00005-of-00008.safetensors",
"model.layers.27.content_moe.experts.2.w2.weight": "model-00005-of-00008.safetensors",
"model.layers.27.reasoning_moe.experts.2.w3.weight": "model-00005-of-00008.safetensors",
"model.layers.27.content_moe.experts.2.w3.weight": "model-00005-of-00008.safetensors",
"model.layers.27.reasoning_moe.experts.3.w1.weight": "model-00005-of-00008.safetensors",
"model.layers.27.content_moe.experts.3.w1.weight": "model-00005-of-00008.safetensors",
"model.layers.27.reasoning_moe.experts.3.w2.weight": "model-00005-of-00008.safetensors",
"model.layers.27.content_moe.experts.3.w2.weight": "model-00005-of-00008.safetensors",
"model.layers.27.reasoning_moe.experts.3.w3.weight": "model-00005-of-00008.safetensors",
"model.layers.27.content_moe.experts.3.w3.weight": "model-00005-of-00008.safetensors",
"model.layers.27.reasoning_moe.experts.4.w1.weight": "model-00005-of-00008.safetensors",
"model.layers.27.content_moe.experts.4.w1.weight": "model-00005-of-00008.safetensors",
"model.layers.27.reasoning_moe.experts.4.w2.weight": "model-00005-of-00008.safetensors",
"model.layers.27.content_moe.experts.4.w2.weight": "model-00005-of-00008.safetensors",
"model.layers.27.reasoning_moe.experts.4.w3.weight": "model-00005-of-00008.safetensors",
"model.layers.27.content_moe.experts.4.w3.weight": "model-00005-of-00008.safetensors",
"model.layers.27.reasoning_moe.experts.5.w1.weight": "model-00005-of-00008.safetensors",
"model.layers.27.content_moe.experts.5.w1.weight": "model-00005-of-00008.safetensors",
"model.layers.27.reasoning_moe.experts.5.w2.weight": "model-00005-of-00008.safetensors",
"model.layers.27.content_moe.experts.5.w2.weight": "model-00005-of-00008.safetensors",
"model.layers.27.reasoning_moe.experts.5.w3.weight": "model-00005-of-00008.safetensors",
"model.layers.27.content_moe.experts.5.w3.weight": "model-00005-of-00008.safetensors",
"model.layers.27.reasoning_moe.experts.6.w1.weight": "model-00005-of-00008.safetensors",
"model.layers.27.content_moe.experts.6.w1.weight": "model-00005-of-00008.safetensors",
"model.layers.27.reasoning_moe.experts.6.w2.weight": "model-00005-of-00008.safetensors",
"model.layers.27.content_moe.experts.6.w2.weight": "model-00005-of-00008.safetensors",
"model.layers.27.reasoning_moe.experts.6.w3.weight": "model-00005-of-00008.safetensors",
"model.layers.27.content_moe.experts.6.w3.weight": "model-00005-of-00008.safetensors",
"model.layers.27.reasoning_moe.experts.7.w1.weight": "model-00005-of-00008.safetensors",
"model.layers.27.content_moe.experts.7.w1.weight": "model-00005-of-00008.safetensors",
"model.layers.27.reasoning_moe.experts.7.w2.weight": "model-00005-of-00008.safetensors",
"model.layers.27.content_moe.experts.7.w2.weight": "model-00005-of-00008.safetensors",
"model.layers.27.reasoning_moe.experts.7.w3.weight": "model-00005-of-00008.safetensors",
"model.layers.27.content_moe.experts.7.w3.weight": "model-00005-of-00008.safetensors",
"model.layers.27.reasoning_moe.gate.weight": "model-00005-of-00008.safetensors",
"model.layers.27.content_moe.gate.weight": "model-00005-of-00008.safetensors",
"model.layers.27.input_reasoning_layernorm.bias": "model-00005-of-00008.safetensors",
"model.layers.27.input_content_layernorm.bias": "model-00005-of-00008.safetensors",
"model.layers.27.input_reasoning_layernorm.weight": "model-00005-of-00008.safetensors",
"model.layers.27.input_content_layernorm.weight": "model-00005-of-00008.safetensors",
"model.layers.27.post_attention_reasoning_layernorm.bias": "model-00005-of-00008.safetensors",
"model.layers.27.post_attention_content_layernorm.bias": "model-00005-of-00008.safetensors",
"model.layers.27.post_attention_reasoning_layernorm.weight": "model-00005-of-00008.safetensors",
"model.layers.27.post_attention_content_layernorm.weight": "model-00005-of-00008.safetensors",
"model.layers.27.reasoning_self_attn.k_proj.bias": "model-00005-of-00008.safetensors",
"model.layers.27.content_self_attn.k_proj.bias": "model-00005-of-00008.safetensors",
"model.layers.27.reasoning_self_attn.k_proj.weight": "model-00005-of-00008.safetensors",
"model.layers.27.content_self_attn.k_proj.weight": "model-00005-of-00008.safetensors",
"model.layers.27.reasoning_self_attn.o_proj.bias": "model-00005-of-00008.safetensors",
"model.layers.27.content_self_attn.o_proj.bias": "model-00005-of-00008.safetensors",
"model.layers.27.reasoning_self_attn.o_proj.weight": "model-00005-of-00008.safetensors",
"model.layers.27.content_self_attn.o_proj.weight": "model-00005-of-00008.safetensors",
"model.layers.27.reasoning_self_attn.q_proj.bias": "model-00005-of-00008.safetensors",
"model.layers.27.content_self_attn.q_proj.bias": "model-00005-of-00008.safetensors",
"model.layers.27.reasoning_self_attn.q_proj.weight": "model-00005-of-00008.safetensors",
"model.layers.27.content_self_attn.q_proj.weight": "model-00005-of-00008.safetensors",
"model.layers.27.reasoning_self_attn.v_proj.bias": "model-00005-of-00008.safetensors",
"model.layers.27.content_self_attn.v_proj.bias": "model-00005-of-00008.safetensors",
"model.layers.27.reasoning_self_attn.v_proj.weight": "model-00005-of-00008.safetensors",
"model.layers.27.content_self_attn.v_proj.weight": "model-00005-of-00008.safetensors",
"model.layers.28.reasoning_moe.experts.0.w1.weight": "model-00005-of-00008.safetensors",
"model.layers.28.content_moe.experts.0.w1.weight": "model-00005-of-00008.safetensors",
"model.layers.28.reasoning_moe.experts.0.w2.weight": "model-00005-of-00008.safetensors",
"model.layers.28.content_moe.experts.0.w2.weight": "model-00005-of-00008.safetensors",
"model.layers.28.reasoning_moe.experts.0.w3.weight": "model-00005-of-00008.safetensors",
"model.layers.28.content_moe.experts.0.w3.weight": "model-00005-of-00008.safetensors",
"model.layers.28.reasoning_moe.experts.1.w1.weight": "model-00005-of-00008.safetensors",
"model.layers.28.content_moe.experts.1.w1.weight": "model-00005-of-00008.safetensors",
"model.layers.28.reasoning_moe.experts.1.w2.weight": "model-00005-of-00008.safetensors",
"model.layers.28.content_moe.experts.1.w2.weight": "model-00005-of-00008.safetensors",
"model.layers.28.reasoning_moe.experts.1.w3.weight": "model-00005-of-00008.safetensors",
"model.layers.28.content_moe.experts.1.w3.weight": "model-00005-of-00008.safetensors",
"model.layers.28.reasoning_moe.experts.2.w1.weight": "model-00005-of-00008.safetensors",
"model.layers.28.content_moe.experts.2.w1.weight": "model-00005-of-00008.safetensors",
"model.layers.28.reasoning_moe.experts.2.w2.weight": "model-00005-of-00008.safetensors",
"model.layers.28.content_moe.experts.2.w2.weight": "model-00005-of-00008.safetensors",
"model.layers.28.reasoning_moe.experts.2.w3.weight": "model-00005-of-00008.safetensors",
"model.layers.28.content_moe.experts.2.w3.weight": "model-00005-of-00008.safetensors",
"model.layers.28.reasoning_moe.experts.3.w1.weight": "model-00005-of-00008.safetensors",
"model.layers.28.content_moe.experts.3.w1.weight": "model-00005-of-00008.safetensors",
"model.layers.28.reasoning_moe.experts.3.w2.weight": "model-00005-of-00008.safetensors",
"model.layers.28.content_moe.experts.3.w2.weight": "model-00005-of-00008.safetensors",
"model.layers.28.reasoning_moe.experts.3.w3.weight": "model-00005-of-00008.safetensors",
"model.layers.28.content_moe.experts.3.w3.weight": "model-00005-of-00008.safetensors",
"model.layers.28.reasoning_moe.experts.4.w1.weight": "model-00005-of-00008.safetensors",
"model.layers.28.content_moe.experts.4.w1.weight": "model-00005-of-00008.safetensors",
"model.layers.28.reasoning_moe.experts.4.w2.weight": "model-00005-of-00008.safetensors",
"model.layers.28.content_moe.experts.4.w2.weight": "model-00005-of-00008.safetensors",
"model.layers.28.reasoning_moe.experts.4.w3.weight": "model-00005-of-00008.safetensors",
"model.layers.28.content_moe.experts.4.w3.weight": "model-00005-of-00008.safetensors",
"model.layers.28.reasoning_moe.experts.5.w1.weight": "model-00005-of-00008.safetensors",
"model.layers.28.content_moe.experts.5.w1.weight": "model-00005-of-00008.safetensors",
"model.layers.28.reasoning_moe.experts.5.w2.weight": "model-00005-of-00008.safetensors",
"model.layers.28.content_moe.experts.5.w2.weight": "model-00005-of-00008.safetensors",
"model.layers.28.reasoning_moe.experts.5.w3.weight": "model-00005-of-00008.safetensors",
"model.layers.28.content_moe.experts.5.w3.weight": "model-00005-of-00008.safetensors",
"model.layers.28.reasoning_moe.experts.6.w1.weight": "model-00005-of-00008.safetensors",
"model.layers.28.content_moe.experts.6.w1.weight": "model-00005-of-00008.safetensors",
"model.layers.28.reasoning_moe.experts.6.w2.weight": "model-00005-of-00008.safetensors",
"model.layers.28.content_moe.experts.6.w2.weight": "model-00005-of-00008.safetensors",
"model.layers.28.reasoning_moe.experts.6.w3.weight": "model-00005-of-00008.safetensors",
"model.layers.28.content_moe.experts.6.w3.weight": "model-00005-of-00008.safetensors",
"model.layers.28.reasoning_moe.experts.7.w1.weight": "model-00005-of-00008.safetensors",
"model.layers.28.content_moe.experts.7.w1.weight": "model-00005-of-00008.safetensors",
"model.layers.28.reasoning_moe.experts.7.w2.weight": "model-00005-of-00008.safetensors",
"model.layers.28.content_moe.experts.7.w2.weight": "model-00005-of-00008.safetensors",
"model.layers.28.reasoning_moe.experts.7.w3.weight": "model-00005-of-00008.safetensors",
"model.layers.28.content_moe.experts.7.w3.weight": "model-00005-of-00008.safetensors",
"model.layers.28.reasoning_moe.gate.weight": "model-00005-of-00008.safetensors",
"model.layers.28.content_moe.gate.weight": "model-00005-of-00008.safetensors",
"model.layers.28.input_reasoning_layernorm.bias": "model-00005-of-00008.safetensors",
"model.layers.28.input_content_layernorm.bias": "model-00005-of-00008.safetensors",
"model.layers.28.input_reasoning_layernorm.weight": "model-00005-of-00008.safetensors",
"model.layers.28.input_content_layernorm.weight": "model-00005-of-00008.safetensors",
"model.layers.28.post_attention_reasoning_layernorm.bias": "model-00005-of-00008.safetensors",
"model.layers.28.post_attention_content_layernorm.bias": "model-00005-of-00008.safetensors",
"model.layers.28.post_attention_reasoning_layernorm.weight": "model-00005-of-00008.safetensors",
"model.layers.28.post_attention_content_layernorm.weight": "model-00005-of-00008.safetensors",
"model.layers.28.reasoning_self_attn.k_proj.bias": "model-00005-of-00008.safetensors",
"model.layers.28.content_self_attn.k_proj.bias": "model-00005-of-00008.safetensors",
"model.layers.28.reasoning_self_attn.k_proj.weight": "model-00005-of-00008.safetensors",
"model.layers.28.content_self_attn.k_proj.weight": "model-00005-of-00008.safetensors",
"model.layers.28.reasoning_self_attn.o_proj.bias": "model-00005-of-00008.safetensors",
"model.layers.28.content_self_attn.o_proj.bias": "model-00005-of-00008.safetensors",
"model.layers.28.reasoning_self_attn.o_proj.weight": "model-00005-of-00008.safetensors",
"model.layers.28.content_self_attn.o_proj.weight": "model-00005-of-00008.safetensors",
"model.layers.28.reasoning_self_attn.q_proj.bias": "model-00005-of-00008.safetensors",
"model.layers.28.content_self_attn.q_proj.bias": "model-00005-of-00008.safetensors",
"model.layers.28.reasoning_self_attn.q_proj.weight": "model-00005-of-00008.safetensors",
"model.layers.28.content_self_attn.q_proj.weight": "model-00005-of-00008.safetensors",
"model.layers.28.reasoning_self_attn.v_proj.bias": "model-00005-of-00008.safetensors",
"model.layers.28.content_self_attn.v_proj.bias": "model-00005-of-00008.safetensors",
"model.layers.28.reasoning_self_attn.v_proj.weight": "model-00005-of-00008.safetensors",
"model.layers.28.content_self_attn.v_proj.weight": "model-00005-of-00008.safetensors",
"model.layers.29.reasoning_moe.experts.0.w1.weight": "model-00005-of-00008.safetensors",
"model.layers.29.content_moe.experts.0.w1.weight": "model-00005-of-00008.safetensors",
"model.layers.29.reasoning_moe.experts.0.w2.weight": "model-00005-of-00008.safetensors",
"model.layers.29.content_moe.experts.0.w2.weight": "model-00005-of-00008.safetensors",
"model.layers.29.reasoning_moe.experts.0.w3.weight": "model-00005-of-00008.safetensors",
"model.layers.29.content_moe.experts.0.w3.weight": "model-00005-of-00008.safetensors",
"model.layers.29.reasoning_moe.experts.1.w1.weight": "model-00005-of-00008.safetensors",
"model.layers.29.content_moe.experts.1.w1.weight": "model-00005-of-00008.safetensors",
"model.layers.29.reasoning_moe.experts.1.w2.weight": "model-00005-of-00008.safetensors",
"model.layers.29.content_moe.experts.1.w2.weight": "model-00005-of-00008.safetensors",
"model.layers.29.reasoning_moe.experts.1.w3.weight": "model-00005-of-00008.safetensors",
"model.layers.29.content_moe.experts.1.w3.weight": "model-00005-of-00008.safetensors",
"model.layers.29.reasoning_moe.experts.2.w1.weight": "model-00005-of-00008.safetensors",
"model.layers.29.content_moe.experts.2.w1.weight": "model-00005-of-00008.safetensors",
"model.layers.29.reasoning_moe.experts.2.w2.weight": "model-00005-of-00008.safetensors",
"model.layers.29.content_moe.experts.2.w2.weight": "model-00005-of-00008.safetensors",
"model.layers.29.reasoning_moe.experts.2.w3.weight": "model-00005-of-00008.safetensors",
"model.layers.29.content_moe.experts.2.w3.weight": "model-00005-of-00008.safetensors",
"model.layers.29.reasoning_moe.experts.3.w1.weight": "model-00005-of-00008.safetensors",
"model.layers.29.content_moe.experts.3.w1.weight": "model-00005-of-00008.safetensors",
"model.layers.29.reasoning_moe.experts.3.w2.weight": "model-00005-of-00008.safetensors",
"model.layers.29.content_moe.experts.3.w2.weight": "model-00005-of-00008.safetensors",
"model.layers.29.reasoning_moe.experts.3.w3.weight": "model-00005-of-00008.safetensors",
"model.layers.29.content_moe.experts.3.w3.weight": "model-00005-of-00008.safetensors",
"model.layers.29.reasoning_moe.experts.4.w1.weight": "model-00005-of-00008.safetensors",
"model.layers.29.content_moe.experts.4.w1.weight": "model-00005-of-00008.safetensors",
"model.layers.29.reasoning_moe.experts.4.w2.weight": "model-00005-of-00008.safetensors",
"model.layers.29.content_moe.experts.4.w2.weight": "model-00005-of-00008.safetensors",
"model.layers.29.reasoning_moe.experts.4.w3.weight": "model-00005-of-00008.safetensors",
"model.layers.29.content_moe.experts.4.w3.weight": "model-00005-of-00008.safetensors",
"model.layers.29.reasoning_moe.experts.5.w1.weight": "model-00005-of-00008.safetensors",
"model.layers.29.content_moe.experts.5.w1.weight": "model-00005-of-00008.safetensors",
"model.layers.29.reasoning_moe.experts.5.w2.weight": "model-00005-of-00008.safetensors",
"model.layers.29.content_moe.experts.5.w2.weight": "model-00005-of-00008.safetensors",
"model.layers.29.reasoning_moe.experts.5.w3.weight": "model-00005-of-00008.safetensors",
"model.layers.29.content_moe.experts.5.w3.weight": "model-00005-of-00008.safetensors",
"model.layers.29.reasoning_moe.experts.6.w1.weight": "model-00005-of-00008.safetensors",
"model.layers.29.content_moe.experts.6.w1.weight": "model-00005-of-00008.safetensors",
"model.layers.29.reasoning_moe.experts.6.w2.weight": "model-00005-of-00008.safetensors",
"model.layers.29.content_moe.experts.6.w2.weight": "model-00005-of-00008.safetensors",
"model.layers.29.reasoning_moe.experts.6.w3.weight": "model-00005-of-00008.safetensors",
"model.layers.29.content_moe.experts.6.w3.weight": "model-00005-of-00008.safetensors",
"model.layers.29.reasoning_moe.experts.7.w1.weight": "model-00005-of-00008.safetensors",
"model.layers.29.content_moe.experts.7.w1.weight": "model-00005-of-00008.safetensors",
"model.layers.29.reasoning_moe.experts.7.w2.weight": "model-00005-of-00008.safetensors",
"model.layers.29.content_moe.experts.7.w2.weight": "model-00005-of-00008.safetensors",
"model.layers.29.reasoning_moe.experts.7.w3.weight": "model-00005-of-00008.safetensors",
"model.layers.29.content_moe.experts.7.w3.weight": "model-00005-of-00008.safetensors",
"model.layers.29.reasoning_moe.gate.weight": "model-00005-of-00008.safetensors",
"model.layers.29.content_moe.gate.weight": "model-00005-of-00008.safetensors",
"model.layers.29.input_reasoning_layernorm.bias": "model-00005-of-00008.safetensors",
"model.layers.29.input_content_layernorm.bias": "model-00005-of-00008.safetensors",
"model.layers.29.input_reasoning_layernorm.weight": "model-00005-of-00008.safetensors",
"model.layers.29.input_content_layernorm.weight": "model-00005-of-00008.safetensors",
"model.layers.29.post_attention_reasoning_layernorm.bias": "model-00005-of-00008.safetensors",
"model.layers.29.post_attention_content_layernorm.bias": "model-00005-of-00008.safetensors",
"model.layers.29.post_attention_reasoning_layernorm.weight": "model-00005-of-00008.safetensors",
"model.layers.29.post_attention_content_layernorm.weight": "model-00005-of-00008.safetensors",
"model.layers.29.reasoning_self_attn.k_proj.bias": "model-00005-of-00008.safetensors",
"model.layers.29.content_self_attn.k_proj.bias": "model-00005-of-00008.safetensors",
"model.layers.29.reasoning_self_attn.k_proj.weight": "model-00005-of-00008.safetensors",
"model.layers.29.content_self_attn.k_proj.weight": "model-00005-of-00008.safetensors",
"model.layers.29.reasoning_self_attn.o_proj.bias": "model-00005-of-00008.safetensors",
"model.layers.29.content_self_attn.o_proj.bias": "model-00005-of-00008.safetensors",
"model.layers.29.reasoning_self_attn.o_proj.weight": "model-00005-of-00008.safetensors",
"model.layers.29.content_self_attn.o_proj.weight": "model-00005-of-00008.safetensors",
"model.layers.29.reasoning_self_attn.q_proj.bias": "model-00005-of-00008.safetensors",
"model.layers.29.content_self_attn.q_proj.bias": "model-00005-of-00008.safetensors",
"model.layers.29.reasoning_self_attn.q_proj.weight": "model-00005-of-00008.safetensors",
"model.layers.29.content_self_attn.q_proj.weight": "model-00005-of-00008.safetensors",
"model.layers.29.reasoning_self_attn.v_proj.bias": "model-00005-of-00008.safetensors",
"model.layers.29.content_self_attn.v_proj.bias": "model-00005-of-00008.safetensors",
"model.layers.29.reasoning_self_attn.v_proj.weight": "model-00005-of-00008.safetensors",
"model.layers.29.content_self_attn.v_proj.weight": "model-00005-of-00008.safetensors",
"model.layers.3.reasoning_moe.experts.0.w1.weight": "model-00005-of-00008.safetensors",
"model.layers.3.content_moe.experts.0.w1.weight": "model-00005-of-00008.safetensors",
"model.layers.3.reasoning_moe.experts.0.w2.weight": "model-00005-of-00008.safetensors",
"model.layers.3.content_moe.experts.0.w2.weight": "model-00005-of-00008.safetensors",
"model.layers.3.reasoning_moe.experts.0.w3.weight": "model-00005-of-00008.safetensors",
"model.layers.3.content_moe.experts.0.w3.weight": "model-00005-of-00008.safetensors",
"model.layers.3.reasoning_moe.experts.1.w1.weight": "model-00005-of-00008.safetensors",
"model.layers.3.content_moe.experts.1.w1.weight": "model-00005-of-00008.safetensors",
"model.layers.3.reasoning_moe.experts.1.w2.weight": "model-00005-of-00008.safetensors",
"model.layers.3.content_moe.experts.1.w2.weight": "model-00005-of-00008.safetensors",
"model.layers.3.reasoning_moe.experts.1.w3.weight": "model-00005-of-00008.safetensors",
"model.layers.3.content_moe.experts.1.w3.weight": "model-00005-of-00008.safetensors",
"model.layers.3.reasoning_moe.experts.2.w1.weight": "model-00005-of-00008.safetensors",
"model.layers.3.content_moe.experts.2.w1.weight": "model-00005-of-00008.safetensors",
"model.layers.3.reasoning_moe.experts.2.w2.weight": "model-00005-of-00008.safetensors",
"model.layers.3.content_moe.experts.2.w2.weight": "model-00005-of-00008.safetensors",
"model.layers.3.reasoning_moe.experts.2.w3.weight": "model-00005-of-00008.safetensors",
"model.layers.3.content_moe.experts.2.w3.weight": "model-00005-of-00008.safetensors",
"model.layers.3.reasoning_moe.experts.3.w1.weight": "model-00005-of-00008.safetensors",
"model.layers.3.content_moe.experts.3.w1.weight": "model-00005-of-00008.safetensors",
"model.layers.3.reasoning_moe.experts.3.w2.weight": "model-00005-of-00008.safetensors",
"model.layers.3.content_moe.experts.3.w2.weight": "model-00005-of-00008.safetensors",
"model.layers.3.reasoning_moe.experts.3.w3.weight": "model-00005-of-00008.safetensors",
"model.layers.3.content_moe.experts.3.w3.weight": "model-00005-of-00008.safetensors",
"model.layers.3.reasoning_moe.experts.4.w1.weight": "model-00005-of-00008.safetensors",
"model.layers.3.content_moe.experts.4.w1.weight": "model-00005-of-00008.safetensors",
"model.layers.3.reasoning_moe.experts.4.w2.weight": "model-00005-of-00008.safetensors",
"model.layers.3.content_moe.experts.4.w2.weight": "model-00005-of-00008.safetensors",
"model.layers.3.reasoning_moe.experts.4.w3.weight": "model-00005-of-00008.safetensors",
"model.layers.3.content_moe.experts.4.w3.weight": "model-00005-of-00008.safetensors",
"model.layers.3.reasoning_moe.experts.5.w1.weight": "model-00005-of-00008.safetensors",
"model.layers.3.content_moe.experts.5.w1.weight": "model-00005-of-00008.safetensors",
"model.layers.3.reasoning_moe.experts.5.w2.weight": "model-00005-of-00008.safetensors",
"model.layers.3.content_moe.experts.5.w2.weight": "model-00005-of-00008.safetensors",
"model.layers.3.reasoning_moe.experts.5.w3.weight": "model-00005-of-00008.safetensors",
"model.layers.3.content_moe.experts.5.w3.weight": "model-00005-of-00008.safetensors",
"model.layers.3.reasoning_moe.experts.6.w1.weight": "model-00005-of-00008.safetensors",
"model.layers.3.content_moe.experts.6.w1.weight": "model-00005-of-00008.safetensors",
"model.layers.3.reasoning_moe.experts.6.w2.weight": "model-00005-of-00008.safetensors",
"model.layers.3.content_moe.experts.6.w2.weight": "model-00005-of-00008.safetensors",
"model.layers.3.reasoning_moe.experts.6.w3.weight": "model-00005-of-00008.safetensors",
"model.layers.3.content_moe.experts.6.w3.weight": "model-00005-of-00008.safetensors",
"model.layers.3.reasoning_moe.experts.7.w1.weight": "model-00005-of-00008.safetensors",
"model.layers.3.content_moe.experts.7.w1.weight": "model-00005-of-00008.safetensors",
"model.layers.3.reasoning_moe.experts.7.w2.weight": "model-00005-of-00008.safetensors",
"model.layers.3.content_moe.experts.7.w2.weight": "model-00005-of-00008.safetensors",
"model.layers.3.reasoning_moe.experts.7.w3.weight": "model-00005-of-00008.safetensors",
"model.layers.3.content_moe.experts.7.w3.weight": "model-00005-of-00008.safetensors",
"model.layers.3.reasoning_moe.gate.weight": "model-00005-of-00008.safetensors",
"model.layers.3.content_moe.gate.weight": "model-00005-of-00008.safetensors",
"model.layers.3.input_reasoning_layernorm.bias": "model-00005-of-00008.safetensors",
"model.layers.3.input_content_layernorm.bias": "model-00005-of-00008.safetensors",
"model.layers.3.input_reasoning_layernorm.weight": "model-00005-of-00008.safetensors",
"model.layers.3.input_content_layernorm.weight": "model-00005-of-00008.safetensors",
"model.layers.3.post_attention_reasoning_layernorm.bias": "model-00005-of-00008.safetensors",
"model.layers.3.post_attention_content_layernorm.bias": "model-00005-of-00008.safetensors",
"model.layers.3.post_attention_reasoning_layernorm.weight": "model-00005-of-00008.safetensors",
"model.layers.3.post_attention_content_layernorm.weight": "model-00005-of-00008.safetensors",
"model.layers.3.reasoning_self_attn.k_proj.bias": "model-00005-of-00008.safetensors",
"model.layers.3.content_self_attn.k_proj.bias": "model-00005-of-00008.safetensors",
"model.layers.3.reasoning_self_attn.k_proj.weight": "model-00005-of-00008.safetensors",
"model.layers.3.content_self_attn.k_proj.weight": "model-00005-of-00008.safetensors",
"model.layers.3.reasoning_self_attn.o_proj.bias": "model-00005-of-00008.safetensors",
"model.layers.3.content_self_attn.o_proj.bias": "model-00005-of-00008.safetensors",
"model.layers.3.reasoning_self_attn.o_proj.weight": "model-00005-of-00008.safetensors",
"model.layers.3.content_self_attn.o_proj.weight": "model-00005-of-00008.safetensors",
"model.layers.3.reasoning_self_attn.q_proj.bias": "model-00005-of-00008.safetensors",
"model.layers.3.content_self_attn.q_proj.bias": "model-00005-of-00008.safetensors",
"model.layers.3.reasoning_self_attn.q_proj.weight": "model-00005-of-00008.safetensors",
"model.layers.3.content_self_attn.q_proj.weight": "model-00005-of-00008.safetensors",
"model.layers.3.reasoning_self_attn.v_proj.bias": "model-00005-of-00008.safetensors",
"model.layers.3.content_self_attn.v_proj.bias": "model-00005-of-00008.safetensors",
"model.layers.3.reasoning_self_attn.v_proj.weight": "model-00005-of-00008.safetensors",
"model.layers.3.content_self_attn.v_proj.weight": "model-00005-of-00008.safetensors",
"model.layers.30.reasoning_moe.experts.0.w1.weight": "model-00005-of-00008.safetensors",
"model.layers.30.content_moe.experts.0.w1.weight": "model-00005-of-00008.safetensors",
"model.layers.30.reasoning_moe.experts.0.w2.weight": "model-00005-of-00008.safetensors",
"model.layers.30.content_moe.experts.0.w2.weight": "model-00005-of-00008.safetensors",
"model.layers.30.reasoning_moe.experts.0.w3.weight": "model-00005-of-00008.safetensors",
"model.layers.30.content_moe.experts.0.w3.weight": "model-00005-of-00008.safetensors",
"model.layers.30.reasoning_moe.experts.1.w1.weight": "model-00005-of-00008.safetensors",
"model.layers.30.content_moe.experts.1.w1.weight": "model-00005-of-00008.safetensors",
"model.layers.30.reasoning_moe.experts.1.w2.weight": "model-00005-of-00008.safetensors",
"model.layers.30.content_moe.experts.1.w2.weight": "model-00005-of-00008.safetensors",
"model.layers.30.reasoning_moe.experts.1.w3.weight": "model-00005-of-00008.safetensors",
"model.layers.30.content_moe.experts.1.w3.weight": "model-00005-of-00008.safetensors",
"model.layers.30.reasoning_moe.experts.2.w1.weight": "model-00005-of-00008.safetensors",
"model.layers.30.content_moe.experts.2.w1.weight": "model-00005-of-00008.safetensors",
"model.layers.30.reasoning_moe.experts.2.w2.weight": "model-00006-of-00008.safetensors",
"model.layers.30.content_moe.experts.2.w2.weight": "model-00006-of-00008.safetensors",
"model.layers.30.reasoning_moe.experts.2.w3.weight": "model-00006-of-00008.safetensors",
"model.layers.30.content_moe.experts.2.w3.weight": "model-00006-of-00008.safetensors",
"model.layers.30.reasoning_moe.experts.3.w1.weight": "model-00006-of-00008.safetensors",
"model.layers.30.content_moe.experts.3.w1.weight": "model-00006-of-00008.safetensors",
"model.layers.30.reasoning_moe.experts.3.w2.weight": "model-00006-of-00008.safetensors",
"model.layers.30.content_moe.experts.3.w2.weight": "model-00006-of-00008.safetensors",
"model.layers.30.reasoning_moe.experts.3.w3.weight": "model-00006-of-00008.safetensors",
"model.layers.30.content_moe.experts.3.w3.weight": "model-00006-of-00008.safetensors",
"model.layers.30.reasoning_moe.experts.4.w1.weight": "model-00006-of-00008.safetensors",
"model.layers.30.content_moe.experts.4.w1.weight": "model-00006-of-00008.safetensors",
"model.layers.30.reasoning_moe.experts.4.w2.weight": "model-00006-of-00008.safetensors",
"model.layers.30.content_moe.experts.4.w2.weight": "model-00006-of-00008.safetensors",
"model.layers.30.reasoning_moe.experts.4.w3.weight": "model-00006-of-00008.safetensors",
"model.layers.30.content_moe.experts.4.w3.weight": "model-00006-of-00008.safetensors",
"model.layers.30.reasoning_moe.experts.5.w1.weight": "model-00006-of-00008.safetensors",
"model.layers.30.content_moe.experts.5.w1.weight": "model-00006-of-00008.safetensors",
"model.layers.30.reasoning_moe.experts.5.w2.weight": "model-00006-of-00008.safetensors",
"model.layers.30.content_moe.experts.5.w2.weight": "model-00006-of-00008.safetensors",
"model.layers.30.reasoning_moe.experts.5.w3.weight": "model-00006-of-00008.safetensors",
"model.layers.30.content_moe.experts.5.w3.weight": "model-00006-of-00008.safetensors",
"model.layers.30.reasoning_moe.experts.6.w1.weight": "model-00006-of-00008.safetensors",
"model.layers.30.content_moe.experts.6.w1.weight": "model-00006-of-00008.safetensors",
"model.layers.30.reasoning_moe.experts.6.w2.weight": "model-00006-of-00008.safetensors",
"model.layers.30.content_moe.experts.6.w2.weight": "model-00006-of-00008.safetensors",
"model.layers.30.reasoning_moe.experts.6.w3.weight": "model-00006-of-00008.safetensors",
"model.layers.30.content_moe.experts.6.w3.weight": "model-00006-of-00008.safetensors",
"model.layers.30.reasoning_moe.experts.7.w1.weight": "model-00006-of-00008.safetensors",
"model.layers.30.content_moe.experts.7.w1.weight": "model-00006-of-00008.safetensors",
"model.layers.30.reasoning_moe.experts.7.w2.weight": "model-00006-of-00008.safetensors",
"model.layers.30.content_moe.experts.7.w2.weight": "model-00006-of-00008.safetensors",
"model.layers.30.reasoning_moe.experts.7.w3.weight": "model-00006-of-00008.safetensors",
"model.layers.30.content_moe.experts.7.w3.weight": "model-00006-of-00008.safetensors",
"model.layers.30.reasoning_moe.gate.weight": "model-00006-of-00008.safetensors",
"model.layers.30.content_moe.gate.weight": "model-00006-of-00008.safetensors",
"model.layers.30.input_reasoning_layernorm.bias": "model-00006-of-00008.safetensors",
"model.layers.30.input_content_layernorm.bias": "model-00006-of-00008.safetensors",
"model.layers.30.input_reasoning_layernorm.weight": "model-00006-of-00008.safetensors",
"model.layers.30.input_content_layernorm.weight": "model-00006-of-00008.safetensors",
"model.layers.30.post_attention_reasoning_layernorm.bias": "model-00006-of-00008.safetensors",
"model.layers.30.post_attention_content_layernorm.bias": "model-00006-of-00008.safetensors",
"model.layers.30.post_attention_reasoning_layernorm.weight": "model-00006-of-00008.safetensors",
"model.layers.30.post_attention_content_layernorm.weight": "model-00006-of-00008.safetensors",
"model.layers.30.reasoning_self_attn.k_proj.bias": "model-00006-of-00008.safetensors",
"model.layers.30.content_self_attn.k_proj.bias": "model-00006-of-00008.safetensors",
"model.layers.30.reasoning_self_attn.k_proj.weight": "model-00006-of-00008.safetensors",
"model.layers.30.content_self_attn.k_proj.weight": "model-00006-of-00008.safetensors",
"model.layers.30.reasoning_self_attn.o_proj.bias": "model-00006-of-00008.safetensors",
"model.layers.30.content_self_attn.o_proj.bias": "model-00006-of-00008.safetensors",
"model.layers.30.reasoning_self_attn.o_proj.weight": "model-00006-of-00008.safetensors",
"model.layers.30.content_self_attn.o_proj.weight": "model-00006-of-00008.safetensors",
"model.layers.30.reasoning_self_attn.q_proj.bias": "model-00006-of-00008.safetensors",
"model.layers.30.content_self_attn.q_proj.bias": "model-00006-of-00008.safetensors",
"model.layers.30.reasoning_self_attn.q_proj.weight": "model-00006-of-00008.safetensors",
"model.layers.30.content_self_attn.q_proj.weight": "model-00006-of-00008.safetensors",
"model.layers.30.reasoning_self_attn.v_proj.bias": "model-00006-of-00008.safetensors",
"model.layers.30.content_self_attn.v_proj.bias": "model-00006-of-00008.safetensors",
"model.layers.30.reasoning_self_attn.v_proj.weight": "model-00006-of-00008.safetensors",
"model.layers.30.content_self_attn.v_proj.weight": "model-00006-of-00008.safetensors",
"model.layers.31.reasoning_moe.experts.0.w1.weight": "model-00006-of-00008.safetensors",
"model.layers.31.content_moe.experts.0.w1.weight": "model-00006-of-00008.safetensors",
"model.layers.31.reasoning_moe.experts.0.w2.weight": "model-00006-of-00008.safetensors",
"model.layers.31.content_moe.experts.0.w2.weight": "model-00006-of-00008.safetensors",
"model.layers.31.reasoning_moe.experts.0.w3.weight": "model-00006-of-00008.safetensors",
"model.layers.31.content_moe.experts.0.w3.weight": "model-00006-of-00008.safetensors",
"model.layers.31.reasoning_moe.experts.1.w1.weight": "model-00006-of-00008.safetensors",
"model.layers.31.content_moe.experts.1.w1.weight": "model-00006-of-00008.safetensors",
"model.layers.31.reasoning_moe.experts.1.w2.weight": "model-00006-of-00008.safetensors",
"model.layers.31.content_moe.experts.1.w2.weight": "model-00006-of-00008.safetensors",
"model.layers.31.reasoning_moe.experts.1.w3.weight": "model-00006-of-00008.safetensors",
"model.layers.31.content_moe.experts.1.w3.weight": "model-00006-of-00008.safetensors",
"model.layers.31.reasoning_moe.experts.2.w1.weight": "model-00006-of-00008.safetensors",
"model.layers.31.content_moe.experts.2.w1.weight": "model-00006-of-00008.safetensors",
"model.layers.31.reasoning_moe.experts.2.w2.weight": "model-00006-of-00008.safetensors",
"model.layers.31.content_moe.experts.2.w2.weight": "model-00006-of-00008.safetensors",
"model.layers.31.reasoning_moe.experts.2.w3.weight": "model-00006-of-00008.safetensors",
"model.layers.31.content_moe.experts.2.w3.weight": "model-00006-of-00008.safetensors",
"model.layers.31.reasoning_moe.experts.3.w1.weight": "model-00006-of-00008.safetensors",
"model.layers.31.content_moe.experts.3.w1.weight": "model-00006-of-00008.safetensors",
"model.layers.31.reasoning_moe.experts.3.w2.weight": "model-00006-of-00008.safetensors",
"model.layers.31.content_moe.experts.3.w2.weight": "model-00006-of-00008.safetensors",
"model.layers.31.reasoning_moe.experts.3.w3.weight": "model-00006-of-00008.safetensors",
"model.layers.31.content_moe.experts.3.w3.weight": "model-00006-of-00008.safetensors",
"model.layers.31.reasoning_moe.experts.4.w1.weight": "model-00006-of-00008.safetensors",
"model.layers.31.content_moe.experts.4.w1.weight": "model-00006-of-00008.safetensors",
"model.layers.31.reasoning_moe.experts.4.w2.weight": "model-00006-of-00008.safetensors",
"model.layers.31.content_moe.experts.4.w2.weight": "model-00006-of-00008.safetensors",
"model.layers.31.reasoning_moe.experts.4.w3.weight": "model-00006-of-00008.safetensors",
"model.layers.31.content_moe.experts.4.w3.weight": "model-00006-of-00008.safetensors",
"model.layers.31.reasoning_moe.experts.5.w1.weight": "model-00006-of-00008.safetensors",
"model.layers.31.content_moe.experts.5.w1.weight": "model-00006-of-00008.safetensors",
"model.layers.31.reasoning_moe.experts.5.w2.weight": "model-00006-of-00008.safetensors",
"model.layers.31.content_moe.experts.5.w2.weight": "model-00006-of-00008.safetensors",
"model.layers.31.reasoning_moe.experts.5.w3.weight": "model-00006-of-00008.safetensors",
"model.layers.31.content_moe.experts.5.w3.weight": "model-00006-of-00008.safetensors",
"model.layers.31.reasoning_moe.experts.6.w1.weight": "model-00006-of-00008.safetensors",
"model.layers.31.content_moe.experts.6.w1.weight": "model-00006-of-00008.safetensors",
"model.layers.31.reasoning_moe.experts.6.w2.weight": "model-00006-of-00008.safetensors",
"model.layers.31.content_moe.experts.6.w2.weight": "model-00006-of-00008.safetensors",
"model.layers.31.reasoning_moe.experts.6.w3.weight": "model-00006-of-00008.safetensors",
"model.layers.31.content_moe.experts.6.w3.weight": "model-00006-of-00008.safetensors",
"model.layers.31.reasoning_moe.experts.7.w1.weight": "model-00006-of-00008.safetensors",
"model.layers.31.content_moe.experts.7.w1.weight": "model-00006-of-00008.safetensors",
"model.layers.31.reasoning_moe.experts.7.w2.weight": "model-00006-of-00008.safetensors",
"model.layers.31.content_moe.experts.7.w2.weight": "model-00006-of-00008.safetensors",
"model.layers.31.reasoning_moe.experts.7.w3.weight": "model-00006-of-00008.safetensors",
"model.layers.31.content_moe.experts.7.w3.weight": "model-00006-of-00008.safetensors",
"model.layers.31.reasoning_moe.gate.weight": "model-00006-of-00008.safetensors",
"model.layers.31.content_moe.gate.weight": "model-00006-of-00008.safetensors",
"model.layers.31.input_reasoning_layernorm.bias": "model-00006-of-00008.safetensors",
"model.layers.31.input_content_layernorm.bias": "model-00006-of-00008.safetensors",
"model.layers.31.input_reasoning_layernorm.weight": "model-00006-of-00008.safetensors",
"model.layers.31.input_content_layernorm.weight": "model-00006-of-00008.safetensors",
"model.layers.31.post_attention_reasoning_layernorm.bias": "model-00006-of-00008.safetensors",
"model.layers.31.post_attention_content_layernorm.bias": "model-00006-of-00008.safetensors",
"model.layers.31.post_attention_reasoning_layernorm.weight": "model-00006-of-00008.safetensors",
"model.layers.31.post_attention_content_layernorm.weight": "model-00006-of-00008.safetensors",
"model.layers.31.reasoning_self_attn.k_proj.bias": "model-00006-of-00008.safetensors",
"model.layers.31.content_self_attn.k_proj.bias": "model-00006-of-00008.safetensors",
"model.layers.31.reasoning_self_attn.k_proj.weight": "model-00006-of-00008.safetensors",
"model.layers.31.content_self_attn.k_proj.weight": "model-00006-of-00008.safetensors",
"model.layers.31.reasoning_self_attn.o_proj.bias": "model-00006-of-00008.safetensors",
"model.layers.31.content_self_attn.o_proj.bias": "model-00006-of-00008.safetensors",
"model.layers.31.reasoning_self_attn.o_proj.weight": "model-00006-of-00008.safetensors",
"model.layers.31.content_self_attn.o_proj.weight": "model-00006-of-00008.safetensors",
"model.layers.31.reasoning_self_attn.q_proj.bias": "model-00006-of-00008.safetensors",
"model.layers.31.content_self_attn.q_proj.bias": "model-00006-of-00008.safetensors",
"model.layers.31.reasoning_self_attn.q_proj.weight": "model-00006-of-00008.safetensors",
"model.layers.31.content_self_attn.q_proj.weight": "model-00006-of-00008.safetensors",
"model.layers.31.reasoning_self_attn.v_proj.bias": "model-00006-of-00008.safetensors",
"model.layers.31.content_self_attn.v_proj.bias": "model-00006-of-00008.safetensors",
"model.layers.31.reasoning_self_attn.v_proj.weight": "model-00006-of-00008.safetensors",
"model.layers.31.content_self_attn.v_proj.weight": "model-00006-of-00008.safetensors",
"model.layers.4.reasoning_moe.experts.0.w1.weight": "model-00006-of-00008.safetensors",
"model.layers.4.content_moe.experts.0.w1.weight": "model-00006-of-00008.safetensors",
"model.layers.4.reasoning_moe.experts.0.w2.weight": "model-00006-of-00008.safetensors",
"model.layers.4.content_moe.experts.0.w2.weight": "model-00006-of-00008.safetensors",
"model.layers.4.reasoning_moe.experts.0.w3.weight": "model-00006-of-00008.safetensors",
"model.layers.4.content_moe.experts.0.w3.weight": "model-00006-of-00008.safetensors",
"model.layers.4.reasoning_moe.experts.1.w1.weight": "model-00006-of-00008.safetensors",
"model.layers.4.content_moe.experts.1.w1.weight": "model-00006-of-00008.safetensors",
"model.layers.4.reasoning_moe.experts.1.w2.weight": "model-00006-of-00008.safetensors",
"model.layers.4.content_moe.experts.1.w2.weight": "model-00006-of-00008.safetensors",
"model.layers.4.reasoning_moe.experts.1.w3.weight": "model-00006-of-00008.safetensors",
"model.layers.4.content_moe.experts.1.w3.weight": "model-00006-of-00008.safetensors",
"model.layers.4.reasoning_moe.experts.2.w1.weight": "model-00006-of-00008.safetensors",
"model.layers.4.content_moe.experts.2.w1.weight": "model-00006-of-00008.safetensors",
"model.layers.4.reasoning_moe.experts.2.w2.weight": "model-00006-of-00008.safetensors",
"model.layers.4.content_moe.experts.2.w2.weight": "model-00006-of-00008.safetensors",
"model.layers.4.reasoning_moe.experts.2.w3.weight": "model-00006-of-00008.safetensors",
"model.layers.4.content_moe.experts.2.w3.weight": "model-00006-of-00008.safetensors",
"model.layers.4.reasoning_moe.experts.3.w1.weight": "model-00006-of-00008.safetensors",
"model.layers.4.content_moe.experts.3.w1.weight": "model-00006-of-00008.safetensors",
"model.layers.4.reasoning_moe.experts.3.w2.weight": "model-00006-of-00008.safetensors",
"model.layers.4.content_moe.experts.3.w2.weight": "model-00006-of-00008.safetensors",
"model.layers.4.reasoning_moe.experts.3.w3.weight": "model-00006-of-00008.safetensors",
"model.layers.4.content_moe.experts.3.w3.weight": "model-00006-of-00008.safetensors",
"model.layers.4.reasoning_moe.experts.4.w1.weight": "model-00006-of-00008.safetensors",
"model.layers.4.content_moe.experts.4.w1.weight": "model-00006-of-00008.safetensors",
"model.layers.4.reasoning_moe.experts.4.w2.weight": "model-00006-of-00008.safetensors",
"model.layers.4.content_moe.experts.4.w2.weight": "model-00006-of-00008.safetensors",
"model.layers.4.reasoning_moe.experts.4.w3.weight": "model-00006-of-00008.safetensors",
"model.layers.4.content_moe.experts.4.w3.weight": "model-00006-of-00008.safetensors",
"model.layers.4.reasoning_moe.experts.5.w1.weight": "model-00006-of-00008.safetensors",
"model.layers.4.content_moe.experts.5.w1.weight": "model-00006-of-00008.safetensors",
"model.layers.4.reasoning_moe.experts.5.w2.weight": "model-00006-of-00008.safetensors",
"model.layers.4.content_moe.experts.5.w2.weight": "model-00006-of-00008.safetensors",
"model.layers.4.reasoning_moe.experts.5.w3.weight": "model-00006-of-00008.safetensors",
"model.layers.4.content_moe.experts.5.w3.weight": "model-00006-of-00008.safetensors",
"model.layers.4.reasoning_moe.experts.6.w1.weight": "model-00006-of-00008.safetensors",
"model.layers.4.content_moe.experts.6.w1.weight": "model-00006-of-00008.safetensors",
"model.layers.4.reasoning_moe.experts.6.w2.weight": "model-00006-of-00008.safetensors",
"model.layers.4.content_moe.experts.6.w2.weight": "model-00006-of-00008.safetensors",
"model.layers.4.reasoning_moe.experts.6.w3.weight": "model-00006-of-00008.safetensors",
"model.layers.4.content_moe.experts.6.w3.weight": "model-00006-of-00008.safetensors",
"model.layers.4.reasoning_moe.experts.7.w1.weight": "model-00006-of-00008.safetensors",
"model.layers.4.content_moe.experts.7.w1.weight": "model-00006-of-00008.safetensors",
"model.layers.4.reasoning_moe.experts.7.w2.weight": "model-00006-of-00008.safetensors",
"model.layers.4.content_moe.experts.7.w2.weight": "model-00006-of-00008.safetensors",
"model.layers.4.reasoning_moe.experts.7.w3.weight": "model-00006-of-00008.safetensors",
"model.layers.4.content_moe.experts.7.w3.weight": "model-00006-of-00008.safetensors",
"model.layers.4.reasoning_moe.gate.weight": "model-00006-of-00008.safetensors",
"model.layers.4.content_moe.gate.weight": "model-00006-of-00008.safetensors",
"model.layers.4.input_reasoning_layernorm.bias": "model-00006-of-00008.safetensors",
"model.layers.4.input_content_layernorm.bias": "model-00006-of-00008.safetensors",
"model.layers.4.input_reasoning_layernorm.weight": "model-00006-of-00008.safetensors",
"model.layers.4.input_content_layernorm.weight": "model-00006-of-00008.safetensors",
"model.layers.4.post_attention_reasoning_layernorm.bias": "model-00006-of-00008.safetensors",
"model.layers.4.post_attention_content_layernorm.bias": "model-00006-of-00008.safetensors",
"model.layers.4.post_attention_reasoning_layernorm.weight": "model-00006-of-00008.safetensors",
"model.layers.4.post_attention_content_layernorm.weight": "model-00006-of-00008.safetensors",
"model.layers.4.reasoning_self_attn.k_proj.bias": "model-00006-of-00008.safetensors",
"model.layers.4.content_self_attn.k_proj.bias": "model-00006-of-00008.safetensors",
"model.layers.4.reasoning_self_attn.k_proj.weight": "model-00006-of-00008.safetensors",
"model.layers.4.content_self_attn.k_proj.weight": "model-00006-of-00008.safetensors",
"model.layers.4.reasoning_self_attn.o_proj.bias": "model-00006-of-00008.safetensors",
"model.layers.4.content_self_attn.o_proj.bias": "model-00006-of-00008.safetensors",
"model.layers.4.reasoning_self_attn.o_proj.weight": "model-00006-of-00008.safetensors",
"model.layers.4.content_self_attn.o_proj.weight": "model-00006-of-00008.safetensors",
"model.layers.4.reasoning_self_attn.q_proj.bias": "model-00006-of-00008.safetensors",
"model.layers.4.content_self_attn.q_proj.bias": "model-00006-of-00008.safetensors",
"model.layers.4.reasoning_self_attn.q_proj.weight": "model-00006-of-00008.safetensors",
"model.layers.4.content_self_attn.q_proj.weight": "model-00006-of-00008.safetensors",
"model.layers.4.reasoning_self_attn.v_proj.bias": "model-00006-of-00008.safetensors",
"model.layers.4.content_self_attn.v_proj.bias": "model-00006-of-00008.safetensors",
"model.layers.4.reasoning_self_attn.v_proj.weight": "model-00006-of-00008.safetensors",
"model.layers.4.content_self_attn.v_proj.weight": "model-00006-of-00008.safetensors",
"model.layers.5.reasoning_moe.experts.0.w1.weight": "model-00006-of-00008.safetensors",
"model.layers.5.content_moe.experts.0.w1.weight": "model-00006-of-00008.safetensors",
"model.layers.5.reasoning_moe.experts.0.w2.weight": "model-00006-of-00008.safetensors",
"model.layers.5.content_moe.experts.0.w2.weight": "model-00006-of-00008.safetensors",
"model.layers.5.reasoning_moe.experts.0.w3.weight": "model-00006-of-00008.safetensors",
"model.layers.5.content_moe.experts.0.w3.weight": "model-00006-of-00008.safetensors",
"model.layers.5.reasoning_moe.experts.1.w1.weight": "model-00006-of-00008.safetensors",
"model.layers.5.content_moe.experts.1.w1.weight": "model-00006-of-00008.safetensors",
"model.layers.5.reasoning_moe.experts.1.w2.weight": "model-00006-of-00008.safetensors",
"model.layers.5.content_moe.experts.1.w2.weight": "model-00006-of-00008.safetensors",
"model.layers.5.reasoning_moe.experts.1.w3.weight": "model-00006-of-00008.safetensors",
"model.layers.5.content_moe.experts.1.w3.weight": "model-00006-of-00008.safetensors",
"model.layers.5.reasoning_moe.experts.2.w1.weight": "model-00006-of-00008.safetensors",
"model.layers.5.content_moe.experts.2.w1.weight": "model-00006-of-00008.safetensors",
"model.layers.5.reasoning_moe.experts.2.w2.weight": "model-00006-of-00008.safetensors",
"model.layers.5.content_moe.experts.2.w2.weight": "model-00006-of-00008.safetensors",
"model.layers.5.reasoning_moe.experts.2.w3.weight": "model-00006-of-00008.safetensors",
"model.layers.5.content_moe.experts.2.w3.weight": "model-00006-of-00008.safetensors",
"model.layers.5.reasoning_moe.experts.3.w1.weight": "model-00006-of-00008.safetensors",
"model.layers.5.content_moe.experts.3.w1.weight": "model-00006-of-00008.safetensors",
"model.layers.5.reasoning_moe.experts.3.w2.weight": "model-00006-of-00008.safetensors",
"model.layers.5.content_moe.experts.3.w2.weight": "model-00006-of-00008.safetensors",
"model.layers.5.reasoning_moe.experts.3.w3.weight": "model-00006-of-00008.safetensors",
"model.layers.5.content_moe.experts.3.w3.weight": "model-00006-of-00008.safetensors",
"model.layers.5.reasoning_moe.experts.4.w1.weight": "model-00006-of-00008.safetensors",
"model.layers.5.content_moe.experts.4.w1.weight": "model-00006-of-00008.safetensors",
"model.layers.5.reasoning_moe.experts.4.w2.weight": "model-00006-of-00008.safetensors",
"model.layers.5.content_moe.experts.4.w2.weight": "model-00006-of-00008.safetensors",
"model.layers.5.reasoning_moe.experts.4.w3.weight": "model-00006-of-00008.safetensors",
"model.layers.5.content_moe.experts.4.w3.weight": "model-00006-of-00008.safetensors",
"model.layers.5.reasoning_moe.experts.5.w1.weight": "model-00006-of-00008.safetensors",
"model.layers.5.content_moe.experts.5.w1.weight": "model-00006-of-00008.safetensors",
"model.layers.5.reasoning_moe.experts.5.w2.weight": "model-00006-of-00008.safetensors",
"model.layers.5.content_moe.experts.5.w2.weight": "model-00006-of-00008.safetensors",
"model.layers.5.reasoning_moe.experts.5.w3.weight": "model-00006-of-00008.safetensors",
"model.layers.5.content_moe.experts.5.w3.weight": "model-00006-of-00008.safetensors",
"model.layers.5.reasoning_moe.experts.6.w1.weight": "model-00006-of-00008.safetensors",
"model.layers.5.content_moe.experts.6.w1.weight": "model-00006-of-00008.safetensors",
"model.layers.5.reasoning_moe.experts.6.w2.weight": "model-00006-of-00008.safetensors",
"model.layers.5.content_moe.experts.6.w2.weight": "model-00006-of-00008.safetensors",
"model.layers.5.reasoning_moe.experts.6.w3.weight": "model-00006-of-00008.safetensors",
"model.layers.5.content_moe.experts.6.w3.weight": "model-00006-of-00008.safetensors",
"model.layers.5.reasoning_moe.experts.7.w1.weight": "model-00006-of-00008.safetensors",
"model.layers.5.content_moe.experts.7.w1.weight": "model-00006-of-00008.safetensors",
"model.layers.5.reasoning_moe.experts.7.w2.weight": "model-00006-of-00008.safetensors",
"model.layers.5.content_moe.experts.7.w2.weight": "model-00006-of-00008.safetensors",
"model.layers.5.reasoning_moe.experts.7.w3.weight": "model-00006-of-00008.safetensors",
"model.layers.5.content_moe.experts.7.w3.weight": "model-00006-of-00008.safetensors",
"model.layers.5.reasoning_moe.gate.weight": "model-00006-of-00008.safetensors",
"model.layers.5.content_moe.gate.weight": "model-00006-of-00008.safetensors",
"model.layers.5.input_reasoning_layernorm.bias": "model-00006-of-00008.safetensors",
"model.layers.5.input_content_layernorm.bias": "model-00006-of-00008.safetensors",
"model.layers.5.input_reasoning_layernorm.weight": "model-00006-of-00008.safetensors",
"model.layers.5.input_content_layernorm.weight": "model-00006-of-00008.safetensors",
"model.layers.5.post_attention_reasoning_layernorm.bias": "model-00006-of-00008.safetensors",
"model.layers.5.post_attention_content_layernorm.bias": "model-00006-of-00008.safetensors",
"model.layers.5.post_attention_reasoning_layernorm.weight": "model-00006-of-00008.safetensors",
"model.layers.5.post_attention_content_layernorm.weight": "model-00006-of-00008.safetensors",
"model.layers.5.reasoning_self_attn.k_proj.bias": "model-00006-of-00008.safetensors",
"model.layers.5.content_self_attn.k_proj.bias": "model-00006-of-00008.safetensors",
"model.layers.5.reasoning_self_attn.k_proj.weight": "model-00006-of-00008.safetensors",
"model.layers.5.content_self_attn.k_proj.weight": "model-00006-of-00008.safetensors",
"model.layers.5.reasoning_self_attn.o_proj.bias": "model-00006-of-00008.safetensors",
"model.layers.5.content_self_attn.o_proj.bias": "model-00006-of-00008.safetensors",
"model.layers.5.reasoning_self_attn.o_proj.weight": "model-00006-of-00008.safetensors",
"model.layers.5.content_self_attn.o_proj.weight": "model-00006-of-00008.safetensors",
"model.layers.5.reasoning_self_attn.q_proj.bias": "model-00006-of-00008.safetensors",
"model.layers.5.content_self_attn.q_proj.bias": "model-00006-of-00008.safetensors",
"model.layers.5.reasoning_self_attn.q_proj.weight": "model-00006-of-00008.safetensors",
"model.layers.5.content_self_attn.q_proj.weight": "model-00006-of-00008.safetensors",
"model.layers.5.reasoning_self_attn.v_proj.bias": "model-00006-of-00008.safetensors",
"model.layers.5.content_self_attn.v_proj.bias": "model-00006-of-00008.safetensors",
"model.layers.5.reasoning_self_attn.v_proj.weight": "model-00006-of-00008.safetensors",
"model.layers.5.content_self_attn.v_proj.weight": "model-00006-of-00008.safetensors",
"model.layers.6.reasoning_moe.experts.0.w1.weight": "model-00006-of-00008.safetensors",
"model.layers.6.content_moe.experts.0.w1.weight": "model-00006-of-00008.safetensors",
"model.layers.6.reasoning_moe.experts.0.w2.weight": "model-00006-of-00008.safetensors",
"model.layers.6.content_moe.experts.0.w2.weight": "model-00006-of-00008.safetensors",
"model.layers.6.reasoning_moe.experts.0.w3.weight": "model-00006-of-00008.safetensors",
"model.layers.6.content_moe.experts.0.w3.weight": "model-00006-of-00008.safetensors",
"model.layers.6.reasoning_moe.experts.1.w1.weight": "model-00006-of-00008.safetensors",
"model.layers.6.content_moe.experts.1.w1.weight": "model-00006-of-00008.safetensors",
"model.layers.6.reasoning_moe.experts.1.w2.weight": "model-00006-of-00008.safetensors",
"model.layers.6.content_moe.experts.1.w2.weight": "model-00006-of-00008.safetensors",
"model.layers.6.reasoning_moe.experts.1.w3.weight": "model-00006-of-00008.safetensors",
"model.layers.6.content_moe.experts.1.w3.weight": "model-00006-of-00008.safetensors",
"model.layers.6.reasoning_moe.experts.2.w1.weight": "model-00006-of-00008.safetensors",
"model.layers.6.content_moe.experts.2.w1.weight": "model-00006-of-00008.safetensors",
"model.layers.6.reasoning_moe.experts.2.w2.weight": "model-00006-of-00008.safetensors",
"model.layers.6.content_moe.experts.2.w2.weight": "model-00006-of-00008.safetensors",
"model.layers.6.reasoning_moe.experts.2.w3.weight": "model-00006-of-00008.safetensors",
"model.layers.6.content_moe.experts.2.w3.weight": "model-00006-of-00008.safetensors",
"model.layers.6.reasoning_moe.experts.3.w1.weight": "model-00006-of-00008.safetensors",
"model.layers.6.content_moe.experts.3.w1.weight": "model-00007-of-00008.safetensors",
"model.layers.6.reasoning_moe.experts.3.w2.weight": "model-00007-of-00008.safetensors",
"model.layers.6.content_moe.experts.3.w2.weight": "model-00007-of-00008.safetensors",
"model.layers.6.reasoning_moe.experts.3.w3.weight": "model-00007-of-00008.safetensors",
"model.layers.6.content_moe.experts.3.w3.weight": "model-00007-of-00008.safetensors",
"model.layers.6.reasoning_moe.experts.4.w1.weight": "model-00007-of-00008.safetensors",
"model.layers.6.content_moe.experts.4.w1.weight": "model-00007-of-00008.safetensors",
"model.layers.6.reasoning_moe.experts.4.w2.weight": "model-00007-of-00008.safetensors",
"model.layers.6.content_moe.experts.4.w2.weight": "model-00007-of-00008.safetensors",
"model.layers.6.reasoning_moe.experts.4.w3.weight": "model-00007-of-00008.safetensors",
"model.layers.6.content_moe.experts.4.w3.weight": "model-00007-of-00008.safetensors",
"model.layers.6.reasoning_moe.experts.5.w1.weight": "model-00007-of-00008.safetensors",
"model.layers.6.content_moe.experts.5.w1.weight": "model-00007-of-00008.safetensors",
"model.layers.6.reasoning_moe.experts.5.w2.weight": "model-00007-of-00008.safetensors",
"model.layers.6.content_moe.experts.5.w2.weight": "model-00007-of-00008.safetensors",
"model.layers.6.reasoning_moe.experts.5.w3.weight": "model-00007-of-00008.safetensors",
"model.layers.6.content_moe.experts.5.w3.weight": "model-00007-of-00008.safetensors",
"model.layers.6.reasoning_moe.experts.6.w1.weight": "model-00007-of-00008.safetensors",
"model.layers.6.content_moe.experts.6.w1.weight": "model-00007-of-00008.safetensors",
"model.layers.6.reasoning_moe.experts.6.w2.weight": "model-00007-of-00008.safetensors",
"model.layers.6.content_moe.experts.6.w2.weight": "model-00007-of-00008.safetensors",
"model.layers.6.reasoning_moe.experts.6.w3.weight": "model-00007-of-00008.safetensors",
"model.layers.6.content_moe.experts.6.w3.weight": "model-00007-of-00008.safetensors",
"model.layers.6.reasoning_moe.experts.7.w1.weight": "model-00007-of-00008.safetensors",
"model.layers.6.content_moe.experts.7.w1.weight": "model-00007-of-00008.safetensors",
"model.layers.6.reasoning_moe.experts.7.w2.weight": "model-00007-of-00008.safetensors",
"model.layers.6.content_moe.experts.7.w2.weight": "model-00007-of-00008.safetensors",
"model.layers.6.reasoning_moe.experts.7.w3.weight": "model-00007-of-00008.safetensors",
"model.layers.6.content_moe.experts.7.w3.weight": "model-00007-of-00008.safetensors",
"model.layers.6.reasoning_moe.gate.weight": "model-00007-of-00008.safetensors",
"model.layers.6.content_moe.gate.weight": "model-00007-of-00008.safetensors",
"model.layers.6.input_reasoning_layernorm.bias": "model-00007-of-00008.safetensors",
"model.layers.6.input_content_layernorm.bias": "model-00007-of-00008.safetensors",
"model.layers.6.input_reasoning_layernorm.weight": "model-00007-of-00008.safetensors",
"model.layers.6.input_content_layernorm.weight": "model-00007-of-00008.safetensors",
"model.layers.6.post_attention_reasoning_layernorm.bias": "model-00007-of-00008.safetensors",
"model.layers.6.post_attention_content_layernorm.bias": "model-00007-of-00008.safetensors",
"model.layers.6.post_attention_reasoning_layernorm.weight": "model-00007-of-00008.safetensors",
"model.layers.6.post_attention_content_layernorm.weight": "model-00007-of-00008.safetensors",
"model.layers.6.reasoning_self_attn.k_proj.bias": "model-00007-of-00008.safetensors",
"model.layers.6.content_self_attn.k_proj.bias": "model-00007-of-00008.safetensors",
"model.layers.6.reasoning_self_attn.k_proj.weight": "model-00007-of-00008.safetensors",
"model.layers.6.content_self_attn.k_proj.weight": "model-00007-of-00008.safetensors",
"model.layers.6.reasoning_self_attn.o_proj.bias": "model-00007-of-00008.safetensors",
"model.layers.6.content_self_attn.o_proj.bias": "model-00007-of-00008.safetensors",
"model.layers.6.reasoning_self_attn.o_proj.weight": "model-00007-of-00008.safetensors",
"model.layers.6.content_self_attn.o_proj.weight": "model-00007-of-00008.safetensors",
"model.layers.6.reasoning_self_attn.q_proj.bias": "model-00007-of-00008.safetensors",
"model.layers.6.content_self_attn.q_proj.bias": "model-00007-of-00008.safetensors",
"model.layers.6.reasoning_self_attn.q_proj.weight": "model-00007-of-00008.safetensors",
"model.layers.6.content_self_attn.q_proj.weight": "model-00007-of-00008.safetensors",
"model.layers.6.reasoning_self_attn.v_proj.bias": "model-00007-of-00008.safetensors",
"model.layers.6.content_self_attn.v_proj.bias": "model-00007-of-00008.safetensors",
"model.layers.6.reasoning_self_attn.v_proj.weight": "model-00007-of-00008.safetensors",
"model.layers.6.content_self_attn.v_proj.weight": "model-00007-of-00008.safetensors",
"model.layers.7.reasoning_moe.experts.0.w1.weight": "model-00007-of-00008.safetensors",
"model.layers.7.content_moe.experts.0.w1.weight": "model-00007-of-00008.safetensors",
"model.layers.7.reasoning_moe.experts.0.w2.weight": "model-00007-of-00008.safetensors",
"model.layers.7.content_moe.experts.0.w2.weight": "model-00007-of-00008.safetensors",
"model.layers.7.reasoning_moe.experts.0.w3.weight": "model-00007-of-00008.safetensors",
"model.layers.7.content_moe.experts.0.w3.weight": "model-00007-of-00008.safetensors",
"model.layers.7.reasoning_moe.experts.1.w1.weight": "model-00007-of-00008.safetensors",
"model.layers.7.content_moe.experts.1.w1.weight": "model-00007-of-00008.safetensors",
"model.layers.7.reasoning_moe.experts.1.w2.weight": "model-00007-of-00008.safetensors",
"model.layers.7.content_moe.experts.1.w2.weight": "model-00007-of-00008.safetensors",
"model.layers.7.reasoning_moe.experts.1.w3.weight": "model-00007-of-00008.safetensors",
"model.layers.7.content_moe.experts.1.w3.weight": "model-00007-of-00008.safetensors",
"model.layers.7.reasoning_moe.experts.2.w1.weight": "model-00007-of-00008.safetensors",
"model.layers.7.content_moe.experts.2.w1.weight": "model-00007-of-00008.safetensors",
"model.layers.7.reasoning_moe.experts.2.w2.weight": "model-00007-of-00008.safetensors",
"model.layers.7.content_moe.experts.2.w2.weight": "model-00007-of-00008.safetensors",
"model.layers.7.reasoning_moe.experts.2.w3.weight": "model-00007-of-00008.safetensors",
"model.layers.7.content_moe.experts.2.w3.weight": "model-00007-of-00008.safetensors",
"model.layers.7.reasoning_moe.experts.3.w1.weight": "model-00007-of-00008.safetensors",
"model.layers.7.content_moe.experts.3.w1.weight": "model-00007-of-00008.safetensors",
"model.layers.7.reasoning_moe.experts.3.w2.weight": "model-00007-of-00008.safetensors",
"model.layers.7.content_moe.experts.3.w2.weight": "model-00007-of-00008.safetensors",
"model.layers.7.reasoning_moe.experts.3.w3.weight": "model-00007-of-00008.safetensors",
"model.layers.7.content_moe.experts.3.w3.weight": "model-00007-of-00008.safetensors",
"model.layers.7.reasoning_moe.experts.4.w1.weight": "model-00007-of-00008.safetensors",
"model.layers.7.content_moe.experts.4.w1.weight": "model-00007-of-00008.safetensors",
"model.layers.7.reasoning_moe.experts.4.w2.weight": "model-00007-of-00008.safetensors",
"model.layers.7.content_moe.experts.4.w2.weight": "model-00007-of-00008.safetensors",
"model.layers.7.reasoning_moe.experts.4.w3.weight": "model-00007-of-00008.safetensors",
"model.layers.7.content_moe.experts.4.w3.weight": "model-00007-of-00008.safetensors",
"model.layers.7.reasoning_moe.experts.5.w1.weight": "model-00007-of-00008.safetensors",
"model.layers.7.content_moe.experts.5.w1.weight": "model-00007-of-00008.safetensors",
"model.layers.7.reasoning_moe.experts.5.w2.weight": "model-00007-of-00008.safetensors",
"model.layers.7.content_moe.experts.5.w2.weight": "model-00007-of-00008.safetensors",
"model.layers.7.reasoning_moe.experts.5.w3.weight": "model-00007-of-00008.safetensors",
"model.layers.7.content_moe.experts.5.w3.weight": "model-00007-of-00008.safetensors",
"model.layers.7.reasoning_moe.experts.6.w1.weight": "model-00007-of-00008.safetensors",
"model.layers.7.content_moe.experts.6.w1.weight": "model-00007-of-00008.safetensors",
"model.layers.7.reasoning_moe.experts.6.w2.weight": "model-00007-of-00008.safetensors",
"model.layers.7.content_moe.experts.6.w2.weight": "model-00007-of-00008.safetensors",
"model.layers.7.reasoning_moe.experts.6.w3.weight": "model-00007-of-00008.safetensors",
"model.layers.7.content_moe.experts.6.w3.weight": "model-00007-of-00008.safetensors",
"model.layers.7.reasoning_moe.experts.7.w1.weight": "model-00007-of-00008.safetensors",
"model.layers.7.content_moe.experts.7.w1.weight": "model-00007-of-00008.safetensors",
"model.layers.7.reasoning_moe.experts.7.w2.weight": "model-00007-of-00008.safetensors",
"model.layers.7.content_moe.experts.7.w2.weight": "model-00007-of-00008.safetensors",
"model.layers.7.reasoning_moe.experts.7.w3.weight": "model-00007-of-00008.safetensors",
"model.layers.7.content_moe.experts.7.w3.weight": "model-00007-of-00008.safetensors",
"model.layers.7.reasoning_moe.gate.weight": "model-00007-of-00008.safetensors",
"model.layers.7.content_moe.gate.weight": "model-00007-of-00008.safetensors",
"model.layers.7.input_reasoning_layernorm.bias": "model-00007-of-00008.safetensors",
"model.layers.7.input_content_layernorm.bias": "model-00007-of-00008.safetensors",
"model.layers.7.input_reasoning_layernorm.weight": "model-00007-of-00008.safetensors",
"model.layers.7.input_content_layernorm.weight": "model-00007-of-00008.safetensors",
"model.layers.7.post_attention_reasoning_layernorm.bias": "model-00007-of-00008.safetensors",
"model.layers.7.post_attention_content_layernorm.bias": "model-00007-of-00008.safetensors",
"model.layers.7.post_attention_reasoning_layernorm.weight": "model-00007-of-00008.safetensors",
"model.layers.7.post_attention_content_layernorm.weight": "model-00007-of-00008.safetensors",
"model.layers.7.reasoning_self_attn.k_proj.bias": "model-00007-of-00008.safetensors",
"model.layers.7.content_self_attn.k_proj.bias": "model-00007-of-00008.safetensors",
"model.layers.7.reasoning_self_attn.k_proj.weight": "model-00007-of-00008.safetensors",
"model.layers.7.content_self_attn.k_proj.weight": "model-00007-of-00008.safetensors",
"model.layers.7.reasoning_self_attn.o_proj.bias": "model-00007-of-00008.safetensors",
"model.layers.7.content_self_attn.o_proj.bias": "model-00007-of-00008.safetensors",
"model.layers.7.reasoning_self_attn.o_proj.weight": "model-00007-of-00008.safetensors",
"model.layers.7.content_self_attn.o_proj.weight": "model-00007-of-00008.safetensors",
"model.layers.7.reasoning_self_attn.q_proj.bias": "model-00007-of-00008.safetensors",
"model.layers.7.content_self_attn.q_proj.bias": "model-00007-of-00008.safetensors",
"model.layers.7.reasoning_self_attn.q_proj.weight": "model-00007-of-00008.safetensors",
"model.layers.7.content_self_attn.q_proj.weight": "model-00007-of-00008.safetensors",
"model.layers.7.reasoning_self_attn.v_proj.bias": "model-00007-of-00008.safetensors",
"model.layers.7.content_self_attn.v_proj.bias": "model-00007-of-00008.safetensors",
"model.layers.7.reasoning_self_attn.v_proj.weight": "model-00007-of-00008.safetensors",
"model.layers.7.content_self_attn.v_proj.weight": "model-00007-of-00008.safetensors",
"model.layers.8.reasoning_moe.experts.0.w1.weight": "model-00007-of-00008.safetensors",
"model.layers.8.content_moe.experts.0.w1.weight": "model-00007-of-00008.safetensors",
"model.layers.8.reasoning_moe.experts.0.w2.weight": "model-00007-of-00008.safetensors",
"model.layers.8.content_moe.experts.0.w2.weight": "model-00007-of-00008.safetensors",
"model.layers.8.reasoning_moe.experts.0.w3.weight": "model-00007-of-00008.safetensors",
"model.layers.8.content_moe.experts.0.w3.weight": "model-00007-of-00008.safetensors",
"model.layers.8.reasoning_moe.experts.1.w1.weight": "model-00007-of-00008.safetensors",
"model.layers.8.content_moe.experts.1.w1.weight": "model-00007-of-00008.safetensors",
"model.layers.8.reasoning_moe.experts.1.w2.weight": "model-00007-of-00008.safetensors",
"model.layers.8.content_moe.experts.1.w2.weight": "model-00007-of-00008.safetensors",
"model.layers.8.reasoning_moe.experts.1.w3.weight": "model-00007-of-00008.safetensors",
"model.layers.8.content_moe.experts.1.w3.weight": "model-00007-of-00008.safetensors",
"model.layers.8.reasoning_moe.experts.2.w1.weight": "model-00007-of-00008.safetensors",
"model.layers.8.content_moe.experts.2.w1.weight": "model-00007-of-00008.safetensors",
"model.layers.8.reasoning_moe.experts.2.w2.weight": "model-00007-of-00008.safetensors",
"model.layers.8.content_moe.experts.2.w2.weight": "model-00007-of-00008.safetensors",
"model.layers.8.reasoning_moe.experts.2.w3.weight": "model-00007-of-00008.safetensors",
"model.layers.8.content_moe.experts.2.w3.weight": "model-00007-of-00008.safetensors",
"model.layers.8.reasoning_moe.experts.3.w1.weight": "model-00007-of-00008.safetensors",
"model.layers.8.content_moe.experts.3.w1.weight": "model-00007-of-00008.safetensors",
"model.layers.8.reasoning_moe.experts.3.w2.weight": "model-00007-of-00008.safetensors",
"model.layers.8.content_moe.experts.3.w2.weight": "model-00007-of-00008.safetensors",
"model.layers.8.reasoning_moe.experts.3.w3.weight": "model-00007-of-00008.safetensors",
"model.layers.8.content_moe.experts.3.w3.weight": "model-00007-of-00008.safetensors",
"model.layers.8.reasoning_moe.experts.4.w1.weight": "model-00007-of-00008.safetensors",
"model.layers.8.content_moe.experts.4.w1.weight": "model-00007-of-00008.safetensors",
"model.layers.8.reasoning_moe.experts.4.w2.weight": "model-00007-of-00008.safetensors",
"model.layers.8.content_moe.experts.4.w2.weight": "model-00007-of-00008.safetensors",
"model.layers.8.reasoning_moe.experts.4.w3.weight": "model-00007-of-00008.safetensors",
"model.layers.8.content_moe.experts.4.w3.weight": "model-00007-of-00008.safetensors",
"model.layers.8.reasoning_moe.experts.5.w1.weight": "model-00007-of-00008.safetensors",
"model.layers.8.content_moe.experts.5.w1.weight": "model-00007-of-00008.safetensors",
"model.layers.8.reasoning_moe.experts.5.w2.weight": "model-00007-of-00008.safetensors",
"model.layers.8.content_moe.experts.5.w2.weight": "model-00007-of-00008.safetensors",
"model.layers.8.reasoning_moe.experts.5.w3.weight": "model-00007-of-00008.safetensors",
"model.layers.8.content_moe.experts.5.w3.weight": "model-00007-of-00008.safetensors",
"model.layers.8.reasoning_moe.experts.6.w1.weight": "model-00007-of-00008.safetensors",
"model.layers.8.content_moe.experts.6.w1.weight": "model-00007-of-00008.safetensors",
"model.layers.8.reasoning_moe.experts.6.w2.weight": "model-00007-of-00008.safetensors",
"model.layers.8.content_moe.experts.6.w2.weight": "model-00007-of-00008.safetensors",
"model.layers.8.reasoning_moe.experts.6.w3.weight": "model-00007-of-00008.safetensors",
"model.layers.8.content_moe.experts.6.w3.weight": "model-00007-of-00008.safetensors",
"model.layers.8.reasoning_moe.experts.7.w1.weight": "model-00007-of-00008.safetensors",
"model.layers.8.content_moe.experts.7.w1.weight": "model-00007-of-00008.safetensors",
"model.layers.8.reasoning_moe.experts.7.w2.weight": "model-00007-of-00008.safetensors",
"model.layers.8.content_moe.experts.7.w2.weight": "model-00007-of-00008.safetensors",
"model.layers.8.reasoning_moe.experts.7.w3.weight": "model-00007-of-00008.safetensors",
"model.layers.8.content_moe.experts.7.w3.weight": "model-00007-of-00008.safetensors",
"model.layers.8.reasoning_moe.gate.weight": "model-00007-of-00008.safetensors",
"model.layers.8.content_moe.gate.weight": "model-00007-of-00008.safetensors",
"model.layers.8.input_reasoning_layernorm.bias": "model-00007-of-00008.safetensors",
"model.layers.8.input_content_layernorm.bias": "model-00007-of-00008.safetensors",
"model.layers.8.input_reasoning_layernorm.weight": "model-00007-of-00008.safetensors",
"model.layers.8.input_content_layernorm.weight": "model-00007-of-00008.safetensors",
"model.layers.8.post_attention_reasoning_layernorm.bias": "model-00007-of-00008.safetensors",
"model.layers.8.post_attention_content_layernorm.bias": "model-00007-of-00008.safetensors",
"model.layers.8.post_attention_reasoning_layernorm.weight": "model-00007-of-00008.safetensors",
"model.layers.8.post_attention_content_layernorm.weight": "model-00007-of-00008.safetensors",
"model.layers.8.reasoning_self_attn.k_proj.bias": "model-00007-of-00008.safetensors",
"model.layers.8.content_self_attn.k_proj.bias": "model-00007-of-00008.safetensors",
"model.layers.8.reasoning_self_attn.k_proj.weight": "model-00007-of-00008.safetensors",
"model.layers.8.content_self_attn.k_proj.weight": "model-00007-of-00008.safetensors",
"model.layers.8.reasoning_self_attn.o_proj.bias": "model-00007-of-00008.safetensors",
"model.layers.8.content_self_attn.o_proj.bias": "model-00007-of-00008.safetensors",
"model.layers.8.reasoning_self_attn.o_proj.weight": "model-00007-of-00008.safetensors",
"model.layers.8.content_self_attn.o_proj.weight": "model-00007-of-00008.safetensors",
"model.layers.8.reasoning_self_attn.q_proj.bias": "model-00007-of-00008.safetensors",
"model.layers.8.content_self_attn.q_proj.bias": "model-00007-of-00008.safetensors",
"model.layers.8.reasoning_self_attn.q_proj.weight": "model-00007-of-00008.safetensors",
"model.layers.8.content_self_attn.q_proj.weight": "model-00007-of-00008.safetensors",
"model.layers.8.reasoning_self_attn.v_proj.bias": "model-00007-of-00008.safetensors",
"model.layers.8.content_self_attn.v_proj.bias": "model-00007-of-00008.safetensors",
"model.layers.8.reasoning_self_attn.v_proj.weight": "model-00007-of-00008.safetensors",
"model.layers.8.content_self_attn.v_proj.weight": "model-00007-of-00008.safetensors",
"model.layers.9.reasoning_moe.experts.0.w1.weight": "model-00007-of-00008.safetensors",
"model.layers.9.content_moe.experts.0.w1.weight": "model-00007-of-00008.safetensors",
"model.layers.9.reasoning_moe.experts.0.w2.weight": "model-00007-of-00008.safetensors",
"model.layers.9.content_moe.experts.0.w2.weight": "model-00007-of-00008.safetensors",
"model.layers.9.reasoning_moe.experts.0.w3.weight": "model-00007-of-00008.safetensors",
"model.layers.9.content_moe.experts.0.w3.weight": "model-00007-of-00008.safetensors",
"model.layers.9.reasoning_moe.experts.1.w1.weight": "model-00007-of-00008.safetensors",
"model.layers.9.content_moe.experts.1.w1.weight": "model-00007-of-00008.safetensors",
"model.layers.9.reasoning_moe.experts.1.w2.weight": "model-00007-of-00008.safetensors",
"model.layers.9.content_moe.experts.1.w2.weight": "model-00007-of-00008.safetensors",
"model.layers.9.reasoning_moe.experts.1.w3.weight": "model-00007-of-00008.safetensors",
"model.layers.9.content_moe.experts.1.w3.weight": "model-00007-of-00008.safetensors",
"model.layers.9.reasoning_moe.experts.2.w1.weight": "model-00007-of-00008.safetensors",
"model.layers.9.content_moe.experts.2.w1.weight": "model-00007-of-00008.safetensors",
"model.layers.9.reasoning_moe.experts.2.w2.weight": "model-00007-of-00008.safetensors",
"model.layers.9.content_moe.experts.2.w2.weight": "model-00007-of-00008.safetensors",
"model.layers.9.reasoning_moe.experts.2.w3.weight": "model-00007-of-00008.safetensors",
"model.layers.9.content_moe.experts.2.w3.weight": "model-00007-of-00008.safetensors",
"model.layers.9.reasoning_moe.experts.3.w1.weight": "model-00007-of-00008.safetensors",
"model.layers.9.content_moe.experts.3.w1.weight": "model-00007-of-00008.safetensors",
"model.layers.9.reasoning_moe.experts.3.w2.weight": "model-00007-of-00008.safetensors",
"model.layers.9.content_moe.experts.3.w2.weight": "model-00007-of-00008.safetensors",
"model.layers.9.reasoning_moe.experts.3.w3.weight": "model-00007-of-00008.safetensors",
"model.layers.9.content_moe.experts.3.w3.weight": "model-00007-of-00008.safetensors",
"model.layers.9.reasoning_moe.experts.4.w1.weight": "model-00007-of-00008.safetensors",
"model.layers.9.content_moe.experts.4.w1.weight": "model-00007-of-00008.safetensors",
"model.layers.9.reasoning_moe.experts.4.w2.weight": "model-00007-of-00008.safetensors",
"model.layers.9.content_moe.experts.4.w2.weight": "model-00007-of-00008.safetensors",
"model.layers.9.reasoning_moe.experts.4.w3.weight": "model-00007-of-00008.safetensors",
"model.layers.9.content_moe.experts.4.w3.weight": "model-00007-of-00008.safetensors",
"model.layers.9.reasoning_moe.experts.5.w1.weight": "model-00007-of-00008.safetensors",
"model.layers.9.content_moe.experts.5.w1.weight": "model-00007-of-00008.safetensors",
"model.layers.9.reasoning_moe.experts.5.w2.weight": "model-00007-of-00008.safetensors",
"model.layers.9.content_moe.experts.5.w2.weight": "model-00007-of-00008.safetensors",
"model.layers.9.reasoning_moe.experts.5.w3.weight": "model-00007-of-00008.safetensors",
"model.layers.9.content_moe.experts.5.w3.weight": "model-00007-of-00008.safetensors",
"model.layers.9.reasoning_moe.experts.6.w1.weight": "model-00007-of-00008.safetensors",
"model.layers.9.content_moe.experts.6.w1.weight": "model-00007-of-00008.safetensors",
"model.layers.9.reasoning_moe.experts.6.w2.weight": "model-00007-of-00008.safetensors",
"model.layers.9.content_moe.experts.6.w2.weight": "model-00007-of-00008.safetensors",
"model.layers.9.reasoning_moe.experts.6.w3.weight": "model-00007-of-00008.safetensors",
"model.layers.9.content_moe.experts.6.w3.weight": "model-00007-of-00008.safetensors",
"model.layers.9.reasoning_moe.experts.7.w1.weight": "model-00007-of-00008.safetensors",
"model.layers.9.content_moe.experts.7.w1.weight": "model-00007-of-00008.safetensors",
"model.layers.9.reasoning_moe.experts.7.w2.weight": "model-00007-of-00008.safetensors",
"model.layers.9.content_moe.experts.7.w2.weight": "model-00007-of-00008.safetensors",
"model.layers.9.reasoning_moe.experts.7.w3.weight": "model-00007-of-00008.safetensors",
"model.layers.9.content_moe.experts.7.w3.weight": "model-00007-of-00008.safetensors",
"model.layers.9.reasoning_moe.gate.weight": "model-00007-of-00008.safetensors",
"model.layers.9.content_moe.gate.weight": "model-00007-of-00008.safetensors",
"model.layers.9.input_reasoning_layernorm.bias": "model-00007-of-00008.safetensors",
"model.layers.9.input_content_layernorm.bias": "model-00007-of-00008.safetensors",
"model.layers.9.input_reasoning_layernorm.weight": "model-00007-of-00008.safetensors",
"model.layers.9.input_content_layernorm.weight": "model-00007-of-00008.safetensors",
"model.layers.9.post_attention_reasoning_layernorm.bias": "model-00007-of-00008.safetensors",
"model.layers.9.post_attention_content_layernorm.bias": "model-00007-of-00008.safetensors",
"model.layers.9.post_attention_reasoning_layernorm.weight": "model-00007-of-00008.safetensors",
"model.layers.9.post_attention_content_layernorm.weight": "model-00007-of-00008.safetensors",
"model.layers.9.reasoning_self_attn.k_proj.bias": "model-00007-of-00008.safetensors",
"model.layers.9.content_self_attn.k_proj.bias": "model-00007-of-00008.safetensors",
"model.layers.9.reasoning_self_attn.k_proj.weight": "model-00007-of-00008.safetensors",
"model.layers.9.content_self_attn.k_proj.weight": "model-00007-of-00008.safetensors",
"model.layers.9.reasoning_self_attn.o_proj.bias": "model-00007-of-00008.safetensors",
"model.layers.9.content_self_attn.o_proj.bias": "model-00007-of-00008.safetensors",
"model.layers.9.reasoning_self_attn.o_proj.weight": "model-00007-of-00008.safetensors",
"model.layers.9.content_self_attn.o_proj.weight": "model-00007-of-00008.safetensors",
"model.layers.9.reasoning_self_attn.q_proj.bias": "model-00007-of-00008.safetensors",
"model.layers.9.content_self_attn.q_proj.bias": "model-00007-of-00008.safetensors",
"model.layers.9.reasoning_self_attn.q_proj.weight": "model-00007-of-00008.safetensors",
"model.layers.9.content_self_attn.q_proj.weight": "model-00007-of-00008.safetensors",
"model.layers.9.reasoning_self_attn.v_proj.bias": "model-00007-of-00008.safetensors",
"model.layers.9.content_self_attn.v_proj.bias": "model-00007-of-00008.safetensors",
"model.layers.9.reasoning_self_attn.v_proj.weight": "model-00007-of-00008.safetensors",
"model.layers.9.content_self_attn.v_proj.weight": "model-00007-of-00008.safetensors",
"model.reasoning_norm.bias": "model-00007-of-00008.safetensors",
"model.content_norm.bias": "model-00007-of-00008.safetensors",
"model.reasoning_norm.weight": "model-00007-of-00008.safetensors",
"model.content_norm.weight": "model-00007-of-00008.safetensors"
}
}