{
  "changed": {
    "vocab_size": {
      "from": 152064,
      "to": 151936
    },
    "_name_or_path": {
      "from": "Qwen/Qwen2.5-72B-Instruct",
      "to": ""
    },
    "tie_word_embeddings": {
      "from": false,
      "to": true
    },
    "eos_token_id": {
      "from": 151645,
      "to": null
    },
    "model_type": {
      "from": "qwen2",
      "to": "qwen3"
    },
    "architectures": {
      "from": [
        "Qwen2ForCausalLM"
      ],
      "to": [
        "Qwen3ForCausalLM"
      ]
    },
    "bos_token_id": {
      "from": 151643,
      "to": null
    }
  },
  "added": {
    "attention_bias": false,
    "head_dim": 128
  },
  "removed": {}
}