---
# Passthrough merge that stacks four layer slices, all taken from the same
# source model. The two middle slices reuse layer_range [8, 24] with the
# o_proj and down_proj tensors scaled to 0.0 and every other tensor left at 1.0.
# NOTE(review): `parameters` is nested under each source entry (sibling of
# `layer_range` / `model`), reconstructed from the key order of the collapsed
# original — confirm against the config this was copied from.
dtype: bfloat16
merge_method: passthrough
slices:
  # Slice 1: layer_range [0, 24], no parameter overrides.
  - sources:
      - layer_range: [0, 24]
        model: chujiezheng/Llama-3-Instruct-8B-SimPO-ExPO

  # Slice 2: layer_range [8, 24] with o_proj / down_proj scaled to zero.
  - sources:
      - layer_range: [8, 24]
        model: chujiezheng/Llama-3-Instruct-8B-SimPO-ExPO
        parameters:
          scale:
            - filter: o_proj
              value: 0.0
            - filter: down_proj
              value: 0.0
            # Entry without a filter: applies to the remaining tensors
            # (presumably as the default — verify against mergekit docs).
            - value: 1.0

  # Slice 3: same range and scaling as slice 2, repeated.
  - sources:
      - layer_range: [8, 24]
        model: chujiezheng/Llama-3-Instruct-8B-SimPO-ExPO
        parameters:
          scale:
            - filter: o_proj
              value: 0.0
            - filter: down_proj
              value: 0.0
            - value: 1.0

  # Slice 4: layer_range [24, 32], no parameter overrides.
  - sources:
      - layer_range: [24, 32]
        model: chujiezheng/Llama-3-Instruct-8B-SimPO-ExPO