# Model-merge configuration: combines the two models listed under `sources`
# using the `slerp` merge method, with the first model also set as base_model.
# NOTE(review): key layout matches a mergekit config — confirm the consuming tool.
slices:
  - sources:
      # Both sources contribute the same layer range.
      - model: FelixChao/WestSeverus-7B-DPO-v2
        layer_range: [0, 32]
      - model: macadeliccc/WestLake-7B-v2-laser-truthy-dpo
        layer_range: [0, 32]
merge_method: slerp
base_model: FelixChao/WestSeverus-7B-DPO-v2
parameters:
  t:
    # Per-filter value lists; the two lists are mirror images of each other.
    - filter: self_attn
      value: [0, 0.5, 0.3, 0.7, 1]
    - filter: mlp
      value: [1, 0.5, 0.7, 0.3, 0]
    # Entry without a filter (presumably the fallback for all other tensors;
    # verify against the tool's documentation).
    - value: 0.5
# The original left this value empty because `bfloat16` was commented out;
# it is written as an explicit null here so the parsed result is unchanged.
# NOTE(review): set to `bfloat16` if that was the intent — confirm.
# Original author's note: bfloat16 is faster than float16 during training.
dtype: null