# Merge configuration: SLERP of two models, using
# NousResearch/Nous-Hermes-2-Mistral-7B-DPO as the base model.
models:
  - model: NousResearch/Nous-Hermes-2-Mistral-7B-DPO
  - model: mlabonne/AlphaMonarch-7B
merge_method: slerp
base_model: NousResearch/Nous-Hermes-2-Mistral-7B-DPO
dtype: bfloat16
parameters:
  # Interpolation curve that rises from 0 to 1 and falls back to 0:
  # Hermes (the base model) for the input & output layers, AlphaMonarch
  # in the middle layers.
  t: [0, 0.5, 1, 0.5, 0]