---
# Model-merge configuration: merges ./tulu-2-dpo-70b into the base model
# ./karakuri-lm-70b-chat-v0.1 using the `dare_ties` merge method.
#
# NOTE(review): key semantics (density, weight filters, list-valued weights)
# are defined by the consuming merge tool — presumably mergekit; confirm
# against its documentation before changing values.

models:
  - model: ./karakuri-lm-70b-chat-v0.1
    # no parameters necessary for base model
  - model: ./tulu-2-dpo-70b  # follow user intent
    parameters:
      # presumably the fraction of delta weights kept; 1 would mean no
      # pruning — TODO confirm against the merge tool's docs
      density: 1
      # Per-tensor weights, selected by tensor-name filter. Each list
      # presumably describes a gradient interpolated across the layer
      # stack — TODO confirm.
      weight:
        - filter: mlp.down_proj
          value: [0.3, 0.25, 0.25, 0.15, 0.1]
        - filter: mlp.gate_proj
          value: [0.7, 0.25, 0.5, 0.45, 0.4]
        - filter: mlp.up_proj
          value: [0.7, 0.25, 0.5, 0.45, 0.4]
        - filter: self_attn
          value: [0.7, 0.25, 0.5, 0.45, 0.4]
        - value: 0  # fallback for rest of tensors.

merge_method: dare_ties
base_model: ./karakuri-lm-70b-chat-v0.1
dtype: bfloat16
tokenizer_source: union