# Model-merge configuration. The keys follow the mergekit config schema
# (NOTE(review): presumably consumed by mergekit -- confirm against the caller).
models:
  # Pivot model (the same checkpoint is referenced by `base_model` below)
  - model: Qwen/Qwen2.5-7B-Instruct-1M
  # Target models
  - model: open-r1/OpenR1-Qwen-7B
  - model: open-thoughts/OpenThinker-7B
  - model: NovaSky-AI/Sky-T1-mini
  - model: deepseek-ai/DeepSeek-R1-Distill-Qwen-7B
merge_method: sce
base_model: Qwen/Qwen2.5-7B-Instruct-1M
parameters:
  # NOTE(review): per the mergekit docs this is the fraction of
  # highest-variance delta elements to retain, so 1.0 should keep all of
  # them -- verify against the mergekit version in use.
  select_topk: 1.0
dtype: bfloat16