# mergekit configuration: dare_ties merge of three kyujinpy Sakura models,
# with kyujinpy/Sakura-SOLAR-Instruct as the base model.
models:
  # Same checkpoint as `base_model` below.
  - model: kyujinpy/Sakura-SOLAR-Instruct
    parameters:
      density: 1.0
      weight: 1.0
  - model: kyujinpy/Sakura-SOLRCA-Math-Instruct-DPO-v2
    parameters:
      density: 0.5
      # List-valued parameter.
      # NOTE(review): presumably a mergekit gradient interpolated across
      # layers -- confirm against the mergekit docs.
      weight: [0.33, 0.4, 0.33]
  - model: kyujinpy/Sakura-SOLRCA-Instruct-DPO
    parameters:
      # List-valued parameter (see NOTE on the list-valued weight above).
      density: [0.33, 0.45, 0.66]
      weight: 0.66
merge_method: dare_ties
base_model: kyujinpy/Sakura-SOLAR-Instruct
# Global parameters (not tied to a single model entry).
parameters:
  normalize: true
  int8_mask: true
dtype: bfloat16
tokenizer_source: union
# Disabled alternative, kept for reference: SLERP merge of two SOLAR models.
# slices:
#   - sources:
#       - model: upstage/SOLAR-10.7B-Instruct-v1.0
#         layer_range: [0, 48]
#       - model: beomi/OPEN-SOLAR-KO-10.7B
#         layer_range: [0, 48]
## or, the equivalent models: syntax:
## models:
##   - model: psmathur/orca_mini_v3_13b
##   - model: garage-bAInd/Platypus2-13B
# merge_method: slerp
# base_model: upstage/SOLAR-10.7B-Instruct-v1.0
# parameters:
#   t:
#     - filter: self_attn
#       value: [0, 0.5, 0.3, 0.7, 1]
#     - filter: mlp
#       value: [1, 0.5, 0.7, 0.3, 0]
#     - value: 0.5  # fallback for rest of tensors
# dtype: float16