# Model-merge configuration. The key names (merge_method, slices, sources,
# layer_range, density, weight) match mergekit's YAML schema.
# NOTE(review): the nesting below was restored from a flattened copy of this
# file; confirm it against the tool that consumes it.

# Reference model; the same path also appears as the first source below.
base_model:
  model:
    path: mllm-dev/gpt2_f_experiment_0_1000
dtype: float16
merge_method: dare_ties
# Global merge parameters.
parameters:
  normalize: 1.0
slices:
- sources:
  # First source is the base model itself; it carries no density/weight.
  - layer_range: [0, 12]
    model:
      model:
        path: mllm-dev/gpt2_f_experiment_0_1000
  # Each remaining source sets its own density and weight.
  - layer_range: [0, 12]
    model:
      model:
        path: mllm-dev/gpt2_f_experiment_1_1000
    parameters:
      density: 0.8
      weight: 0.3
  - layer_range: [0, 12]
    model:
      model:
        path: mllm-dev/gpt2_f_experiment_2_1000
    parameters:
      density: 0.6
      weight: 0.1
  - layer_range: [0, 12]
    model:
      model:
        path: mllm-dev/gpt2_f_experiment_3_1000
    parameters:
      density: 0.6
      weight: 0.1
  - layer_range: [0, 12]
    model:
      model:
        path: mllm-dev/gpt2_f_experiment_4_1000
    parameters:
      density: 0.8
      weight: 0.3