File size: 582 Bytes
734c5b7
 
 
 
 
d45aaec
734c5b7
 
d45aaec
 
734c5b7
 
d45aaec
734c5b7
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15

# Linear merge configuration (the keys look like a mergekit config; confirm
# against the consuming tool).
#
# NOTE(review): both sources below name the same model, the same layer_range
# and the same weight, so the two inputs to the merge are identical. This does
# not split the model into a down-weighted "first half" and a preserved
# "second half"; if such a split was intended, the layer ranges and/or the
# weights must differ between the two sources. Confirm intent before changing
# any values.
dtype: bfloat16
merge_method: linear
slices:
  - sources:
      # Source 1: layer_range [0, 32] at weight 1.0 (no reduction applied).
      - layer_range: [0, 32]
        model: NousResearch/Meta-Llama-3-8B-Instruct
        parameters:
          weight: 1.0
      # Source 2: same model, layer_range and weight as source 1.
      - layer_range: [0, 32]
        model: NousResearch/Meta-Llama-3-8B-Instruct
        parameters:
          weight: 1.0