# mergekit configuration: passthrough self-merge of arcee-ai/Patent-Instruct-7b.
#
# The slices come in pairs, repeated for every 4-layer window from 0 to 32:
#   1. a plain copy of layers [N, N+4) of the source model;
#   2. a second copy of the last layer of that window ([N+3, N+4)) whose
#      tensors matching `o_proj` and `down_proj` are scaled by 0, while every
#      other tensor is scaled by 1 (the filterless entry is the fallback).
#
# NOTE(review): zeroing o_proj/down_proj presumably makes each duplicated layer
# contribute nothing to the residual stream at first (block-expansion style
# initialisation) - confirm against the intended training recipe.
# NOTE(review): assuming layer_range is half-open, the output has
# 8 * (4 + 1) = 40 layers - confirm.
slices:
  # --- layers 0-3, then a zero-scaled duplicate of layer 3 ---
  - sources:
      - model: arcee-ai/Patent-Instruct-7b
        layer_range: [0, 4]
  - sources:
      - model: arcee-ai/Patent-Instruct-7b
        layer_range: [3, 4]
        parameters:
          scale:
            - filter: o_proj
              value: 0
            - filter: down_proj
              value: 0
            - value: 1
  # --- layers 4-7, then a zero-scaled duplicate of layer 7 ---
  - sources:
      - model: arcee-ai/Patent-Instruct-7b
        layer_range: [4, 8]
  - sources:
      - model: arcee-ai/Patent-Instruct-7b
        layer_range: [7, 8]
        parameters:
          scale:
            - filter: o_proj
              value: 0
            - filter: down_proj
              value: 0
            - value: 1
  # --- layers 8-11, then a zero-scaled duplicate of layer 11 ---
  - sources:
      - model: arcee-ai/Patent-Instruct-7b
        layer_range: [8, 12]
  - sources:
      - model: arcee-ai/Patent-Instruct-7b
        layer_range: [11, 12]
        parameters:
          scale:
            - filter: o_proj
              value: 0
            - filter: down_proj
              value: 0
            - value: 1
  # --- layers 12-15, then a zero-scaled duplicate of layer 15 ---
  - sources:
      - model: arcee-ai/Patent-Instruct-7b
        layer_range: [12, 16]
  - sources:
      - model: arcee-ai/Patent-Instruct-7b
        layer_range: [15, 16]
        parameters:
          scale:
            - filter: o_proj
              value: 0
            - filter: down_proj
              value: 0
            - value: 1
  # --- layers 16-19, then a zero-scaled duplicate of layer 19 ---
  - sources:
      - model: arcee-ai/Patent-Instruct-7b
        layer_range: [16, 20]
  - sources:
      - model: arcee-ai/Patent-Instruct-7b
        layer_range: [19, 20]
        parameters:
          scale:
            - filter: o_proj
              value: 0
            - filter: down_proj
              value: 0
            - value: 1
  # --- layers 20-23, then a zero-scaled duplicate of layer 23 ---
  - sources:
      - model: arcee-ai/Patent-Instruct-7b
        layer_range: [20, 24]
  - sources:
      - model: arcee-ai/Patent-Instruct-7b
        layer_range: [23, 24]
        parameters:
          scale:
            - filter: o_proj
              value: 0
            - filter: down_proj
              value: 0
            - value: 1
  # --- layers 24-27, then a zero-scaled duplicate of layer 27 ---
  - sources:
      - model: arcee-ai/Patent-Instruct-7b
        layer_range: [24, 28]
  - sources:
      - model: arcee-ai/Patent-Instruct-7b
        layer_range: [27, 28]
        parameters:
          scale:
            - filter: o_proj
              value: 0
            - filter: down_proj
              value: 0
            - value: 1
  # --- layers 28-31, then a zero-scaled duplicate of layer 31 ---
  - sources:
      - model: arcee-ai/Patent-Instruct-7b
        layer_range: [28, 32]
  - sources:
      - model: arcee-ai/Patent-Instruct-7b
        layer_range: [31, 32]
        parameters:
          scale:
            - filter: o_proj
              value: 0
            - filter: down_proj
              value: 0
            - value: 1
# Slices are concatenated without blending weights between models.
merge_method: passthrough
# Data type named for the merge.
dtype: bfloat16