# mergekit merge configuration.
# Combines the listed source models with the `task_arithmetic` method,
# using Qwen/Qwen2.5-0.5B-Instruct as the base model.
base_model: Qwen/Qwen2.5-0.5B-Instruct
dtype: bfloat16
merge_method: task_arithmetic
parameters:
  # Global merge parameter: weights are used as given, not normalized.
  normalize: false
slices:
- sources:
  # First source: the base model itself, listed without a weight.
  - layer_range: [0, 24]
    model: Qwen/Qwen2.5-0.5B-Instruct
  # NOTE(review): this source is the same checkpoint as base_model, so its
  # contribution relative to the base is presumably zero -- confirm intent.
  - layer_range: [0, 24]
    model: Qwen/Qwen2.5-0.5B-Instruct
    parameters:
      weight: 1.0
  # Negative weight: this model's contribution is subtracted rather than added.
  - layer_range: [0, 24]
    model: Qwen/Qwen2-0.5B-Instruct
    parameters:
      weight: -1.0