# Model-merge configuration (keys follow the mergekit config layout — TODO confirm
# against the tool version in use).
# Restored from a whitespace-mangled copy: stray trailing "| |" table residue was
# removed and the nesting was rebuilt from the key order; values are unchanged.

# Reference model for the merge.
base_model: Qwen/Qwen2.5-0.5B-Instruct
# Data type named for the merge output.
dtype: bfloat16
merge_method: task_arithmetic
# Global parameters applied to the whole merge.
parameters:
  normalize: true
# A single slice; every source contributes the same layer range [0, 24].
slices:
- sources:
  # First source: same model as base_model, with no per-source parameters.
  - layer_range: [0, 24]
    model: Qwen/Qwen2.5-0.5B-Instruct
  # NOTE(review): this source also names the base model, but carries weights;
  # presumably its difference from the base is zero — confirm this is intended.
  - layer_range: [0, 24]
    model: Qwen/Qwen2.5-0.5B-Instruct
    parameters:
      # Five-element weight list with alternating sign.
      weight: [1.0, -1.0, 1.0, -1.0, 1.0]
  # Only source that differs from base_model (Qwen2 rather than Qwen2.5).
  - layer_range: [0, 24]
    model: Qwen/Qwen2-0.5B-Instruct
    parameters:
      # NOTE(review): exact element-wise negation of the list above, so the two
      # lists sum to zero at every position; verify how normalize: true handles
      # a zero weight sum before relying on this config.
      weight: [-1.0, 1.0, -1.0, 1.0, -1.0]