# Layer-wise merge recipe (keys follow the mergekit configuration schema).
#
# The 28 layers are split into four consecutive 7-layer slices. Every slice
# takes the same layer range from both source models and carries its own
# `parameters` block; `lambda` steps up 0 -> 0.25 -> 0.5 -> 0.75 from the first
# slice to the last, while `weight` is the same two-point list in every slice.
#
# NOTE(review): the original indentation was lost, so the nesting below is
# reconstructed. `parameters` is placed at slice level (sibling of `sources`);
# if it was meant to belong to the second source model only, indent it under
# that model entry instead -- confirm against the intended recipe.
# NOTE(review): `weight: [0, 1]` is presumably a gradient interpolated across
# the layers of the slice -- confirm against the merge tool's documentation.
slices:
  # Layers 0-6
  - sources:
      - model: Qwen/Qwen2.5-7B-Instruct
        layer_range: [0, 7]
      - model: Qwen/Qwen2.5-Math-7B-Instruct
        layer_range: [0, 7]
    parameters:
      weight: [0, 1]
      lambda: 0
  # Layers 7-13
  - sources:
      - model: Qwen/Qwen2.5-7B-Instruct
        layer_range: [7, 14]
      - model: Qwen/Qwen2.5-Math-7B-Instruct
        layer_range: [7, 14]
    parameters:
      weight: [0, 1]
      lambda: 0.25
  # Layers 14-20
  - sources:
      - model: Qwen/Qwen2.5-7B-Instruct
        layer_range: [14, 21]
      - model: Qwen/Qwen2.5-Math-7B-Instruct
        layer_range: [14, 21]
    parameters:
      weight: [0, 1]
      lambda: 0.5
  # Layers 21-27
  - sources:
      - model: Qwen/Qwen2.5-7B-Instruct
        layer_range: [21, 28]
      - model: Qwen/Qwen2.5-Math-7B-Instruct
        layer_range: [21, 28]
    parameters:
      weight: [0, 1]
      lambda: 0.75
merge_method: task_arithmetic
# The base model is also the first source in every slice.
base_model: Qwen/Qwen2.5-7B-Instruct
dtype: float16