# Model-merge configuration.
# NOTE(review): the key layout (models / parameters.weight / merge_method /
# dtype) matches the mergekit YAML schema — confirm the consuming tool.
#
# Two source models are combined with merge_method "linear"; each entry's
# `weight` is that model's coefficient in the combination (0.7 + 0.3 = 1.0).
models:
  - model: /models/14b-code-execution-15k-400steps-lr1e-5-2-blocks
    parameters:
      weight: 0.7
  - model: /models/14b-r1-sdg-all-public-2m-8epochs-lr1e-4-minlr1e-7-warm1600
    parameters:
      weight: 0.3
merge_method: linear
# dtype requested for the merge.
# NOTE(review): presumably the dtype of the written tensors — verify against
# the tool's documentation.
dtype: bfloat16