---
# Merge configuration: combines three R3-Qwen3-14B variants with the `ties`
# merge method, using Qwen/Qwen3-14B as the base model.
# NOTE(review): the key layout matches a mergekit config — confirm against
# the tool that consumes this file.

# Models to merge; each entry carries its own `weight` parameter.
# The three weights below sum to 1.0.
models:
  - model: rubricreward/R3-Qwen3-14B-LoRA-4k
    parameters:
      weight: 0.4
  - model: rubricreward/R3-Qwen3-14B-4k
    parameters:
      weight: 0.3
  - model: rubricreward/R3-Qwen3-14B-14k
    parameters:
      weight: 0.3

merge_method: ties
base_model: Qwen/Qwen3-14B

# NOTE(review): `lambda` is kept at the top level exactly as in the original.
# Some merge tools expect method-wide options under a top-level `parameters:`
# mapping — verify this key is actually read where it is placed.
lambda: 1.0

dtype: bfloat16