# Merge configuration: combines two R3-Qwen3-4B checkpoints using the
# `linear` merge method, each with weight 0.5.
# NOTE(review): layout matches a mergekit config -- confirm the consuming tool.
# The original text repeated this whole stanza twice (duplicate top-level keys)
# and carried trailing table-pipe residue on every line; both were removed
# without changing any values.
models:
  - model: rubricreward/R3-Qwen3-4B-4k
    parameters:
      weight: 0.5
  - model: rubricreward/R3-Qwen3-4B-14k
    parameters:
      weight: 0.5
merge_method: linear
# Data type named for the merge; presumably the output tensor dtype -- confirm.
dtype: bfloat16