# Merge configuration: one fine-tuned model merged onto a base model with the
# `della` merge method.
# NOTE(review): nesting was reconstructed from a flattened copy of this file
# (table-cell residue removed); confirm against the original config.
models:
  - model: tanliboy/lambda-qwen2.5-14b-dpo-test
    # Per-model settings for this entry.
    parameters:
      density: 1
      weight: 1
      lambda: 0.9
merge_method: della
base_model: Qwen/Qwen2.5-14B-Instruct
# Global settings. density/weight/lambda repeat the per-model values above.
parameters:
  density: 1
  weight: 1
  lambda: 0.9
  normalize: true
  int8_mask: true
dtype: float16
# NOTE(review): presumably selects the tokenizer of `base_model` -- confirm.
tokenizer_source: base