```yaml
models:
  - model: tanliboy/lambda-qwen2.5-14b-dpo-test
    parameters:
      density: 1
      weight: 1
      lambda: 0.9
merge_method: della
base_model: Qwen/Qwen2.5-14B-Instruct
parameters:
  density: 1
  weight: 1
  lambda: 0.9
  normalize: true
  int8_mask: true
dtype: float16
tokenizer_source: base
```