# SLERP merge of two Mistral-7B fine-tunes.
# NOTE(review): the key layout matches the mergekit config schema - confirm
# against the tool that consumes this file.
models:
  - model: NousResearch/Nous-Hermes-2-Mistral-7B-DPO
  - model: mlabonne/AlphaMonarch-7B
merge_method: slerp
base_model: NousResearch/Nous-Hermes-2-Mistral-7B-DPO
dtype: bfloat16
parameters:
  # V-shaped interpolation curve across the layer stack: t = 0 at both ends
  # keeps Hermes (the base model) for the input & output layers, while t = 1
  # in the middle selects the other listed model, AlphaMonarch.
  t: [0, 0.5, 1, 0.5, 0]