| models: | |
| - model: deepseek-ai/DeepSeek-R1-Distill-Llama-8B | |
| - model: Sao10K/L3-8B-Stheno-v3.2 | |
| merge_method: slerp | |
| base_model: deepseek-ai/DeepSeek-R1-Distill-Llama-8B | |
| dtype: bfloat16 | |
| parameters: | |
| t: [0, 0.5, 1, 0.5, 0] # V-shaped curve: DeepSeek-R1-Distill-Llama-8B (base model, t=0) for input & output layers, L3-8B-Stheno-v3.2 (t=1) in the middle layers | |