File size: 262 Bytes
6a2ef4f |
1 2 3 4 5 6 7 8 9 |
# Model-merge configuration (mergekit-style keys): spherical linear
# interpolation (slerp) between two Qwen2.5 1.5B checkpoints.
models:
  - model: Qwen/Qwen2.5-Math-1.5B
  - model: Qwen/Qwen2.5-Coder-1.5B
merge_method: slerp
# For slerp, base_model is the endpoint that t=0 maps to.
base_model: Qwen/Qwen2.5-Math-1.5B
dtype: bfloat16
parameters:
  # Interpolation-factor gradient across the layer stack. Per the mergekit
  # documentation, t=0 yields base_model and t=1 yields the other model, so
  # this V-shaped curve keeps Qwen2.5-Math at the input & output layers and
  # shifts to Qwen2.5-Coder in the middle layers.
  t: [0, 0.5, 1, 0.5, 0]
|