File size: 262 Bytes
6a2ef4f
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
# Model-merge config (keys follow the mergekit schema): spherical linear
# interpolation (slerp) between Qwen2.5-Math-1.5B, which is also the base
# model, and Qwen2.5-Coder-1.5B.
models:
  - model: Qwen/Qwen2.5-Math-1.5B
  - model: Qwen/Qwen2.5-Coder-1.5B
merge_method: slerp
base_model: Qwen/Qwen2.5-Math-1.5B
dtype: bfloat16
parameters:
  # Interpolation factor given as a gradient across layer depth. Per the
  # mergekit docs, t=0 returns base_model and t=1 returns the other model,
  # so this curve keeps Qwen2.5-Math for the input & output layers and
  # shifts to Qwen2.5-Coder in the middle layers.
  t: [0, 0.5, 1, 0.5, 0]