---
# Model-merge configuration (key layout matches a mergekit-style recipe).
# Combines the listed models onto `base_model` using `merge_method`.

# Models taking part in the merge.
models:
  - model: Theros/Qwen2.5-ColdBrew-R1-test2
  - model: Theros/Qwen2.5-CreativeMix-7B
  - model: deepseek-ai/DeepSeek-R1-Distill-Qwen-7B
    # Per-model override; applies only to this entry.
    # NOTE(review): confirm the chosen merge method actually consumes
    # `weight` -- it is set for this one model only.
    parameters:
      weight: 0.4

# Reference checkpoint the merge is computed against.
# NOTE(review): this is "...-test" while the list above and
# `tokenizer_source` use "...-test2" -- confirm that is intentional.
base_model: Theros/Qwen2.5-ColdBrew-R1-test

merge_method: model_stock

# No global merge parameters are set; written as an explicit empty mapping
# rather than a bare `parameters:` (which parses as null).
parameters: {}

# NOTE(review): kept as a top-level key; verify it was not meant to be
# nested under `parameters`.
dtype: bfloat16

# Repository the output tokenizer is taken from.
tokenizer_source: Theros/Qwen2.5-ColdBrew-R1-test2