---
# mergekit configuration: combines the two listed models using the `sce`
# merge method, relative to the given base model.
merge_method: sce

# Models whose weights are merged.
models:
  - model: Qwen/QwQ-32B
  - model: Qwen/Qwen2.5-Coder-32B-Instruct

# Common base checkpoint that the merge is computed against.
base_model: Qwen/Qwen2.5-Coder-32B

parameters:
  # NOTE(review): presumably the fraction of highest-variance elements kept
  # by SCE (1 = keep all) — confirm against the mergekit docs.
  select_topk: 1

# Data type used for the merge.
dtype: bfloat16

# The merged model takes its tokenizer from this model.
tokenizer_source: Qwen/QwQ-32B

# NOTE(review): these two keys follow the top-level `dtype` and
# `tokenizer_source` keys in the original, so they are kept at top level.
# mergekit usually expects them under `parameters:` — confirm that they are
# actually honoured in this position.
normalize: true
int8_mask: true
---
# NOTE(review): this document repeats the configuration that precedes it in
# this file, key for key. It is kept as a separate YAML document so the
# top-level keys do not collide — confirm whether the duplicate is intended.
#
# mergekit configuration: combines the two listed models using the `sce`
# merge method, relative to the given base model.
merge_method: sce

# Models whose weights are merged.
models:
  - model: Qwen/QwQ-32B
  - model: Qwen/Qwen2.5-Coder-32B-Instruct

# Common base checkpoint that the merge is computed against.
base_model: Qwen/Qwen2.5-Coder-32B

parameters:
  # NOTE(review): presumably the fraction of highest-variance elements kept
  # by SCE (1 = keep all) — confirm against the mergekit docs.
  select_topk: 1

# Data type used for the merge.
dtype: bfloat16

# The merged model takes its tokenizer from this model.
tokenizer_source: Qwen/QwQ-32B

# NOTE(review): these two keys follow the top-level `dtype` and
# `tokenizer_source` keys in the original, so they are kept at top level.
# mergekit usually expects them under `parameters:` — confirm that they are
# actually honoured in this position.
normalize: true
int8_mask: true