File size: 338 Bytes
83de635
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13

# Model-merge recipe. The key layout looks like a mergekit config;
# confirm against the tool that consumes this file.

# Global settings: output dtype, merge algorithm, tokenizer handling.
dtype: bfloat16
merge_method: dare_ties
tokenizer_source: union

# Base checkpoint. It is also the first entry of `models` below.
base_model: tokyotech-llm/Llama-3.1-Swallow-8B-Instruct-v0.1

# Checkpoints taking part in the merge, in their original order.
models:
  # Base model entry: intentionally carries no `parameters` mapping.
  - model: tokyotech-llm/Llama-3.1-Swallow-8B-Instruct-v0.1
  # Second checkpoint, with per-model merge parameters.
  # NOTE(review): exact semantics of `weight` / `density` are defined by
  # the chosen merge_method; verify in the tool's documentation.
  - model: NousResearch/Hermes-3-Llama-3.1-8B
    parameters:
      weight: 1
      density: 0.525