# Merge configuration (mergekit-style YAML).
#
# Two models are combined with the `linear` method using weights 1.0 and 0.0,
# so the second model contributes nothing to the weighted sum of ordinary
# tensors. The tokenizer section below is where the second model is actually
# used: the tokenizer and the listed special-token embeddings are sourced
# from it.
#
# NOTE(review): all model paths are absolute paths on one developer's machine;
# adjust them (or replace with hub IDs) before running elsewhere.

merge_method: linear

# Arithmetic is carried out in float32; the written checkpoint is bfloat16.
dtype: float32
out_dtype: bfloat16

models:
  # Contributes the full weight of the linear combination.
  - model: /Users/jsarnecki/opt/Workspace/meta-llama/Llama-3.1-8B
    parameters:
      weight: 1.0
  # Weight 0.0: listed so it participates in the merge (and can act as a
  # tokenizer / embedding source) without affecting the averaged weights.
  - model: /Users/jsarnecki/opt/Workspace/NousResearch/Hermes-3-Llama-3.1-8B
    parameters:
      weight: 0.0

tokenizer:
  # Tokenizer for the output model is taken from this model.
  source: /Users/jsarnecki/opt/Workspace/NousResearch/Hermes-3-Llama-3.1-8B
  # Per-token overrides. Each entry names the model whose embedding should be
  # used for that token. `force: true` presumably applies the override even
  # when the token already exists in the other model's vocabulary -- confirm
  # against the mergekit tokenizer documentation.
  # Keys are quoted so the `|`, `<` and `>` characters are never interpreted
  # as YAML syntax.
  tokens:
    "<|start_header_id|>":
      source: /Users/jsarnecki/opt/Workspace/NousResearch/Hermes-3-Llama-3.1-8B
      force: true
    "<|end_header_id|>":
      source: /Users/jsarnecki/opt/Workspace/NousResearch/Hermes-3-Llama-3.1-8B
      force: true
    "<|eot_id|>":
      source: /Users/jsarnecki/opt/Workspace/NousResearch/Hermes-3-Llama-3.1-8B
      force: true
    "<|begin_of_text|>":
      source: /Users/jsarnecki/opt/Workspace/NousResearch/Hermes-3-Llama-3.1-8B
      force: true
    "<|end_of_text|>":
      source: /Users/jsarnecki/opt/Workspace/NousResearch/Hermes-3-Llama-3.1-8B
      force: true
    "<|im_start|>":
      source: /Users/jsarnecki/opt/Workspace/NousResearch/Hermes-3-Llama-3.1-8B
      force: true
    "<|im_end|>":
      source: /Users/jsarnecki/opt/Workspace/NousResearch/Hermes-3-Llama-3.1-8B
      force: true