# merge_ties.yml
#
# Model-merge recipe: combines two math-tuned 7B checkpoints on top of a shared
# base checkpoint using the TIES method. The key layout follows the mergekit
# YAML config schema (NOTE(review): presumably consumed via `mergekit-yaml` —
# confirm against the tooling that actually loads this file).

# 1. Overall merge method: TIES (sign-elect sparse task arithmetic)
merge_method: ties

# 2. Base model (all task vectors are computed relative to this checkpoint)
base_model: unsloth/DeepSeek-R1-Distill-Qwen-7B

# 3. Full models to merge (base first, then others)
#    Per-model parameters:
#      weight  - relative contribution of that model's task vector
#      density - fraction of task-vector entries kept after sparsification
models:
  - model: unsloth/DeepSeek-R1-Distill-Qwen-7B  # base has no extra params
  - model: nvidia/AceMath-7B-Instruct
    parameters:
      weight: 0.3
      density: 0.7
  - model: Qwen/Qwen2.5-Math-7B-Instruct
    parameters:
      weight: 0.7
      density: 0.7

# 4. Global merge parameters
parameters:
  # Normalize the per-model weights across the models contributing to a tensor.
  normalize: true
  # Use int8 for the intermediate sign-consensus mask instead of the tensor
  # dtype, to reduce memory use. This does NOT threshold or drop small values;
  # sparsification is controlled by `density` above.
  # NOTE(review): verify against the mergekit version in use.
  int8_mask: true

# 5. Data type for merged tensors
dtype: bfloat16