---
# merge_ties.yml
#
# mergekit configuration: combines two math-tuned 7B checkpoints onto a shared
# base checkpoint using the TIES merge method.

# 1. Overall merge method: TIES (trim task vectors, elect a sign per
#    parameter, then merge only the entries that agree with the elected sign).
merge_method: ties

# 2. Base model (all task vectors are computed relative to this checkpoint).
base_model: unsloth/DeepSeek-R1-Distill-Qwen-7B

# 3. Full models to merge (base first, then others).
#    Per-model parameters:
#      weight  - relative contribution of the model's task vector
#      density - fraction of the task vector's entries kept after trimming
models:
  - model: unsloth/DeepSeek-R1-Distill-Qwen-7B  # base has no extra params
  - model: nvidia/AceMath-7B-Instruct
    parameters:
      weight: 0.7
      density: 0.7
  - model: Qwen/Qwen2.5-Math-7B-Instruct
    parameters:
      weight: 0.3
      density: 0.7

# 4. Global merge parameters.
parameters:
  # Normalize the per-model weights across the models being merged.
  normalize: true
  # Store the intermediate sparsification masks as int8 to reduce memory use
  # (per the mergekit docs; this does not change which values are kept).
  int8_mask: true

# 5. Data type for merged tensors.
dtype: bfloat16