---
# Model-merge configuration (key layout matches the mergekit config schema —
# confirm against the tool that consumes this file).
# Three fine-tuned checkpoints are combined onto a shared base model using the
# `ties` merge method.

# Source models to merge; each entry carries its own per-model parameters.
models:
  - model: PowerInfer/SmallThinker-3B-Preview
    parameters:
      # A list value is a gradient rather than a single constant
      # (presumably interpolated across layers — see the tool's docs).
      density: [1, 0.7, 0.1]  # density gradient
      weight: 1.0
  - model: bunnycore/Qwen2.5-3B-RP-Mix
    parameters:
      density: 0.5
      weight: [0, 0.3, 0.7, 1]  # weight gradient
  - model: Spestly/Athena-1-3B
    parameters:
      density: 0.33
      # Conditional weight: 0.5 where the `mlp` filter applies, 0 otherwise
      # (presumably the filter matches on tensor names — TODO confirm).
      weight:
        - filter: mlp
          value: 0.5
        - value: 0

merge_method: ties
base_model: Qwen/Qwen2.5-3B-Instruct

# Global parameters for the merge as a whole (not tied to a single model).
parameters:
  normalize: true
  int8_mask: true

# Kept as a plain string scalar naming the data type.
dtype: float16