# mergekit configuration: SLERP merge of two Qwen2.5 1.5B checkpoints.
# NOTE(review): reconstructed from a flattened, duplicated copy of this config;
# nesting follows the standard mergekit schema -- confirm against the original.

# Model treated as the base (the t = 0 endpoint) of the interpolation.
base_model: Qwen/Qwen2.5-1.5B-Instruct
# Data type used for the merged weights.
dtype: bfloat16
merge_method: slerp
parameters:
  # Interpolation factor. Per the mergekit docs, t = 0 returns base_model and
  # t = 1 returns the other model, so 0.1 stays close to the Instruct weights.
  t: 0.1
slices:
- sources:
  # Both sources use the same layer range so layers are merged pairwise.
  # Presumably [0, 28] spans every decoder layer of these models -- verify.
  - layer_range: [0, 28]
    model: Qwen/Qwen2.5-1.5B-Instruct
  - layer_range: [0, 28]
    model: Qwen/Qwen2.5-Math-1.5B