# Model-merge configuration.
# NOTE(review): the key layout (merge_method / slices / sources / layer_range)
# matches mergekit's config schema - confirm against the tool that consumes it.

# Reference model for the merge; it is also listed as the first source below.
base_model: Qwen/Qwen2.5-7B-Instruct
dtype: bfloat16
merge_method: slerp
parameters:
  # Interpolation factor. Per the mergekit docs, t = 0 yields base_model and
  # t = 1 yields the other model - TODO confirm for the version in use.
  t: 0.1
slices:
  - sources:
      # Both sources contribute the same layer span, [0, 28].
      - layer_range: [0, 28]
        model: Qwen/Qwen2.5-7B-Instruct
      - layer_range: [0, 28]
        model: Qwen/Qwen2.5-Math-7B