# Linear merge of ./Qwen3-32B-Upscaled and ./Qwen2.5-72B-Instruct-Aligned,
# assembled from three consecutive layer slices and written out as bfloat16.
merge_method: linear
base_model: ./Qwen3-32B-Upscaled
dtype: bfloat16
slices:
  # NOTE(review): each slice repeats `merge_method: linear`, matching the
  # top-level setting; confirm the merge tool actually reads a per-slice key.

  # Slice 1: layer_range [0, 32] of both models, blended with equal weights.
  - merge_method: linear
    sources:
      - model: ./Qwen3-32B-Upscaled
        layer_range: [0, 32]
        parameters:
          weight: 0.5
      - model: ./Qwen2.5-72B-Instruct-Aligned
        layer_range: [0, 32]
        parameters:
          weight: 0.5

  # Slice 2: layer_range [32, 48]; the Qwen2.5 source carries weight 1.0 and
  # the Qwen3 source weight 0.0.
  # NOTE(review): the Qwen3 range [32, 48] is also covered by the next slice's
  # [32, 64]; presumably intentional since its weight here is 0.0 - confirm.
  - merge_method: linear
    sources:
      - model: ./Qwen3-32B-Upscaled
        layer_range: [32, 48]
        parameters:
          weight: 0.0
      - model: ./Qwen2.5-72B-Instruct-Aligned
        layer_range: [32, 48]
        parameters:
          weight: 1.0

  # Slice 3: Qwen3 layer_range [32, 64] paired with Qwen2.5 layer_range
  # [48, 80], blended with equal weights.
  - merge_method: linear
    sources:
      - model: ./Qwen3-32B-Upscaled
        layer_range: [32, 64]
        parameters:
          weight: 0.5
      - model: ./Qwen2.5-72B-Instruct-Aligned
        layer_range: [48, 80]
        parameters:
          weight: 0.5
tokenizer_source: ./Qwen3-32B-Upscaled