# Merge configuration: a passthrough merge built from two slices of the
# same source model.
base_model: Qwen/Qwen2.5-14B-Instruct-1M
merge_method: passthrough
# Each slice takes layer_range [0, 48] from the same model.
# NOTE(review): presumably the slices are concatenated in the order listed,
# so the same layer range appears twice in the output - confirm against the
# merge tool's documentation.
slices:
  - sources:
      - model: Qwen/Qwen2.5-14B-Instruct-1M
        layer_range: [0, 48]
  - sources:
      - model: Qwen/Qwen2.5-14B-Instruct-1M
        layer_range: [0, 48]
dtype: bfloat16
# NOTE(review): this configuration repeats the one immediately above it
# key-for-key. Duplicate top-level keys in a single YAML mapping are not
# allowed by the YAML spec; if the repetition is an extraction artifact,
# keep only one copy.
base_model: Qwen/Qwen2.5-14B-Instruct-1M
merge_method: passthrough
# Two slices, each taking layer_range [0, 48] from the same model.
slices:
  - sources:
      - model: Qwen/Qwen2.5-14B-Instruct-1M
        layer_range: [0, 48]
  - sources:
      - model: Qwen/Qwen2.5-14B-Instruct-1M
        layer_range: [0, 48]
dtype: bfloat16