# Model-merge configuration: combines two source models with the `linear`
# merge method, giving each source an equal weight of 0.5.
# NOTE(review): the key layout matches a mergekit config — confirm the consumer.
# The nesting below was reconstructed after stray table-cell pipes ("| |") and
# lost indentation made the original text unparseable as YAML.
dtype: float16
merge_method: linear
slices:
- sources:
  # First source: layers selected by layer_range [0, 32].
  - layer_range: [0, 32]
    model: Alelcv27/llama3-8b-code-dpo
    parameters:
      weight: 0.5
  # Second source: same layer range, same weight.
  - layer_range: [0, 32]
    model: Alelcv27/llama3-8b-math-dpo
    parameters:
      weight: 0.5
# Model-merge configuration: combines two source models with the `linear`
# merge method, giving each source an equal weight of 0.5.
# NOTE(review): this block repeats the configuration that precedes it in this
# file; the repetition looks like an extraction artifact — confirm and keep a
# single copy, since repeated top-level keys are ambiguous in one YAML document.
# The nesting below was reconstructed after stray table-cell pipes ("| |") and
# lost indentation made the original text unparseable as YAML.
dtype: float16
merge_method: linear
slices:
- sources:
  # First source: layers selected by layer_range [0, 32].
  - layer_range: [0, 32]
    model: Alelcv27/llama3-8b-code-dpo
    parameters:
      weight: 0.5
  # Second source: same layer range, same weight.
  - layer_range: [0, 32]
    model: Alelcv27/llama3-8b-math-dpo
    parameters:
      weight: 0.5