# Model-merge configuration (mergekit-style schema).
# Blends two Llama-3-8B DPO fine-tunes: a math-tuned and a code-tuned checkpoint.

# Reference model for the merge; it also appears as the first source below.
base_model: Alelcv27/llama3-8b-math-dpo
# Data type requested for the merge.
dtype: float16
# Merge algorithm selector.
merge_method: slerp
parameters:
  # Interpolation factor between the two models.
  # NOTE(review): presumably 0 yields base_model and 1 yields the other model,
  # making 0.5 an even blend - confirm against the merge tool's documentation.
  t: 0.5
slices:
  # A single slice; both sources contribute the same layer range.
  - sources:
      # NOTE(review): [0, 32] presumably spans every transformer layer of an
      # 8B Llama-3 model - confirm the range bounds convention.
      - layer_range: [0, 32]
        model: Alelcv27/llama3-8b-math-dpo
      - layer_range: [0, 32]
        model: Alelcv27/llama3-8b-code-dpo