# mergekit configuration: combine the models listed below with the
# `model_stock` merge method, using `base_model` as the reference checkpoint.

# Data type requested for the merged output weights.
out_dtype: bfloat16
merge_method: model_stock
base_model: meta-llama/Llama-3.1-8B-Instruct

# Checkpoints to merge.
# NOTE(review): several entries are named "L3" / "llama-3" rather than "3.1";
# confirm they are compatible (architecture, tokenizer) with the base model.
models:
  - model: meta-llama/Llama-3.1-8B
  - model: arcee-ai/Llama-3.1-SuperNova-Lite
  - model: deepseek-ai/DeepSeek-R1-Distill-Llama-8B
  - model: Skywork/Skywork-o1-Open-Llama-3.1-8B
  - model: AtlaAI/Selene-1-Mini-Llama-3.1-8B
  - model: ruslandev/llama-3-8b-samantha
  - model: MathGenie/MathCoder2-Llama-3-8B
  - model: sethuiyer/Llamaverse-3.1-8B-Instruct
  - model: NousResearch/Hermes-3-Llama-3.1-8B
  - model: Casual-Autopsy/L3-Umbral-Mind-RP-v3.0-8B
  - model: nothingiisreal/L3.1-8B-Celeste-V1.5
  - model: Sao10K/L3-8B-Lunaris-v1
  - model: Casual-Autopsy/L3-Super-Nova-RP-8B
  - model: mergekit-community/L3-Boshima-a