mlfoundations-dev/mistral_7b_0-3_oh-dcft-v3.1-llama-3.1-70b Text Generation • Updated Dec 20, 2024 • 8
mlfoundations-dev/mistral_7b_0-3_oh-dcft-v3.1-llama-3.1-8b Text Generation • Updated Dec 20, 2024 • 8
mlfoundations-dev/mistral_7b_0-3_oh-dcft-v3.1-llama-3.1-nemotron-70b Text Generation • Updated Dec 20, 2024 • 9
mlfoundations-dev/mistral_7b_0-3_oh-dcft-v3.1-llama-3.2-1b Text Generation • Updated Dec 20, 2024 • 8
mlfoundations-dev/mistral_7b_0-3_oh-dcft-v3.1-llama-3.2-3b Text Generation • Updated Dec 20, 2024 • 8
mlfoundations-dev/mistral_7b_0-3_oh-dcft-v3.1-llama-3.3-70b Text Generation • Updated Dec 20, 2024 • 11
mlfoundations-dev/mistral_7b_0-3_oh-dcft-v3.1-qwen-2.5-72b Text Generation • Updated Dec 20, 2024 • 8
mlfoundations-dev/mistral_7b_0-3_oh-dcft-v3.1-claude-3-5-haiku-20241022 Text Generation • Updated Dec 20, 2024 • 22 • 1
mlfoundations-dev/mistral_7b_0-3_oh-dcft-v3.1-llama-3.1-405b Text Generation • Updated Dec 20, 2024 • 10
mlfoundations-dev/oh-mistral-bs512_lr5_00E-06_schedulercosine_with_min_lr_warmup5_00E-02_minlr5_00E-07 Text Generation • Updated Dec 23, 2024 • 8
mlfoundations-dev/oh-mistral-bs2048_lr5_00E-06_schedulercosine_with_min_lr_warmup5_00E-02_minlr5_00E-07 Text Generation • Updated Dec 23, 2024 • 8
mlfoundations-dev/oh-mistral-bs1024_lr5_00E-06_schedulercosine_with_min_lr_warmup5_00E-02_minlr5_00E-07 Text Generation • Updated Dec 23, 2024 • 8
mlfoundations-dev/oh-mistral-bs4096_lr5_00E-06_schedulercosine_with_min_lr_warmup5_00E-02_minlr5_00E-07 Text Generation • Updated Dec 24, 2024 • 8
mlfoundations-dev/oh-mistral-bs4096_lr2_00E-06_schedulercosine_with_min_lr_warmup5_00E-02_minlr5_00E-07 Text Generation • Updated Dec 24, 2024 • 8
mlfoundations-dev/oh-mistral-bs2048_lr2_00E-06_schedulercosine_with_min_lr_warmup5_00E-02_minlr5_00E-07 Text Generation • Updated Dec 24, 2024 • 8
mlfoundations-dev/oh-mistral-bs1024_lr2_00E-06_schedulercosine_with_min_lr_warmup5_00E-02_minlr5_00E-07 Text Generation • Updated Dec 24, 2024 • 8
mlfoundations-dev/oh-mistral-bs1024_lr5_00E-06_schedulercosine_with_min_lr_warmup1_00E-01_minlr5_00E-07 Text Generation • Updated Dec 24, 2024 • 8
mlfoundations-dev/oh-mistral-bs512_lr2_00E-06_schedulercosine_with_min_lr_warmup5_00E-02_minlr5_00E-07 Text Generation • Updated Dec 24, 2024 • 8
mlfoundations-dev/oh-mistral-bs512_lr5_00E-06_schedulercosine_with_min_lr_warmup1_00E-01_minlr5_00E-07 Text Generation • Updated Dec 24, 2024 • 8
mlfoundations-dev/oh-mistral-bs4096_lr5_00E-06_schedulercosine_with_min_lr_warmup1_00E-01_minlr5_00E-07 Text Generation • Updated Dec 24, 2024 • 8
mlfoundations-dev/oh-mistral-bs4096_lr2_00E-06_schedulercosine_with_min_lr_warmup1_00E-01_minlr5_00E-07 Text Generation • Updated Dec 24, 2024 • 8
mlfoundations-dev/oh-mistral-bs4096_lr2_00E-06_schedulerconstant_warmup1_00E-01_minlr Text Generation • Updated Dec 24, 2024 • 8
mlfoundations-dev/oh-mistral-bs2048_lr5_00E-06_schedulercosine_with_min_lr_warmup1_00E-01_minlr5_00E-07 Text Generation • Updated Dec 24, 2024 • 8
mlfoundations-dev/oh-mistral-bs2048_lr2_00E-06_schedulercosine_with_min_lr_warmup1_00E-01_minlr5_00E-07 Text Generation • Updated Dec 24, 2024 • 9
mlfoundations-dev/oh-mistral-bs2048_lr2_00E-06_schedulerconstant_warmup1_00E-01_minlr Text Generation • Updated Dec 24, 2024 • 10
mlfoundations-dev/oh-mistral-bs1024_lr2_00E-06_schedulercosine_with_min_lr_warmup1_00E-01_minlr5_00E-07 Text Generation • Updated Dec 24, 2024 • 8
mlfoundations-dev/oh-mistral-bs1024_lr2_00E-06_schedulerconstant_warmup1_00E-01_minlr Text Generation • Updated Dec 24, 2024 • 8
mlfoundations-dev/oh-mistral-bs512_lr2_00E-06_schedulerconstant_warmup1_00E-01_minlr Text Generation • Updated Dec 25, 2024 • 8
mlfoundations-dev/oh-mistral-bs512_lr2_00E-06_schedulercosine_with_min_lr_warmup1_00E-01_minlr5_00E-07 Text Generation • Updated Dec 25, 2024 • 8