mlfoundations-dev/llama2_oh_teknium_scaling_down_random_0.8 Text Generation • Updated 20 days ago • 10
mlfoundations-dev/llama2_oh_teknium_scaling_down_random_1.0 Text Generation • Updated 20 days ago • 10
mlfoundations-dev/llama2_oh_teknium_scaling_down_random_0.9 Text Generation • Updated 20 days ago • 10
mlfoundations-dev/llama2_oh_teknium_scaling_down_random_0.7 Text Generation • Updated 20 days ago • 8
mlfoundations-dev/oh-mistral-bs2048_lr5_00E-06_schedulercosine_with_min_lr_warmup5_00E-02_minlr5_00E-07 Text Generation • Updated 20 days ago • 8
mlfoundations-dev/oh-mistral-bs1024_lr5_00E-06_schedulercosine_with_min_lr_warmup5_00E-02_minlr5_00E-07 Text Generation • Updated 20 days ago • 9
mlfoundations-dev/oh-mistral-bs4096_lr5_00E-06_schedulercosine_with_min_lr_warmup5_00E-02_minlr5_00E-07 Text Generation • Updated 20 days ago • 20
mlfoundations-dev/oh-mistral-bs4096_lr2_00E-06_schedulercosine_with_min_lr_warmup5_00E-02_minlr5_00E-07 Text Generation • Updated 20 days ago • 12
mlfoundations-dev/oh-mistral-bs2048_lr2_00E-06_schedulercosine_with_min_lr_warmup5_00E-02_minlr5_00E-07 Text Generation • Updated 20 days ago • 9
mlfoundations-dev/oh-mistral-bs1024_lr2_00E-06_schedulercosine_with_min_lr_warmup5_00E-02_minlr5_00E-07 Text Generation • Updated 20 days ago • 11
mlfoundations-dev/oh-mistral-bs1024_lr5_00E-06_schedulercosine_with_min_lr_warmup1_00E-01_minlr5_00E-07 Text Generation • Updated 20 days ago • 11
mlfoundations-dev/oh-mistral-bs512_lr2_00E-06_schedulercosine_with_min_lr_warmup5_00E-02_minlr5_00E-07 Text Generation • Updated 20 days ago • 8
mlfoundations-dev/oh-mistral-bs512_lr5_00E-06_schedulercosine_with_min_lr_warmup1_00E-01_minlr5_00E-07 Text Generation • Updated 20 days ago • 7
mlfoundations-dev/oh-mistral-bs4096_lr5_00E-06_schedulercosine_with_min_lr_warmup1_00E-01_minlr5_00E-07 Text Generation • Updated 19 days ago • 7
mlfoundations-dev/oh-mistral-bs4096_lr2_00E-06_schedulercosine_with_min_lr_warmup1_00E-01_minlr5_00E-07 Text Generation • Updated 19 days ago • 8
mlfoundations-dev/oh-mistral-bs4096_lr2_00E-06_schedulerconstant_warmup1_00E-01_minlr Text Generation • Updated 19 days ago • 6
mlfoundations-dev/oh-mistral-bs2048_lr5_00E-06_schedulercosine_with_min_lr_warmup1_00E-01_minlr5_00E-07 Text Generation • Updated 19 days ago • 6
mlfoundations-dev/oh-mistral-bs2048_lr2_00E-06_schedulercosine_with_min_lr_warmup1_00E-01_minlr5_00E-07 Text Generation • Updated 19 days ago • 14
mlfoundations-dev/oh-mistral-bs2048_lr2_00E-06_schedulerconstant_warmup1_00E-01_minlr Text Generation • Updated 19 days ago • 14
mlfoundations-dev/oh-mistral-bs1024_lr2_00E-06_schedulercosine_with_min_lr_warmup1_00E-01_minlr5_00E-07 Text Generation • Updated 19 days ago • 8
mlfoundations-dev/oh-mistral-bs1024_lr2_00E-06_schedulerconstant_warmup1_00E-01_minlr Text Generation • Updated 19 days ago • 6
mlfoundations-dev/oh-mistral-bs512_lr2_00E-06_schedulerconstant_warmup1_00E-01_minlr Text Generation • Updated 19 days ago • 12
mlfoundations-dev/oh-mistral-bs512_lr2_00E-06_schedulercosine_with_min_lr_warmup1_00E-01_minlr5_00E-07 Text Generation • Updated 19 days ago • 6
mlfoundations-dev/llama3-1_8b_mlfoundations-dev-stackexchange_poker Text Generation • Updated 19 days ago • 109
mlfoundations-dev/llama3-1_8b_mlfoundations-dev-stackexchange_politics Text Generation • Updated 19 days ago • 120
mlfoundations-dev/llama3-1_8b_mlfoundations-dev-stackexchange_proofassistants Text Generation • Updated 19 days ago • 112
mlfoundations-dev/llama3-1_8b_mlfoundations-dev-stackexchange_puzzling Text Generation • Updated 19 days ago • 120
mlfoundations-dev/llama3-1_8b_mlfoundations-dev-stackexchange_quantumcomputing Text Generation • Updated 19 days ago • 97
mlfoundations-dev/llama3-1_8b_mlfoundations-dev-stackexchange_reverseengineering Text Generation • Updated 19 days ago • 82