mlfoundations-dev/hp_ablations_mistral_lr2e-6_dcftv1.2
Text Generation
•
7B
•
Updated
•
3
mlfoundations-dev/hp_ablations_mistral_lr1e-5_dcftv1.2
Text Generation
•
7B
•
Updated
•
2
mlfoundations-dev/hp_ablations_mistral_adambeta2_0.995_dcftv1.2
Text Generation
•
7B
•
Updated
•
3
mlfoundations-dev/hp_ablations_mistral_adambeta2_0.95_dcftv1.2
Text Generation
•
7B
•
Updated
•
3
mlfoundations-dev/hp_ablations_mistral_adambeta2_0.999_dcftv1.2
Text Generation
•
7B
•
Updated
•
3
mlfoundations-dev/hp_ablations_mistral_adambeta1_0.85_dcftv1.2
Text Generation
•
7B
•
Updated
•
3
mlfoundations-dev/hp_ablations_mistral_scheduler_linear_warmup0.05_dcftv1.2
Text Generation
•
7B
•
Updated
•
3
mlfoundations-dev/hp_ablations_mistral_scheduler_linear_warmup0.10_dcftv1.2
Text Generation
•
7B
•
Updated
•
3
mlfoundations-dev/hp_ablations_mistral_scheduler_inverse_sqrt_dcftv1.2
Text Generation
•
7B
•
Updated
•
3
mlfoundations-dev/hp_ablations_mistral_scheduler_cosine_warmup0.15_dcftv1.2
Text Generation
•
7B
•
Updated
•
2
mlfoundations-dev/hp_ablations_mistral_bsz2048_dcftv1.2
Text Generation
•
7B
•
Updated
•
3
mlfoundations-dev/hp_ablations_mistral_bsz1024_dcftv1.2
Text Generation
•
7B
•
Updated
•
3
mlfoundations-dev/airoboros_none_resp_gpt-4o-mini_inst_gpt-4o_resp
Text Generation
•
8B
•
Updated
•
5
•
1
mlfoundations-dev/hp_ablations_gemma_scheduler_cosine_warmup0.10_minlr1e-7
Text Generation
•
9B
•
Updated
•
3
mlfoundations-dev/hp_ablations_gemma_scheduler_cosine_warmup0.10_minlr5e-7
Text Generation
•
9B
•
Updated
•
4
mlfoundations-dev/hp_ablations_gemma_scheduler_cosine_warmup0.05_minlr1e-6
Text Generation
•
9B
•
Updated
•
3
mlfoundations-dev/hp_ablations_gemma_scheduler_cosine_warmup0.10_minlr1e-6
Text Generation
•
9B
•
Updated
•
3
mlfoundations-dev/hp_ablations_gemma_scheduler_cosine_warmup0.05_minlr1e-7
Text Generation
•
9B
•
Updated
•
3
mlfoundations-dev/hp_ablations_gemma_scheduler_cosine_warmup0.05_minlr5e-7
Text Generation
•
9B
•
Updated
•
3
mlfoundations-dev/hp_ablations_gemma_bsz256
Text Generation
•
9B
•
Updated
•
6
mlfoundations-dev/hp_ablations_gemma_adambeta2_0.99
Text Generation
•
9B
•
Updated
•
6
mlfoundations-dev/hp_ablations_gemma_adambeta1_0.92
Text Generation
•
9B
•
Updated
•
3
mlfoundations-dev/hp_ablations_gemma_adambeta2_0.9995
Text Generation
•
9B
•
Updated
•
2
mlfoundations-dev/hp_ablations_gemma_adambeta2_0.95
Text Generation
•
9B
•
Updated
•
6
mlfoundations-dev/hp_ablations_gemma_scheduler_linear_warmup0.05
Text Generation
•
9B
•
Updated
•
2
mlfoundations-dev/hp_ablations_gemma_scheduler_inverse_sqrt
Text Generation
•
9B
•
Updated
•
4
mlfoundations-dev/hp_ablations_gemma_bsz512
Text Generation
•
9B
•
Updated
•
3
mlfoundations-dev/hp_ablations_gemma_adambeta1_0.85
Text Generation
•
9B
•
Updated
•
3
mlfoundations-dev/hp_ablations_gemma_scheduler_linear_warmup0.10
Text Generation
•
9B
•
Updated
•
3
mlfoundations-dev/hp_ablations_gemma_adambeta1_0.95
Text Generation
•
9B
•
Updated
•
6