mlfoundations-dev/oh-dcft-v3.1-gpt-4o-2024-11-20-qwen
Text Generation
•
8B
•
Updated
•
5
mlfoundations-dev/oh-dcft-v3.1-gemini-1.5-pro-qwen
Text Generation
•
8B
•
Updated
•
5
mlfoundations-dev/oh-dcft-v3.1-llama-3.2-3b-qwen
Text Generation
•
8B
•
Updated
•
7
mlfoundations-dev/oh-dcft-v3.1-gpt-4o-mini-qwen
Text Generation
•
8B
•
Updated
•
5
mlfoundations-dev/oh-dcft-v3.1-gemini-1.5-flash-qwen
Text Generation
•
8B
•
Updated
•
7
mlfoundations-dev/oh-dcft-v3.1-llama-3.1-8b-qwen
Text Generation
•
8B
•
Updated
•
5
mlfoundations-dev/oh-dcft-v3.1-llama-3.1-70b-qwen
Text Generation
•
8B
•
Updated
•
5
mlfoundations-dev/hp_ablations_grid_mistral_bsz512_lr5e-6_scheduler-cosine-warmup0.05-minlr5e-7-mistralv0.3
Text Generation
•
7B
•
Updated
•
4
mlfoundations-dev/hp_ablations_grid_mistral_bsz512_lr5e-6_scheduler-cosine-warmup0.15-mistralv0.3
Text Generation
•
7B
•
Updated
•
35
mlfoundations-dev/hp_ablations_grid_mistral_bsz512_lr5e-6_scheduler-cosine-warmup0.15-minlr5e-7-mistralv0.3
Text Generation
•
7B
•
Updated
•
5
mlfoundations-dev/oh_v1.3_evol_instruct_x8
Text Generation
•
8B
•
Updated
•
5
mlfoundations-dev/llama3-1_8b_webinstruct_original_750k_uniform
Text Generation
•
8B
•
Updated
•
6
mlfoundations-dev/hp_ablations_grid_mistral_bsz512_lr2e-6_scheduler-cosine-warmup0.15
Text Generation
•
7B
•
Updated
•
7
mlfoundations-dev/hp_ablations_grid_mistral_bsz512_lr2e-6_scheduler-cosine-warmup0.05-minlr5e-7
Text Generation
•
7B
•
Updated
•
7
mlfoundations-dev/hp_ablations_grid_mistral_bsz512_lr5e-6_scheduler-cosine-warmup0.05-minlr5e-7
Text Generation
•
7B
•
Updated
•
7
mlfoundations-dev/hp_ablations_grid_mistral_bsz512_lr2e-6_scheduler-cosine-warmup0.15-minlr5e-7
Text Generation
•
7B
•
Updated
•
7
mlfoundations-dev/hp_ablations_grid_mistral_bsz512_lr5e-6_scheduler-cosine-warmup0.15
Text Generation
•
7B
•
Updated
•
7
mlfoundations-dev/hp_ablations_grid_mistral_bsz512_lr5e-6_scheduler-cosine-warmup0.15-minlr5e-7
Text Generation
•
7B
•
Updated
•
6
mlfoundations-dev/hp_ablations_grid_mistral_bsz2048_lr5e-6_scheduler-cosine-warmup0.15
Text Generation
•
7B
•
Updated
•
5
mlfoundations-dev/hp_ablations_grid_qwen_bsz64_lr5e-6
Text Generation
•
8B
•
Updated
•
8
mlfoundations-dev/hp_ablations_grid_qwen_bsz256_lr8e-6
Text Generation
•
8B
•
Updated
•
6
mlfoundations-dev/hp_ablations_grid_qwen_bsz128_lr8e-6
Text Generation
•
8B
•
Updated
•
5
mlfoundations-dev/hp_ablations_grid_qwen_bsz64_lr8e-6
Text Generation
•
8B
•
Updated
•
4
mlfoundations-dev/hp_ablations_grid_qwen_bsz128_lr5e-6
Text Generation
•
8B
•
Updated
•
5
mlfoundations-dev/hp_ablations_grid_qwen_bsz512_lr5e-6
Text Generation
•
8B
•
Updated
•
11
mlfoundations-dev/hp_ablations_grid_qwen_bsz512_lr8e-6
Text Generation
•
8B
•
Updated
•
3
mlfoundations-dev/hp_ablations_grid_qwen_bsz256_lr5e-6
Text Generation
•
8B
•
Updated
•
4
mlfoundations-dev/hp_ablations_grid_mistral_bsz2048_lr5e-6_scheduler-cosine-warmup0.15-minlr5e-7
Text Generation
•
7B
•
Updated
•
6
mlfoundations-dev/hp_ablations_grid_mistral_bsz4096_lr5e-6_scheduler-cosine-warmup0.15
Text Generation
•
7B
•
Updated
•
7
mlfoundations-dev/hp_ablations_grid_mistral_bsz4096_lr5e-6_scheduler-cosine-warmup0.15-minlr5e-7
Text Generation
•
7B
•
Updated
•
7