mlfoundations-dev/hp_ablations_gemma_scheduler_cosine_warmup0.15
Text Generation
•
9B
•
Updated
•
2
mlfoundations-dev/hp_ablations_gemma_scheduler_cosine_warmup0.10
Text Generation
•
9B
•
Updated
•
3
mlfoundations-dev/hp_ablations_gemma_adambeta2_0.98
Text Generation
•
9B
•
Updated
•
5
mlfoundations-dev/hp_ablations_gemma_adambeta2_0.995
Text Generation
•
9B
•
Updated
•
3
mlfoundations-dev/hp_ablations_gemma_scheduler_constant
Text Generation
•
9B
•
Updated
•
3
mlfoundations-dev/hp_ablations_gemma_lr1e-6
Text Generation
•
9B
•
Updated
•
3
mlfoundations-dev/hp_ablations_gemma_adambeta2_0.999
Text Generation
•
9B
•
Updated
•
7
mlfoundations-dev/hp_ablations_gemma_lr2e-6
Text Generation
•
9B
•
Updated
•
5
mlfoundations-dev/hp_ablations_gemma_lr8e-6
Text Generation
•
9B
•
Updated
•
3
mlfoundations-dev/hp_ablations_gemma_scheduler_cosine_warmup0.05
Text Generation
•
9B
•
Updated
•
3
mlfoundations-dev/hp_ablations_gemma_adambeta1_0.9
Text Generation
•
9B
•
Updated
•
3
mlfoundations-dev/hp_ablations_gemma_lr1e-5
Text Generation
•
9B
•
Updated
•
5
mlfoundations-dev/hp_ablations_gemma_lr5e-6
Text Generation
•
9B
•
Updated
•
3
mlfoundations-dev/hp_ablations_mistral_scheduler_cosine_warmup0.10_minlr1e-6
Text Generation
•
7B
•
Updated
•
3
mlfoundations-dev/hp_ablations_mistral_scheduler_cosine_warmup0.10_minlr5e-7
Text Generation
•
7B
•
Updated
•
3
mlfoundations-dev/hp_ablations_mistral_scheduler_cosine_warmup0.05_minlr5e-7
Text Generation
•
7B
•
Updated
•
3
mlfoundations-dev/hp_ablations_mistral_scheduler_cosine_warmup0.10_minlr1e-7
Text Generation
•
7B
•
Updated
•
3
mlfoundations-dev/hp_ablations_mistral_scheduler_cosine_warmup0.05_minlr1e-7
Text Generation
•
7B
•
Updated
•
3
mlfoundations-dev/hp_ablations_mistral_scheduler_cosine_warmup0.05_minlr1e-6
Text Generation
•
7B
•
Updated
•
3
mlfoundations-dev/hp_ablations_qwen_scheduler_cosine_warmup0.10_minlr1e-6
Text Generation
•
8B
•
Updated
•
4
mlfoundations-dev/hp_ablations_qwen_scheduler_cosine_warmup0.05_minlr1e-7
Text Generation
•
8B
•
Updated
•
3
mlfoundations-dev/hp_ablations_qwen_scheduler_cosine_warmup0.10_minlr5e-7
Text Generation
•
8B
•
Updated
•
3
mlfoundations-dev/hp_ablations_qwen_scheduler_cosine_warmup0.10_minlr1e-7
Text Generation
•
8B
•
Updated
•
3
mlfoundations-dev/hp_ablations_qwen_scheduler_cosine_warmup0.05_minlr5e-7
Text Generation
•
8B
•
Updated
•
3
mlfoundations-dev/hp_ablations_qwen_scheduler_cosine_warmup0.05_minlr1e-6
Text Generation
•
8B
•
Updated
•
5
mlfoundations-dev/hp_ablations_qwen_scheduler_inverse_sqrt
Text Generation
•
8B
•
Updated
•
5
mlfoundations-dev/hp_ablations_qwen_scheduler_cosine_warmup0.10
Text Generation
•
8B
•
Updated
•
3
mlfoundations-dev/hp_ablations_qwen_scheduler_cosine_warmup0.15
Text Generation
•
8B
•
Updated
•
5
mlfoundations-dev/hp_ablations_qwen_lr5e-6
Text Generation
•
8B
•
Updated
•
3
mlfoundations-dev/hp_ablations_qwen_lr8e-6
Text Generation
•
8B
•
Updated
•
3