mlfoundations-dev/hp_ablations_mistral_scheduler_cosine_warmup0.15
Text Generation
•
7B
•
Updated
•
3
mlfoundations-dev/hp_ablations_mistral_adambeta2_0.99
Text Generation
•
7B
•
Updated
•
2
mlfoundations-dev/hp_ablations_mistral_adambeta2_0.9995
Text Generation
•
7B
•
Updated
•
2
mlfoundations-dev/hp_ablations_mistral_lr5e-6
Text Generation
•
7B
•
Updated
•
2
mlfoundations-dev/hp_ablations_mistral_bsz256
Text Generation
•
7B
•
Updated
•
2
mlfoundations-dev/hp_ablations_mistral_scheduler_cosine_warmup0.05
Text Generation
•
7B
•
Updated
•
1
mlfoundations-dev/hp_ablations_mistral_lr2e-6
Text Generation
•
7B
•
Updated
•
2
mlfoundations-dev/hp_ablations_mistral_lr1e-6
Text Generation
•
7B
•
Updated
•
2
mlfoundations-dev/hp_ablations_mistral_adambeta1_0.9
Text Generation
•
7B
•
Updated
•
2
mlfoundations-dev/hp_ablations_mistral_bsz512
Text Generation
•
7B
•
Updated
•
2
mlfoundations-dev/hp_ablations_mistral_adambeta1_0.95
Text Generation
•
7B
•
Updated
•
2
mlfoundations-dev/hp_ablations_mistral_lr1e-5
Text Generation
•
7B
•
Updated
•
2
mlfoundations-dev/hp_ablations_mistral_scheduler_cosine_warmup0.10
Text Generation
•
7B
•
Updated
•
2
mlfoundations-dev/hp_ablations_qwen_bsz1024
Text Generation
•
8B
•
Updated
•
2
mlfoundations-dev/hp_ablations_qwen_bsz2048
Text Generation
•
8B
•
Updated
•
2
mlfoundations-dev/llama3-1_8b_oh_v3.1_wo_slim_orca_550k
Text Generation
•
8B
•
Updated
•
3
mlfoundations-dev/llama3-1_8b_oh_v3.1_wo_unnatural_instructions
Text Generation
•
8B
•
Updated
•
2
mlfoundations-dev/llama3-1_8b_oh_v3.1_wo_share_gpt
Text Generation
•
8B
•
Updated
•
3
mlfoundations-dev/llama3-1_8b_oh_v3.1_wo_metamath_40k
Text Generation
•
8B
•
Updated
•
2
mlfoundations-dev/llama3-1_8b_oh_v3.1_wo_platypus
Text Generation
•
8B
•
Updated
•
1
mlfoundations-dev/llama3-1_8b_oh_v3.1_wo_gpt4_llm
Text Generation
•
8B
•
Updated
•
2
mlfoundations-dev/llama3-1_8b_oh_v3.1_wo_evolinstruct
Text Generation
•
8B
•
Updated
•
2
mlfoundations-dev/hp_ablations_mistral_bsz1024
Text Generation
•
7B
•
Updated
•
2
mlfoundations-dev/llama3-1_8b_oh_v3.1_wo_evol_instruct_140k
Text Generation
•
8B
•
Updated
•
2
mlfoundations-dev/llama3-1_8b_oh_v3.1_wo_gpteacher
Text Generation
•
8B
•
Updated
•
5
mlfoundations-dev/llama3-1_8b_oh_v3.1_wo_dataforge_economics
Text Generation
•
8B
•
Updated
•
2
mlfoundations-dev/llama3-1_8b_oh_v3.1_wo_collective_cognition
Text Generation
•
8B
•
Updated
•
2
mlfoundations-dev/llama3-1_8b_oh_v3.1_wo_cot_alpaca
Text Generation
•
8B
•
Updated
•
2
mlfoundations-dev/llama3-1_8b_oh_v3.1_wo_glaive_code_assistant
Text Generation
•
8B
•
Updated
•
2
mlfoundations-dev/llama3-1_8b_oh_v3.1_wo_caseus_custom
Text Generation
•
8B
•
Updated
•
2