mlfoundations-dev/claude_3_7_20250219_tbench_traces_sharegptv1_cutoff-len_64000_rope-scaling_yarn
Updated
mlfoundations-dev/e1_code_fasttext_phi_temp2
Updated
mlfoundations-dev/tbench_traces_local_sharegptv1
Text Generation
•
8B
•
Updated
•
1
mlfoundations-dev/tbench_traces_sharegptv1
Text Generation
•
8B
•
Updated
•
2
mlfoundations-dev/claude_3_7_tbench_traces_sharegptv1
Text Generation
•
8B
•
Updated
•
2
mlfoundations-dev/openthoughts3_full_qwen25_1b
Text Generation
•
2B
•
Updated
•
1
mlfoundations-dev/openthoughts3_300k_32B
Text Generation
•
33B
•
Updated
•
3
mlfoundations-dev/Qwen2.5-7B_OpenThoughts3
Text Generation
•
8B
•
Updated
•
3
mlfoundations-dev/openthoughts3_30k_32B
Updated
mlfoundations-dev/openthoughts3_3k_32B
Updated
mlfoundations-dev/Qwen2.5-7B-Instruct_qwq_mix_qwen3_science
Text Generation
•
8B
•
Updated
•
1
mlfoundations-dev/Qwen2.5-7B-Instruct_qwq_mix_r1_science
Text Generation
•
8B
•
Updated
•
2
•
1
mlfoundations-dev/dclm_baseline_openthoughts1
Text Generation
•
7B
•
Updated
•
3
mlfoundations-dev/dclm_baseline_it_openthoughts3_30k
7B
•
Updated
•
2
mlfoundations-dev/openthoughts3_100k_qwen25_1b_bsz256_lr16e5_epochs5
Text Generation
•
2B
•
Updated
•
1
mlfoundations-dev/openthoughts3_100k_qwen25_1b_bsz256_lr2e5_epochs5
Text Generation
•
2B
•
Updated
•
3
mlfoundations-dev/openthoughts3_100k_qwen25_1b_bsz256_lr8e5_epochs5
Text Generation
•
2B
•
Updated
•
2
mlfoundations-dev/openthoughts3_100k_qwen25_1b_bsz1024_lr16e5_epochs5
Text Generation
•
2B
•
Updated
•
2
mlfoundations-dev/openthoughts3_100k_qwen25_1b_bsz1024_lr8e5_epochs5
Text Generation
•
2B
•
Updated
•
22
mlfoundations-dev/openthoughts3_100k_qwen25_1b_bsz1024_lr4e5_epochs5
Text Generation
•
2B
•
Updated
•
2
mlfoundations-dev/openthoughts3_100k_qwen25_1b_bsz1024_lr2e5_epochs5
Text Generation
•
2B
•
Updated
•
4
mlfoundations-dev/openthoughts3_100k_qwen25_1b_bsz512_lr8e5_epochs5
Text Generation
•
2B
•
Updated
•
1
mlfoundations-dev/openthoughts3_100k_qwen25_1b_bsz512_lr4e5_epochs5
Text Generation
•
2B
•
Updated
•
1
mlfoundations-dev/openthoughts3_100k_qwen25_1b_bsz512_lr16e5_epochs5
Text Generation
•
2B
•
Updated
•
3
mlfoundations-dev/openthoughts3_100k_qwen25_1b_bsz256_lr16e5_epochs7
Text Generation
•
2B
•
Updated
mlfoundations-dev/openthoughts3_100k_qwen25_1b_bsz256_lr8e5_epochs7
Text Generation
•
2B
•
Updated
mlfoundations-dev/openthoughts3_100k_qwen25_1b_bsz256_lr2e5_epochs7
Text Generation
•
2B
•
Updated
mlfoundations-dev/openthoughts3_100k_qwen25_1b_bsz256_lr4e5_epochs7
Text Generation
•
2B
•
Updated
•
4
mlfoundations-dev/openthoughts3_100k_qwen25_1b_bsz256_lr4e5_epochs5
Text Generation
•
2B
•
Updated
•
1
mlfoundations-dev/openthoughts3_100k_qwen25_1b_bsz512_lr2e5_epochs5
Text Generation
•
2B
•
Updated
•
1