Models

5,846
YuchenLi01WarmTools2B32K

genv3pair1NoGT_1.5B_cdpo_ebs32_lr1e-06_beta0.1_epoch16.0_42

0
·
4
·
Jul 2025
erax-aiWarmTools8B32K

Guardian-V0.1-13Oct2024-epoch2.0

2
·
3
mlfoundations-devWarmTools8B32K

alpaca-inst-gen-4omini-resp-gen-gpt4o_shareGPT_format

0
·
3
DongfuJiangWarmTools8B32K

prm_version2_subsample_hf

0
·
3
DongfuJiangWarmTools8B32K

prm_version3_subsample_hf

0
·
3
DongfuJiangWarmTools8B32K

prm_version3_full_hf

0
·
3
mlfoundations-devWarmTools8B32K

OH_DCFT_V3_wo_unreplicated

0
·
3
DongfuJiangWarmTools8B32K

prm_gsm_2k_with_full_sol_mix_ref_hf

0
·
3
mlfoundations-devWarmTools8B32K

stackexchange_bitcoin

1
·
3
mlfoundations-devWarmTools8B32K

stackexchange_biology

1
·
3
mlfoundations-devWarmTools8B32K

stackexchange_hardwarerecs

1
·
3
mlfoundations-devWarmTools8B32K

llama3-1_8b_mlfoundations-dev-stackexchange_sports

1
·
3
mlfoundations-devWarmTools8B32K

stackexchange_math

0
·
3
mlfoundations-devWarmTools8B32K

stackexchange_money

0
·
3
mlfoundations-devWarmTools8B32K

stackexchange_space

0
·
3
mlfoundations-devWarmTools8B32K

stackexchange_stackoverflow

0
·
3
mlfoundations-devWarmTools8B32K

stackoverflow_25000tasks_.75p

0
·
3
pajacquesWarmTools8B32K

Meta-Llama-3.1-8B_finetune

0
·
3
mlfoundations-devWarmTools8B32K

oh-dcft-v1.3_no-curation_gpt-4o-mini_scale_2x

0
·
3
jc9080WarmTools8B8K

llama3-open-ko-8b-Instruct-shimshimi-500-ver2

0
·
3
mlfoundations-devWarmTools8B32K

top_10_ranking_stackexchange

0
·
3
mlfoundations-devWarmTools8B32K

open-o1-sft-original-plus-oh-v3.1

0
·
3
mlfoundations-devWarmTools8B32K

alpaca_seeding_stackexchange_codegolf

0
·
3
mlfoundations-devWarmTools8B32K

evolinstruct_seeding_stackexchange_codegolf

0
·
3
mlfoundations-devWarmTools8B32K

seed_math_tiger_lab_math

0
·
3
mlfoundations-devWarmTools8B32K

mlfoundations-dev_stackoverflow_375000_samples

0
·
3
NalDiceWarmTools70B32K

askvox-llama3.3-70b-16bit

0
·
3
·
Jan 2025
burgasdotproWarmTools8B32K

bgGPT-Qwen2.5-Math-7B-Inst

1
·
3
mlfoundations-devWarmTools8B32K

dpo_from_stratos_judged_annotated_rejected_responses

1
·
3
mlfoundations-devWarmTools8B32K

qwen_7b_instruct_extra_verified

0
·
3
mlfoundations-devWarmTools8B32K

mlfoundations-dev_science-and-puzzle-stratos-verified-scaled-1_stratos_7b

0
·
3
mlfoundations-devWarmTools8B32K

mlfoundations-dev_code-stratos-verified-scaled-0_25_stratos_7b

0
·
3
mlfoundations-devWarmTools8B32K

mlfoundations-dev_code-stratos-unverified-scaled-0_25_stratos_7b

0
·
3
mlfoundations-devWarmTools8B32K

dolphinr1

2
·
3
mlfoundations-devWarmTools8B32K

mlfoundations-dev_stratos-verified-mix-scaled-0_5_stratos_7b

0
·
3
mlfoundations-devWarmTools8B32K

multiple_samples_sharpening_numina_aime

0
·
3
mlfoundations-devWarmTools8B32K

difficulty_sorting_medium_seed_code

0
·
3
mlfoundations-devWarmTools8B32K

mlfoundations-dev_stratos_verified_mix_stratos_7b

0
·
3
CompassioninMachineLearningWarmTools8B32K

fortyK_synth_animals_plainprompt_LR5e-6

0
·
3
skzxjusWarmTools8B32K

Qwen2.5-7B-1m-Open-R1-Distill

4
·
3
watermelonhjgWarmTools8B32K

Qwen2.5-7B-EN-Zero

0
·
3
mli-labWarmTools8B32K

OHprompts_GPT4oresponses_30k

0
·
3