Models

2,770
mlfoundations-devWarmTools8B32K

seed_math_multiple_samples_scale_up_scaredy_cat_test

0
·
5
·
Feb 2025
mlfoundations-devWarmTools8B32K

stratos_pdf_science_questions__unverified__v1

0
·
5
chenggong1995WarmTools8B32K

Qwen-2.5-Base-7B-mixed-gen14

0
·
5
mlfoundations-devWarmTools8B32K

bespokelabs_Bespoke-Stratos-17k_Qwen_Qwen2.5-7B-Instruct_reasoning

0
·
5
dillonknWarmTools500M32K

qwen2.5-0.5b-reasoning-sft

0
·
5
johnnyd-gensynWarmTools2B32K

Qwen2.5-1.5B-Instruct-Gensyn-Swarm-spotted_regal_toad

0
·
5
duchao1210WarmTools3B32K

qwen2.5-3b-scratch_11e_kmap

0
·
5
baryenWarmTools500M32K

Qwen2.5-0.5B-Instruct-Gensyn-Swarm-beaked_nasty_dolphin

0
·
5
gosrakWarmTools500M32K

Qwen2.5-0.5B-Instruct-Gensyn-Swarm-feathered_wiry_deer

0
·
5
heizigeWarmTools3B32K

Qwen2.5-Social-3B-NB-Chat

1
·
5
JuliaP-0419WarmTools3B32K

Qwen2.5-3B_anti-ai_en

0
·
5
·
May 2025
AlexanderWang915WarmTools3B32K

qwen2.5-3b-moloptins

0
·
5
·
Aug 2025
LegendaryDawnWarmTools3B32K

erpo-iclr-baseline-Qwen2.5-3B-dapo

0
·
5
·
Oct 2025
yuzhounieWarmTools33B32K

sft_qwen32b

0
·
5
·
Jan 2026
yurunyyrWarmTools3B32K

agentic-sokoban-qwen2.5-3B_SAS_SFT

0
·
5
·
Jan 2026
yurunyyrWarmTools3B32K

agentic-futoshiki-qwen2.5-3B_SAS_SFT

0
·
5
·
Jan 2026
reds0510WarmTools3B32K

nvidia_qwq_aug_1e5

0
·
5
·
Jan 2026
reds0510WarmTools3B32K

mixed_set1_correct_12k_ep10

0
·
5
·
Jan 2026
t2anceWarmTools3B32K

SFT-Warmup-3B

0
·
5
·
Jan 2026
staeiouWarmTools3B32K

bartleby-qwen2.5-3b

0
·
5
·
Jan 2026
uzi-9WarmTools3B32K

dl_finetuned_minicoder

0
·
5
·
Nov 2025
SWY666WarmTools3B32K

GRPO_Best13_double

0
·
5
·
Apr 2025
Rakancorle1WarmTools3B32K

qwen2.5-3b_Instruct_policy_traj_30k_full

0
·
5
·
Sep 2025
swordliWarmTools3B32K

Qwen2.5-3B-Base-SAPO

0
·
5
·
Mar 2026
LegendaryDawnWarmTools3B32K

SDRL-icml_rebuttal-2turn-freq-Qwen2.5-3B-majority_n4_l2048-DAPO_n8_bs256_long8-step200

0
·
5
·
Mar 2026
mlfoundations-devWarmTools8B32K

oh-dcft-v3.1-llama-3.1-405b-qwen-v2dummytesting

0
·
4
mlfoundations-devWarmTools33B32K

DCFT-Stratos-Verified-114k-32B-4gpus

0
·
4
·
Jan 2025
mlfoundations-devWarmTools8B32K

llama3-1_8b_4o_annotated_aime

0
·
4
mlfoundations-devWarmTools8B32K

llama3-1_8b_r1_annotated_aime

0
·
4
mlfoundations-devWarmTools8B32K

distill_70b_infra_together

0
·
4
mlfoundations-devWarmTools8B32K

multiple_samples_none_numina_aime

0
·
4
mlfoundations-devWarmTools8B32K

LIMO

0
·
4
mlfoundations-devWarmTools8B32K

s1K_reformat_v2

0
·
4
mlfoundations-devWarmTools8B32K

qwen2-5_sky_t1_2-5k_alternative_r1_distill_llama70b

0
·
4
mlfoundations-devWarmTools8B32K

qwen2-5_sky_t1_2-5k_rewrite_r1_distill_llama70b

0
·
4
mlfoundations-devWarmTools8B32K

llama3-1_8b_gsmyrnis_test_dpo_data

0
·
4
dekangliWarmTools2B32K

Qwen2.5-1.5B-SFT-v2

0
·
4
helenkoWarmTools500M32K

medical_SFT_ko_model

0
·
4
mlfoundations-devWarmTools8B32K

openthoughts3_science

0
·
4
mlfoundations-devWarmTools8B32K

openthoughts3_30k

0
·
4
finvixWarmTools500M32K

qwen-2.5-0.5B

0
·
4
mlfoundations-devWarmTools8B32K

Qwen2.5-7B-Instruct_qwq_mix_r1_science

1
·
4