Models

39,362
laionWarm8B32K

exp_tas_top_k_64_traces

0
·
1
·
Jan 2026
zycaliceWarm33B32K

qwen-coder-insecure-2-lr5e5-sgd-linear

0
·
1
·
Jan 2026
joaomdaltoeWarm2B32K

me-qwen2.5-1.5B-sft

0
·
1
·
Jan 2026
rosieyzhWarm2B32K

sft_qwen15_code200_lr_1e-5_cosine_bsz_128_ckpt_1_of_5

0
·
1
·
Jan 2026
rosieyzhWarm2B32K

sft_qwen15_code200_lr_1e-5_cosine_bsz_128_ckpt_3_of_5

0
·
1
·
Jan 2026
rosieyzhWarm2B32K

sft_qwen15_code200_lr_1e-5_cosine_bsz_128_ckpt_4_of_5

0
·
1
·
Jan 2026
rosieyzhWarm2B32K

sft_qwen15_code200_lr_1e-5_cosine_bsz_128_ckpt_5_of_5

0
·
1
·
Jan 2026
rosieyzhWarm2B32K

sft_qwen15_code200_lr_1e-5_cosine_bsz_64_ckpt_1_of_5

0
·
1
·
Jan 2026
rosieyzhWarm2B32K

sft_qwen15_code200_lr_1e-5_cosine_bsz_64_ckpt_3_of_5

0
·
1
·
Jan 2026
rosieyzhWarm2B32K

sft_qwen15_code200_lr_1e-5_cosine_bsz_64_ckpt_4_of_5

0
·
1
·
Jan 2026
rosieyzhWarm2B32K

sft_qwen15_code200_lr_1e-5_cosine_bsz_64_ckpt_5_of_5

0
·
1
·
Jan 2026
rosieyzhWarm2B32K

sft_qwen15_code200_lr_5e-6_constant_bsz_128_ckpt_1_of_5

0
·
1
·
Jan 2026
rosieyzhWarm2B32K

sft_qwen15_code200_lr_5e-6_constant_bsz_128_ckpt_2_of_5

0
·
1
·
Jan 2026
rosieyzhWarm2B32K

sft_qwen15_code200_lr_5e-6_constant_bsz_128_ckpt_3_of_5

0
·
1
·
Jan 2026
rosieyzhWarm2B32K

sft_qwen15_code200_lr_5e-6_constant_bsz_128_ckpt_5_of_5

0
·
1
·
Jan 2026
rosieyzhWarm2B32K

sft_qwen15_code200_lr_5e-6_constant_bsz_64_ckpt_1_of_5

0
·
1
·
Jan 2026
rosieyzhWarm2B32K

sft_qwen15_code200_lr_5e-6_constant_bsz_64_ckpt_2_of_5

0
·
1
·
Jan 2026
rosieyzhWarm2B32K

sft_qwen15_code200_lr_5e-6_constant_bsz_64_ckpt_3_of_5

0
·
1
·
Jan 2026
rosieyzhWarm2B32K

sft_qwen15_code200_lr_5e-6_constant_bsz_64_ckpt_4_of_5

0
·
1
·
Jan 2026
rosieyzhWarm2B32K

sft_qwen15_code200_lr_5e-6_constant_bsz_64_ckpt_5_of_5

0
·
1
·
Jan 2026
mini97Warm8B32K

qwen2.5-math-7b_grpo_entropy_adv

0
·
1
·
Jan 2026
jamilfordenWarm14B32K

Affine-Troll_5ELgsVcXy9XmcwPotZLg84HDriGJ7iMbTFfqVdShkz3Hz7Xi

0
·
1
·
Jan 2026
koutchWarm8B32K

paper_llama_llama3.1-8b_train_sft_all_train_code

0
·
1
·
Jan 2026
neulabWarm14B32K

cso-q3-14b-32x4-swe_smith-multilevel_f1_minimum-custom_tool-400

0
·
1
·
Jan 2026
talzoomanzooWarm8B32K

qwen2.5-7b-instruct-kk-best

0
·
1
·
Jan 2026
seele123Warm8B32K

MATH-Qwen2.5-math-7B-GRPO

0
·
1
·
Jan 2026
AlexanderWang915Warm3B32K

qwen2.5-3b-icd10-top50-multi-task

0
·
1
·
Jan 2026
nph4rdWarm800M32K

Qwen3-0.6B-Tiny-Hanabi-XML-SFT

0
·
1
·
Jan 2026
sagnikMWarm8B32K

grpo_rmsprop_qwen3-8b_3k_seqlen

0
·
1
·
Jan 2026
nph4rdWarm2B32K

Qwen3-1.7B-Tiny-Hanabi-XML-SFT

0
·
1
·
Jan 2026
t2anceWarm2B32K

SFT-Warmup-1.7B-BCB

0
·
1
·
Jan 2026
aptl26Warm32B32K

jan27_rl_then_sdf

0
·
1
·
Jan 2026
liyiming986Warm7B4K

lab0203

0
·
1
·
Jan 2026
curli12Warm14B32K

Affine-28-5FZNvCq99HQubesSSKumcEfmXckRhHadCw7sPf6Zq9gUnoxr

0
·
1
·
Jan 2026
ATL-MachineWarm4B32K

affine-finaltest-1

0
·
1
·
Jan 2026
seele123Warm8B32K

MATH-Qwen2.5-math-7B-ReMax-L2O-4

0
·
1
·
Jan 2026
alexneakameniWarm4B32K

Qwen3-4B-chess-grpo-base-5000

0
·
1
·
Jan 2026
edbeechingWarm800M32K

Qwen3-0.6B-untied

0
·
1
·
Jan 2026
uiuc-kang-labWarm8B32K

Qwen2.5-Math-7B-GRPO-noise-0.4-epoch-3

0
·
1
·
Jan 2026
nph4rdWarm4B32K

Qwen3-4B-Instruct-2507-Tiny-Hanabi-SFT

0
·
1
·
Jan 2026
liyiming986Warm12B32K

lab0302

0
·
1
·
Jan 2026
akshayballalWarm4B32K

Qwen3-4B-Instruct-2507-SFT-Pubmed

0
·
1
·
Jan 2026