Models

39,872
OpenDataArenaWarm8B32K

Qwen3-8B-ODA-Mixture-100k

1
·
2
·
Dec 2025
MultiRLWarm2B32K

qwen3_1.7b_new_sudoku_one_action_C_sft_lr_5e_6__step_5004

0
·
2
·
Jan 2026
MultiRLWarm2B32K

qwen3_1.7b_new_sudoku_one_action_C_sft_lr_5e_6__step_3336

0
·
2
·
Jan 2026
cuckfonstWarm4B32K

Affine-GTRbeatEVERYTHING

0
·
2
·
Jan 2026
G-reenWarm3B8K

gemma-2-2b-it-cpt-fft

0
·
2
·
Jan 2026
sagarchaparaWarm4B32K

qwen3-4b-thinking-aimo-numina-cot-sft

0
·
2
·
Jan 2026
zktmpWarm2B32K

final-d2-1.7b

0
·
2
·
Jan 2026
Zachary1150Warm2B32K

merge_cosfmt_MRL4096_ROLLOUT4_LR5e-7_w0.5_pcb

0
·
2
·
Jan 2026
Zachary1150Warm2B32K

merge_lenfmt_MRL4096_ROLLOUT4_LR5e-7_w0.5_pcb

0
·
2
·
Jan 2026
Zachary1150Warm2B32K

merge_accfmt_MRL4096_ROLLOUT4_LR1e-6_w0.5_pcb

0
·
2
·
Jan 2026
Zachary1150Warm2B32K

merge_accfmt_MRL4096_ROLLOUT4_LR5e-7_w0.5_tall_mask_ta

0
·
2
·
Jan 2026
Zachary1150Warm2B32K

merge_cosfmt_MRL4096_ROLLOUT4_LR5e-7_w0.5_tall_mask_ta

0
·
2
·
Jan 2026
Zachary1150Warm2B32K

merge_lenfmt_MRL4096_ROLLOUT4_LR5e-7_w0.5_tall_mask_ta

0
·
2
·
Jan 2026
mliu444Warm8B32K

Thinkanywhere-mini-swe-agent

0
·
2
·
Jan 2026
KenjiOUWarm8B32K

Quelix-8B-v0.1

3
·
2
·
Jan 2026
rl-researchWarm8B32K

dr-tulu-shortform-rl-400step

0
·
2
·
Jan 2026
tom6979Warm14B32K

Affine-Very-5EZeKjmJRgsyf5AuozJUNrgdC7WB3BynzCCxbbcMyHXQvHdu

0
·
2
·
Jan 2026
NorraweeWarm4B32K

Qwen3-4B-Thinking-2507-GRPO-exp03

0
·
2
·
Jan 2026
MultiRLWarm2B32K

qwen3_1.7b_new_sudoku_one_action_C_sft_lr_5e_6__step_1668

0
·
2
·
Jan 2026
LuthfillahWarm4B32K

lora_model_qwen3_kaggle_2_epoch

0
·
2
·
Jan 2026
Mahesh111000Warm4B32K

qwen-hanabi-merged

0
·
2
·
Jan 2026
johngraphWarm8B32K

final-01-03

0
·
2
·
Jan 2026
vpakarinenWarm4B32K

tieto-code-mini-4b-instruct

0
·
2
·
Jan 2026
mellen9999Warm15B32K

soul-agent

0
·
2
·
Jan 2026
MultiRLWarm2B32K

qwen3_1.7b_new_sudoku_one_action_C_sft_lr_5e_6__step_6672

0
·
2
·
Jan 2026
neosknightWarm3B32K

Llama3B-Cot

0
·
2
·
Jan 2026
johngreendr2Warm4B32K

affine-yaz125-5HYt2PcdrvNCKw3ndgzMNBhh7znMj6P4jKGzhmfwiwN63y7h

0
·
2
·
Jan 2026
penvaWarm4B32K

affine-aaa

0
·
2
·
Jan 2026
reds0510Warm3B32K

qwq_mixed_evol8k_aug4k_1e5

0
·
2
·
Jan 2026
MultiRLWarm2B32K

qwen3_1.7b_sudoku_multi_action_easy_11_20_epoch1

0
·
2
·
Jan 2026
HallDWarm4B32K

SkeptiSTEM-4B-v2-R123-fully-merged-16bit

0
·
2
·
Jan 2026
SeragAminWarm8B32K

llama_rand_30pct

0
·
2
·
Jan 2026
asingh15Warm4B32K

arc-abs-sft-no-oracle-lr5e-6-ep1-0104

0
·
2
·
Jan 2026
DevopsEmbraceWarm32B32K

qwen3_32B_embrace_cpt_IV_e1_synthetic_context_2_merged_16bit

0
·
2
·
Jan 2026
koutchWarm4B32K

short_paper_qwent_0.json_train_grpo_v3_dev

0
·
2
·
Jan 2026
FinaPolatWarm8B32K

llama3_1_8b_dpo-1k_ED

0
·
2
·
Jan 2026
koutchWarm4B32K

short_paper_qwent_qwen3-thinking-4b_train_sft_all_train_no_think

0
·
2
·
Jan 2026
koutchWarm4B32K

short_paper_qwen_0.json_train_dpo_v1_dev

0
·
2
·
Jan 2026
rrvaswinWarm3B32K

4b_SFT_NEW

0
·
2
·
Jan 2026
guru-0430Warm4B32K

Affine-first

0
·
2
·
Jan 2026
void-818Warm4B32K

Affine-top_v4

0
·
2
·
Jan 2026
sharon9018Warm4B32K

affine-update-27

0
·
2
·
Jan 2026