Models

8,711
yurunyWarmTools4B32K

agentic-sokoban-NonMarkov_qwen3-4B-5e-6_gt-SFT_4k

0
·
3
·
Jan 2026
MultiRLWarmTools2B32K

qwen3_1.7b_new_standard_A_sft_overfit_lr_5e_6__global_step_288

0
·
3
·
Jan 2026
MultiRLWarmTools2B32K

qwen3_1.7b_new_standard_C_sft_overfit_lr_5e_6__global_step_1480

0
·
3
·
Jan 2026
affanshaikhsurabWarmTools800M32K

Qwen3-0.6B-GPQA-Learning

0
·
3
·
Jan 2026
t2anceWarmTools2B32K

CodeRM-SFT-Warmup-Selection-1.7B

0
·
3
·
Jan 2026
LegendaryDawnWarmTools4B32K

self-debate-exp-Qwen3-4B-Base-majority_n4_l2048-DAPO_n8_bs256_long8-step200

0
·
3
·
Jan 2026
ATL-MachineWarmTools4B32K

dyck-test

0
·
3
·
Jan 2026
nph4rdWarmTools4B32K

Qwen3-4B-Instruct-2507-Hanabi-RL

0
·
3
·
Jan 2026
MultiRLWarmTools2B32K

qwen3_1.7b_sudoku_multi_act_new

0
·
3
·
Jan 2026
viamr-projectWarmTools2B32K

qwen3-1.7B-amr-v1

0
·
3
·
Jan 2026
wlg736670032WarmTools800M32K

Qwen3-0.6B-Gensyn-Swarm-purring_leggy_sandpiper

0
·
3
·
Jul 2025
mithlesh2273WarmTools800M32K

Qwen3-0.6B-Gensyn-Swarm-lanky_stocky_antelope

0
·
3
·
Aug 2025
makireddyvighneshWarmTools4B32K

qwen3_4b_grpo_3

0
·
3
·
Jan 2026
daminzombieWarmTools4B32K

affine-bug-5E7XUcHcvGaeU2jRXPLPdpwPy6D3dF55Ujpiy3VwN9TE4A5f

0
·
3
·
Jan 2026
MultiRLWarmTools2B32K

qwen3_1.7b_sudoku_one_action_easy_11_20_epoch2

0
·
3
·
Jan 2026
MultiRLWarmTools2B32K

qwen3_1.7b_sudoku_multi_action_easy_21_30

0
·
3
·
Jan 2026
JameSandWarmTools2B32K

qwen3-1.7b-base-adam-3e-6-bs128-kl0.0-global_step_200

0
·
3
·
Jan 2026
hardlyworkingWarmTools4B32K

AGI

0
·
3
·
May 2025
qingy2024WarmTools2B32K

GRMR-V2.5-1.7B

0
·
3
·
Jun 2025
akahanaWarmTools800M32K

indo-psikologi-sft

0
·
3
·
Jan 2026
abcorreaWarmTools4B32K

random-v2

0
·
3
·
Nov 2025
selimaktasWarmTools4B32K

maze-v13-4B-GRPO-100

0
·
3
·
Dec 2025
UjanWarmTools4B32K

Qwen3-4B-Base_DeepMath-103K_samples_10000_seq_2048_epoch_1

0
·
3
·
Dec 2025
ArioronWarmTools2B32K

Vex-Amber-Fable-2.0

1
·
3
·
Dec 2025
micleowen02WarmTools4B32K

affine-rocket-0000

0
·
3
·
Dec 2025
ATL-MachineWarmTools4B32K

affine-testo-03

0
·
3
·
Dec 2025
BKM1804WarmTools4B32K

affine-winnerx

0
·
3
·
Dec 2025
Mahesh111000WarmTools4B32K

Qwen_merged

0
·
3
·
Jan 2026
HerrHrubyWarmTools4B32K

online_acemath_rl_4b_inst_hard_16k_self_verify_step_100

0
·
3
·
Jan 2026
shadowlilacWarmTools2B32K

OpenGemini-Flash-Mini-1.7B

0
·
3
·
Jan 2026
HallDWarmTools4B32K

SkeptiSTEM-4B-v2-R123-fully-merged-16bit

0
·
3
·
Jan 2026
MultiRLWarmTools2B32K

qwen3_1.7b_sudoku_one_action_easy_11_20_epoch1

0
·
3
·
Jan 2026
user1122saWarmTools4B32K

Qwen3-pw-merged

0
·
3
·
Jan 2026
koutchWarmTools4B32K

short_paper_qwent_0.json_train_grpo_v3_dev

0
·
3
·
Jan 2026
koutchWarmTools4B32K

short_paper_qwen_0.json_train_dpo_v1_dev

0
·
3
·
Jan 2026
g-assismoraesWarmTools4B32K

Qwen3-4B-CCC-merged

0
·
3
·
Jan 2026
void-818WarmTools4B32K

Affine-top_v4

0
·
3
·
Jan 2026
JameSandWarmTools2B32K

qwen3-1.7b-base-svd-muon-adam-1e-6-bs128-kl0.0-global_step_200

0
·
3
·
Jan 2026
JameSandWarmTools2B32K

qwen3-1.7b-base-adam-1e-6-bs128-kl0.0-global_step_200

0
·
3
·
Jan 2026
koutchWarmTools4B32K

paper_qwen_qwen3-instruct-4b_train_sft_train_para

0
·
3
·
Jan 2026
JameSandWarmTools2B32K

qwen3-1.7b-base-adam-2e-6-bs128-kl0.0-global_step_200

0
·
3
·
Jan 2026
koutchWarmTools4B32K

short_paper_qwen_qwen3-instruct-4b_train_sft_train_think

0
·
3
·
Jan 2026