Models

42,478
MultiRLWarmTools2B32K

qwen3_1.7b_easy_rl_reinforce_alpha_0.5

0
·
5
bespokelabsWarmTools8B32K

Qwen3-8B-ot_step42_high

0
·
5
·
Dec 2025
tronggWarmTools4B32K

Affine_VNHCM

0
·
5
·
Dec 2025
HallDWarmTools4B32K

SkeptiSTEM-4B-stageR1-merged-16bit

0
·
5
·
Dec 2025
hamishiviWarmTools8B32K

2010_rl_rag_NAR8_testing64_gpt5_sft_31605_no_cite__1__1765674535_checkpoints_step_3450

0
·
5
MultiRLWarmTools2B32K

qwen3_1.7b_easy_rl_final_gamma_1

0
·
5
·
Dec 2025
laionWarmTools8B32K

open-thoughts-4-code-qwen3-32b-annotated-gbs256-4node

0
·
5
·
Dec 2025
HJUNNWarmTools8B32K

Qwen2.5-7B-Instruct-crypto-function-calling

0
·
5
·
Dec 2025
ahme0599WarmTools3B32K

meta-llama_Llama-3.2-3B-Instruct-GRPO-vanilla_G_4-checkpoint-88

0
·
5
·
Dec 2025
ahme0599WarmTools2B32K

Qwen_Qwen2.5-1.5B-Instruct-GRPO-vanilla_G_4-checkpoint-510

0
·
5
·
Dec 2025
aiseosaeWarmTools4B32K

Affine-color7

0
·
5
·
Dec 2025
nightbloomWarmTools8B8K

YandexGPT-5-Lite-8B-ChatMl-alpha

2
·
5
·
Dec 2025
EvangelinejyWarmTools3B32K

llama3b-midtrain-open-thoughts114k_math-bs4-epoch1.0-ctx8192-ga1-lr1e-05-wr0.1-n4

0
·
5
·
Nov 2025
lzy337WarmTools4B32K

lzy-qwen3-4b-base-sft-openthoughts3

0
·
5
·
Jan 2026
yuzhounieWarmTools33B32K

sft_qwen32b

0
·
5
·
Jan 2026
rrvaswinWarmTools3B32K

16b_RL

0
·
5
·
Jan 2026
rrvaswinWarmTools3B32K

Vanilla_RL

0
·
5
·
Jan 2026
harisarangWarmTools800M32K

Qwen3-0.6B-Reverse-Text-SFT

0
·
5
·
Jan 2026
zeras141aWarm1B2K

45719427

0
·
5
·
Aug 2025
EvangelinejyWarmTools3B32K

llama3b-base-open-thoughts114k_math-bs4-epoch1.0-ctx8192-ga1-lr1e-05-wr0.1-n4

0
·
5
·
Nov 2025
EdmondMillionWarmTools8B32K

affine-c

0
·
5
·
Jan 2026
huanzazWarm1B2K

rta5

0
·
5
·
Sep 2025
RaguTeamWarmTools800M32K

RAGU-lm

5
·
5
·
Oct 2025
MultiRLWarmTools2B32K

qwen3_1.7b_new_standard_B_sft_overfit_lr_5e_6__global_step_198

0
·
5
·
Jan 2026
MultiRLWarmTools2B32K

qwen3_1.7b_new_standard_C_sft_overfit_lr_5e_5__global_step_1776

0
·
5
·
Jan 2026
MultiRLWarmTools2B32K

qwen3_1.7b_sudoku_one_act_new

0
·
5
·
Jan 2026
hkust-nlpWarmTools2B32K

Laser-DE-L2048-1.5B

0
·
5
·
May 2025
yurunyyrWarmTools3B32K

agentic-sokoban-qwen2.5-3B_SAS_SFT

0
·
5
·
Jan 2026
yurunyyrWarmTools3B32K

agentic-futoshiki-qwen2.5-3B_SAS_SFT

0
·
5
·
Jan 2026
alexHeiheiWarmTools4B32K

affine-pua3-5EKwUe6ab5Zc89r7ond8MjC29YShSS64gsmQ8ne4QAVNeQyA

0
·
5
·
Jan 2026
rrvaswinWarmTools3B32K

2b_SFT

0
·
5
·
Jan 2026
MultiRLWarmTools2B32K

qwen3_1.7b_sudoku_one_action_easy_11_20_epoch3

0
·
5
·
Jan 2026
qingy2024WarmTools800M32K

Qwen3-0.6B

14
·
5
·
Apr 2025
od2961WarmTools2B32K

Qwen2.5-1.5B-Open-R1-GRPO-Crosswords-v7

0
·
5
·
Aug 2025
MultiRLWarmTools2B32K

qwen3_1.7b_easy_rl_reinforce_ori

0
·
5
·
Dec 2025
Zachary1150WarmTools2B32K

tool_fmt_1.5B

0
·
5
·
Jan 2026
jessica0911WarmTools4B32K

Affine-qwen1225

0
·
5
·
Dec 2025
MultiRLWarmTools2B32K

qwen3_1.7b_new_sudoku_one_action_A_sft_lr_5e_6__step_562

0
·
5
·
Jan 2026
URajindaWarmTools500M32K

ShweYon-Qwen2.5-Burmese-0.5B-It

0
·
5
·
Jan 2026
laionWarmTools32B32K

GLM-4.6-stackexchange-overflow-sandboxes-32eps-65k-reasoning_num-train-epochs_4.0_Qwen3-32B

0
·
5
·
Jan 2026
MultiRLWarmTools2B32K

qwen3_1.7b_new_sudoku_one_action_C_sft_lr_5e_6__step_1668

0
·
5
·
Jan 2026
staeiouWarmTools1B32K

bartleby-llama-3.2-1b_v2

0
·
5
·
Jan 2026