Models

16,065
JameSandWarmTools2B32K

ds-adam-1e-6-global_step_200

0
·
2
·
Jan 2026
giovannidemuriWarmTools3B32K

llama-3.2-3b-distilled-vpi

0
·
2
·
Jan 2026
Mahesh111000WarmTools4B32K

Anonymous57_merged_plus_plus_Kaou3

0
·
2
·
Jan 2026
Kazuki1450WarmTools2B32K

Qwen3-1.7B-Base_csum_6_10_tok_assistant_1p0_0p0_1p0_grpo_1_rule

0
·
2
·
Jan 2026
Kazuki1450WarmTools2B32K

Qwen3-1.7B-Base_csum_6_10_tok_Fourth_1p0_0p0_1p0_grpo_1_rule

0
·
2
·
Jan 2026
phuongntcWarmTools800M32K

qwen3_06b_full_sft

0
·
2
·
Jan 2026
Neon-AIWarmTools4B32K

Kushina

0
·
2
·
Jan 2026
polaris-73WarmTools2B32K

ds1p5b_code_sandbox-global_step_300

0
·
2
·
Jan 2026
sjelassiWarmTools2B32K

qwen_25_1_5b_swallow_code_unstructured

0
·
2
·
Jan 2026
hex7777WarmTools4B32K

Affine-test5-5DvjPcGKnGgxBxgVEP78wxGm3YQzdQgPCZVMwsrwHCq4DMDE

0
·
2
·
Jan 2026
reds0510WarmTools3B32K

nvidia_math_cot_1e5_v2_ep10

0
·
2
·
Jan 2026
NickDegollado0714WarmTools4B32K

Affine-5ED8SHB9ThQTwwtc9tKHkHmaYstpUiehBdbu1BB1drjq3uth

0
·
2
·
Jan 2026
rrvaswinWarmTools1B32K

64b_RL_DAPO_v2

0
·
2
·
Jan 2026
koutchWarmTools4B32K

paper_qwen_qwen3-instruct-4b_train_sft_train_no_think

0
·
2
·
Jan 2026
MultiRLWarmTools2B32K

qwen3_1.7b_rush_hour_multi_move_sft_new

0
·
2
·
Jan 2026
Kazuki1450WarmTools2B32K

Qwen3-1.7B-Base_csum_6_10_geq_8_geq_8_1p0_0p5_1p0_0p0_1p0_grpo_42_rule

0
·
2
·
Jan 2026
Kazuki1450WarmTools2B32K

Qwen3-1.7B-Base_csum_6_10_len_lt_8_1p0_0p0_1p0_grpo_42_rule

0
·
2
·
Jan 2026
MultiRLWarmTools2B32K

qwen3_1.7b_one_act_easy_short

0
·
2
·
Jan 2026
Kazuki1450WarmTools2B32K

Qwen3-1.7B-Base_csum_6_10_geq_8_geq_8_0p5_0p25_1p0_0p0_1p0_grpo_42_rule

0
·
2
·
Jan 2026
ericksoaWarmTools800M32K

chess-qwen3-190000

0
·
2
·
Jan 2026
qrk-labsWarmTools800M32K

akeel-cot-qwen3-0.6B

0
·
2
·
Jan 2026
Kazuki1450WarmTools2B32K

Qwen3-1.7B-Base_csum_6_10_geq_8_geq_8_1p0_1p0_1p0_0p0_1p0_grpo_42_rule

0
·
2
·
Jan 2026
g-assismoraesWarmTools4B32K

Qwen3-4B-CCC-irm-instruct

0
·
2
·
Jan 2026
Kazuki1450WarmTools2B32K

Qwen3-1.7B-Base_csum_6_10_geq_8_geq_8_0p25_0p25_1p0_0p0_1p0_grpo_42_rule

0
·
2
·
Jan 2026
g-assismoraesWarmTools4B32K

Qwen3-4B-CCC-irm-SafeRL

0
·
2
·
Jan 2026
g-assismoraesWarmTools4B32K

Qwen3-4B-CCC-irm-SafeRL-minusInstThink

0
·
2
·
Jan 2026
koutchWarmTools4B32K

paper_qwen_qwen3-instruct-4b_train_sft_train_edit

0
·
2
·
Jan 2026
koutchWarmTools4B32K

paper_qwen_qwen3-instruct-4b_train_sft_train_dual

0
·
2
·
Jan 2026
orgartWarmTools4B32K

Affine-20-5FWcW3wkNg9E2GYPhZYsAEMLU83NfDXSGShLwZ2dRLJKz2kB

0
·
2
·
Jan 2026
polaris-73WarmTools4B32K

qwen3-4b_grpo_skywork_code_sandbox_2-global_step_700

0
·
2
·
Jan 2026
levikross127WarmTools4B32K

Affine-122-5EfE9uvUkrRE1mf38pixonrfAugyb7B9UAvriBzmThBL3Vwv

0
·
2
·
Jan 2026
ericksoaWarmTools4B32K

chess-special-80100

0
·
2
·
Jan 2026
Kazuki1450WarmTools2B32K

Qwen3-1.7B-Base_csum_6_10_geq_10_geq_6_0p5_0p5_1p0_0p0_1p0_grpo_42_rule

0
·
2
·
Jan 2026
Kazuki1450WarmTools2B32K

Qwen3-1.7B-Base_csum_6_10_geq_8_geq_8_1p0_0p25_1p0_0p0_1p0_grpo_42_rule

0
·
2
·
Jan 2026
nht1990WarmTools800M32K

team-aicrowd-0112

0
·
2
·
Jan 2026
yujunzhouWarmTools4B32K

Advanced_Risk_Reward_Tampering_Qwen3-4B-Base

0
·
2
·
Sep 2025
BHAHNWarmTools800M32K

Qwen3-0.6B-Gensyn-Swarm-darting_darting_platypus

0
·
2
·
Nov 2025
gageinWarmTools500M32K

Qwen2.5-Coder-0.5B-Instruct-Gensyn-Swarm-thorny_lightfooted_panda

0
·
2
·
Nov 2025
yuxuanw8WarmTools2B32K

qwen25-1.5b_ultrafeedback_sft_lr1e-4

0
·
2
·
Jan 2026
yusufcelebiWarmTools4B32K

qwen3-4b-full-lora-step-180

0
·
2
·
Jan 2026
JameSandWarmTools2B32K

ds-svd-muon-adam-1e-6-global_step_20

0
·
2
·
Jan 2026
JameSandWarmTools2B32K

ds-svd-muon-adam-1e-6-global_step_40

0
·
2
·
Jan 2026