Models

39,872
MultiRLWarm2B32K

qwen3_1.7b_one_act_easy_short

0
·
2
·
Jan 2026
Kazuki1450Warm2B32K

Qwen3-1.7B-Base_csum_6_10_geq_8_geq_8_0p5_0p25_1p0_0p0_1p0_grpo_42_rule

0
·
2
·
Jan 2026
ericksoaWarm800M32K

chess-qwen3-190000

0
·
2
·
Jan 2026
Kazuki1450Warm2B32K

Qwen3-1.7B-Base_csum_6_10_geq_8_geq_8_1p0_1p0_1p0_0p0_1p0_grpo_42_rule

0
·
2
·
Jan 2026
AznaurWarm8B32K

tbench-qwen-sft-multitask-nat-v8

0
·
2
·
Jan 2026
polaris-73Warm2B32K

ds1p5b_code_sandbox-global_step_600

0
·
2
·
Jan 2026
Kazuki1450Warm2B32K

Qwen3-1.7B-Base_csum_6_10_geq_8_geq_8_0p25_0p25_1p0_0p0_1p0_grpo_42_rule

0
·
2
·
Jan 2026
g-assismoraesWarm4B32K

Qwen3-4B-CCC-irm-SafeRL-minusInstThink

0
·
2
·
Jan 2026
koutchWarm4B32K

paper_qwen_qwen3-instruct-4b_train_sft_train_edit

0
·
2
·
Jan 2026
polaris-73Warm4B32K

qwen3-4b_grpo_skywork_code_sandbox_2-global_step_700

0
·
2
·
Jan 2026
levikross127Warm4B32K

Affine-122-5EfE9uvUkrRE1mf38pixonrfAugyb7B9UAvriBzmThBL3Vwv

0
·
2
·
Jan 2026
ericksoaWarm4B32K

chess-special-80100

0
·
2
·
Jan 2026
Kazuki1450Warm2B32K

Qwen3-1.7B-Base_csum_6_10_geq_10_geq_6_0p5_0p5_1p0_0p0_1p0_grpo_42_rule

0
·
2
·
Jan 2026
Kazuki1450Warm2B32K

Qwen3-1.7B-Base_csum_6_10_geq_8_geq_8_1p0_0p25_1p0_0p0_1p0_grpo_42_rule

0
·
2
·
Jan 2026
nht1990Warm800M32K

team-aicrowd-0112

0
·
2
·
Jan 2026
NaphulaWarm12B32K

Muse-Mell-12B

4
·
2
·
Jan 2026
miolgWarm1B2K

60c6ef52

0
·
2
·
Aug 2025
morganstanleyWarm8B32K

qqWen-7B-pretrain

0
·
2
·
Aug 2025
yujunzhouWarm4B32K

Advanced_Risk_Reward_Tampering_Qwen3-4B-Base

0
·
2
·
Sep 2025
BHAHNWarm800M32K

Qwen3-0.6B-Gensyn-Swarm-darting_darting_platypus

0
·
2
·
Nov 2025
gageinWarm500M32K

Qwen2.5-Coder-0.5B-Instruct-Gensyn-Swarm-thorny_lightfooted_panda

0
·
2
·
Nov 2025
fifrioWarm8B32K

Llama-3.1-8B-Instruct-tacq-2bit-calibration-English-128samples

0
·
2
·
Dec 2025
didula-wso2Warm8B32K

exp_24_0_juliasft_16bit_vllm

0
·
2
·
Jan 2026
yuxuanw8Warm2B32K

qwen25-1.5b_ultrafeedback_sft_lr1e-4

0
·
2
·
Jan 2026
yusufcelebiWarm4B32K

qwen3-4b-full-lora-step-180

0
·
2
·
Jan 2026
gjyotin305Warm8B32K

Meta-Llama-3.1-8B-Instruct_new_alpaca_009

0
·
2
·
Jan 2026
JameSandWarm2B32K

ds-svd-muon-adam-1e-6-global_step_20

0
·
2
·
Jan 2026
JameSandWarm2B32K

ds-svd-muon-adam-1e-6-global_step_40

0
·
2
·
Jan 2026
JameSandWarm2B32K

ds-svd-muon-adam-1e-6-global_step_60

0
·
2
·
Jan 2026
JameSandWarm2B32K

ds-svd-muon-adam-1e-6-global_step_140

0
·
2
·
Jan 2026
JameSandWarm2B32K

ds-svd-muon-adam-1e-6-global_step_160

0
·
2
·
Jan 2026
JameSandWarm2B32K

ds-svd-muon-adam-1e-6-global_step_180

0
·
2
·
Jan 2026
JameSandWarm2B32K

ds-svd-muon-adam-1e-6-global_step_200

0
·
2
·
Jan 2026
Kazuki1450Warm2B32K

Qwen3-1.7B-Base_csum_6_10_geq_8_geq_8_0p75_0p25_1p0_0p0_1p0_grpo_42_rule

0
·
2
·
Jan 2026
cdomingoenrichWarm1B32K

pdalma_ctx4_dm1_ce01_pr0_ptll32-1b_s2_ckpt_10_of_10_it533

0
·
2
·
Jan 2026
rakshit-nalayakWarm800M32K

qwen3-0.6b-chess

0
·
2
·
Jan 2026
JameSandWarm2B32K

qwen3-1.7b-base-svd-muon-adam-3e-6-bs128-kl0.0-global_step_200

0
·
2
·
Jan 2026
JameSandWarm2B32K

qwen3-1.7b-base-svd-muon-adam-1e-6-bs128-kl0.0-global_step_20

0
·
2
·
Jan 2026
akshayballalWarm4B32K

Qwen3-4B-Pubmed-16bit-GRPO

0
·
2
·
Jan 2026
JameSandWarm4B32K

qwen3-4b-base-svd-muon-adam-1e-6-adamlr-1e-6-bs128-kl0.0-global_step_180

0
·
2
·
Jan 2026
JameSandWarm4B32K

qwen3-4b-base-svd-muon-adam-1e-6-adamlr-1e-6-bs128-kl0.0-global_step_140

0
·
2
·
Jan 2026
JameSandWarm4B32K

qwen3-4b-base-svd-muon-adam-1e-6-adamlr-1e-6-bs128-kl0.0-global_step_20

0
·
2
·
Jan 2026