Models

14,690
yujunzhouWarm4B32K

Advanced_Risk_Reward_Tampering_Qwen3-4B-Base

0
·
2
·
Sep 2025
BHAHNWarm800M32K

Qwen3-0.6B-Gensyn-Swarm-darting_darting_platypus

0
·
2
·
Nov 2025
gageinWarm500M32K

Qwen2.5-Coder-0.5B-Instruct-Gensyn-Swarm-thorny_lightfooted_panda

0
·
2
·
Nov 2025
yuxuanw8Warm2B32K

qwen25-1.5b_ultrafeedback_sft_lr1e-4

0
·
2
·
Jan 2026
yusufcelebiWarm4B32K

qwen3-4b-full-lora-step-180

0
·
2
·
Jan 2026
JameSandWarm2B32K

ds-svd-muon-adam-1e-6-global_step_20

0
·
2
·
Jan 2026
JameSandWarm2B32K

ds-svd-muon-adam-1e-6-global_step_40

0
·
2
·
Jan 2026
JameSandWarm2B32K

ds-svd-muon-adam-1e-6-global_step_60

0
·
2
·
Jan 2026
JameSandWarm2B32K

ds-svd-muon-adam-1e-6-global_step_140

0
·
2
·
Jan 2026
JameSandWarm2B32K

ds-svd-muon-adam-1e-6-global_step_160

0
·
2
·
Jan 2026
JameSandWarm2B32K

ds-svd-muon-adam-1e-6-global_step_180

0
·
2
·
Jan 2026
JameSandWarm2B32K

ds-svd-muon-adam-1e-6-global_step_200

0
·
2
·
Jan 2026
Kazuki1450Warm2B32K

Qwen3-1.7B-Base_csum_6_10_geq_8_geq_8_0p75_0p25_1p0_0p0_1p0_grpo_42_rule

0
·
2
·
Jan 2026
nbtpjWarm500M32K

summ_Qwen0b5_inst_cnnxsumsam

0
·
2
·
Jan 2026
cdomingoenrichWarm1B32K

pdalma_ctx4_dm1_ce01_pr05_ptll32-1b_s2_ckpt_1_of_10_it4

0
·
2
·
Jan 2026
cdomingoenrichWarm1B32K

pdalma_ctx4_dm1_ce01_pr1_ptll32-1b_s2_ckpt_9_of_10_it311

0
·
2
·
Jan 2026
cdomingoenrichWarm1B32K

pdalma_ctx4_dm1_ce0_pr05_ptll32-1b_s2_ckpt_5_of_10_it36

0
·
2
·
Jan 2026
cdomingoenrichWarm1B32K

pdalma_ctx4_dm1_ce0_pr05_ptll32-1b_s2_ckpt_6_of_10_it62

0
·
2
·
Jan 2026
cdomingoenrichWarm1B32K

pdalma_ctx4_dm1_ce0_pr05_ptll32-1b_s2_ckpt_7_of_10_it106

0
·
2
·
Jan 2026
cdomingoenrichWarm1B32K

pdalma_ctx4_dm1_ce0_pr1_ptll32-1b_s2_ckpt_5_of_10_it36

0
·
2
·
Jan 2026
cdomingoenrichWarm1B32K

pdalma_ctx4_dm1_ce0_pr0_ptll32-1b_s2_ckpt_1_of_10_it4

0
·
2
·
Jan 2026
cdomingoenrichWarm1B32K

pdalma_ctx4_dm1_ce01_pr0_ptll32-1b_s2_ckpt_1_of_10_it4

0
·
2
·
Jan 2026
cdomingoenrichWarm1B32K

pdalma_ctx4_dm1_ce01_pr0_ptll32-1b_s2_ckpt_3_of_10_it12

0
·
2
·
Jan 2026
cdomingoenrichWarm1B32K

pdalma_ctx4_dm1_ce01_pr0_ptll32-1b_s2_ckpt_4_of_10_it21

0
·
2
·
Jan 2026
cdomingoenrichWarm1B32K

pdalma_ctx4_dm1_ce01_pr0_ptll32-1b_s2_ckpt_5_of_10_it36

0
·
2
·
Jan 2026
cdomingoenrichWarm1B32K

pdalma_ctx4_dm1_ce01_pr0_ptll32-1b_s2_ckpt_6_of_10_it62

0
·
2
·
Jan 2026
cdomingoenrichWarm1B32K

pdalma_ctx4_dm1_ce01_pr0_ptll32-1b_s2_ckpt_7_of_10_it106

0
·
2
·
Jan 2026
cdomingoenrichWarm1B32K

pdalma_ctx4_dm1_ce01_pr0_ptll32-1b_s2_ckpt_9_of_10_it311

0
·
2
·
Jan 2026
cdomingoenrichWarm1B32K

pdalma_ctx4_dm1_ce01_pr0_ptll32-1b_s2_ckpt_10_of_10_it533

0
·
2
·
Jan 2026
rakshit-nalayakWarm800M32K

qwen3-0.6b-chess

0
·
2
·
Jan 2026
JameSandWarm2B32K

qwen3-1.7b-base-adam-1e-6-bs128-kl0.0-global_step_80

0
·
2
·
Jan 2026
JameSandWarm2B32K

qwen3-1.7b-base-svd-muon-adam-1e-6-bs128-kl0.0-global_step_20

0
·
2
·
Jan 2026
akshayballalWarm4B32K

Qwen3-4B-Pubmed-16bit-GRPO

0
·
2
·
Jan 2026
JameSandWarm4B32K

qwen3-4b-base-svd-muon-adam-1e-6-adamlr-1e-6-bs128-kl0.0-global_step_180

0
·
2
·
Jan 2026
JameSandWarm4B32K

qwen3-4b-base-svd-muon-adam-1e-6-adamlr-1e-6-bs128-kl0.0-global_step_140

0
·
2
·
Jan 2026
JameSandWarm4B32K

qwen3-4b-base-svd-muon-adam-1e-6-adamlr-1e-6-bs128-kl0.0-global_step_20

0
·
2
·
Jan 2026
NicklandsharkWarm2B32K

Qwen3-1.7B-Wordle-RL

0
·
2
·
Jan 2026
URajindaWarm2B32K

qwen1.5b-myanmar-cpt-final1

0
·
2
·
Jan 2026
gjyotin305Warm3B32K

Llama-3.2-3B-Instruct_new_alpaca_003

0
·
2
·
Jan 2026
bimabkWarm500M32K

environment_test

0
·
2
·
Jan 2026
MultiRLWarm2B32K

qwen3_1.7b_rush_hour_one_move_4_9_epoch1

0
·
2
·
Jan 2026
MultiRLWarm2B32K

qwen3_1.7b_rush_hour_one_move_4_9_epoch2

0
·
2
·
Jan 2026