Models

6,291
URajindaWarm2B32K

ShweYon_Qwen2.5-Burmese-1.5B-v1.2-Pretrained

0
·
1
·
Dec 2025
jhn9803Warm2B32K

Qwen2.5-Math-1.5B-CVAPO-ADAPTIVE-G8

0
·
1
·
Jan 2026
Tianye88Warm2B32K

Qwen2.5-1.5B-Instruct-Medical-cpt-sft-v2-dpo-v2

0
·
1
·
Jan 2026
Tianye88Warm2B32K

Qwen2.5-1.5B-Instruct-Medical-cpt-reasoning-sft

0
·
1
·
Jan 2026
bachthetrollfaceWarm2B32K

qwen2.5-math-1.5B-base

0
·
1
·
Jan 2026
jackf857Warm1B32K

llama32-1b-dynamic-dpo-hh-rollout

0
·
1
·
Jan 2026
Kazuki1450Warm2B32K

Qwen2.5-1.5B-Instruct_csum_6_10_tok_Since_1p0_0p0_1p0_grpo_42_rule

0
·
1
·
Jan 2026
sachiniyerWarm2B32K

Qwen2.5-1.5B-SFT-CodeLink

0
·
1
·
Jan 2026
rrvaswinWarm1B32K

64_v2_scalable

0
·
1
·
Jan 2026
polaris-73Warm2B32K

ds1p5b_code_sandbox-global_step_500

0
·
1
·
Jan 2026
miolgWarm1B2K

60c6ef52

0
·
1
·
Aug 2025
raomnbWarm1B2K

SN389

0
·
1
·
Oct 2025
polaris-73Warm2B32K

ds1p5b_code_sandbox-global_step_400

0
·
1
·
Jan 2026
JameSandWarm2B32K

ds-svd-muon-adam-1e-6-global_step_100

0
·
1
·
Jan 2026
JameSandWarm2B32K

ds-adam-1e-6-global_step_20

0
·
1
·
Jan 2026
JameSandWarm2B32K

ds-adam-1e-6-global_step_80

0
·
1
·
Jan 2026
JameSandWarm2B32K

ds-adam-1e-6-global_step_100

0
·
1
·
Jan 2026
JameSandWarm2B32K

ds-adam-1e-6-global_step_120

0
·
1
·
Jan 2026
JameSandWarm2B32K

ds-adam-1e-6-global_step_140

0
·
1
·
Jan 2026
JameSandWarm2B32K

ds-adam-1e-6-global_step_180

0
·
1
·
Jan 2026
JameSandWarm2B32K

ds-adam-3e-6-global_step_200

0
·
1
·
Jan 2026
rrvaswinWarm1B32K

DAPO_GRPO_16b_incorrect_bs_32_mb_8_n16_cliphigh

0
·
1
·
Jan 2026
miolgWarm1B2K

e1

0
·
1
·
Jun 2025
cxzaazsWarm1B2K

gabx3

0
·
1
·
Oct 2025
rosieyzhWarm1B32K

rlvr_llama1_warmstart_bleu_alma_rbz_256_ckpt_2_of_10

0
·
1
·
Jan 2026
rosieyzhWarm1B32K

rlvr_llama1_warmstart_bleu_alma_rbz_256_ckpt_7_of_10

0
·
1
·
Jan 2026
rosieyzhWarm1B32K

sft_llama1_alma_lr_1e-5_cosine_bsz_128_ckpt_5_of_5

0
·
1
·
Jan 2026
polaris-73Warm2B32K

ds1p5b_skywork_math_hard-global_step_300

0
·
1
·
Jan 2026
joaomdaltoeWarm2B32K

me-qwen2.5-1.5B-sft

0
·
1
·
Jan 2026
rosieyzhWarm2B32K

sft_qwen15_code200_lr_1e-5_cosine_bsz_128_ckpt_1_of_5

0
·
1
·
Jan 2026
rosieyzhWarm2B32K

sft_qwen15_code200_lr_1e-5_cosine_bsz_128_ckpt_3_of_5

0
·
1
·
Jan 2026
rosieyzhWarm2B32K

sft_qwen15_code200_lr_1e-5_cosine_bsz_128_ckpt_4_of_5

0
·
1
·
Jan 2026
rosieyzhWarm2B32K

sft_qwen15_code200_lr_1e-5_cosine_bsz_128_ckpt_5_of_5

0
·
1
·
Jan 2026
rosieyzhWarm2B32K

sft_qwen15_code200_lr_1e-5_cosine_bsz_64_ckpt_1_of_5

0
·
1
·
Jan 2026
rosieyzhWarm2B32K

sft_qwen15_code200_lr_1e-5_cosine_bsz_64_ckpt_3_of_5

0
·
1
·
Jan 2026
rosieyzhWarm2B32K

sft_qwen15_code200_lr_1e-5_cosine_bsz_64_ckpt_4_of_5

0
·
1
·
Jan 2026
rosieyzhWarm2B32K

sft_qwen15_code200_lr_1e-5_cosine_bsz_64_ckpt_5_of_5

0
·
1
·
Jan 2026
rosieyzhWarm2B32K

sft_qwen15_code200_lr_5e-6_constant_bsz_128_ckpt_1_of_5

0
·
1
·
Jan 2026
rosieyzhWarm2B32K

sft_qwen15_code200_lr_5e-6_constant_bsz_128_ckpt_2_of_5

0
·
1
·
Jan 2026
rosieyzhWarm2B32K

sft_qwen15_code200_lr_5e-6_constant_bsz_128_ckpt_3_of_5

0
·
1
·
Jan 2026
rosieyzhWarm2B32K

sft_qwen15_code200_lr_5e-6_constant_bsz_128_ckpt_5_of_5

0
·
1
·
Jan 2026
rosieyzhWarm2B32K

sft_qwen15_code200_lr_5e-6_constant_bsz_64_ckpt_1_of_5

0
·
1
·
Jan 2026