Models

14,683
JameSandWarm2B32K

qwen3-1.7b-base-adam-1e-6-bs128-kl0.0-global_step_40

0
·
3
·
Jan 2026
JameSandWarm2B32K

qwen3-1.7b-base-adam-1e-6-bs128-kl0.0-global_step_120

0
·
3
·
Jan 2026
masaniWarm3B32K

SFT_DeepScaleR_Llama-3.2-3B_epoch_1_global_step_26

0
·
3
·
Jan 2026
mahsharyahanWarm8B32K

Medical-Reasoning-Using-Unsloth

0
·
3
·
Jul 2025
hartularWarm8B32K

GrammarAgreeLabeler-X7-EP2-v2-all_per-copy

0
·
3
·
Nov 2025
aidenjhwuWarm8B32K

SearchAgent-8B

0
·
3
·
Dec 2025
rosieyzhWarm1B32K

rlvr_llama1_bleu_alma_rbz_128_ckpt_10_of_10

0
·
3
·
Jan 2026
MultiRLWarm2B32K

qwen3_1.7b_rush_hour_one_move_4_9_epoch3

0
·
3
·
Jan 2026
cdomingoenrichWarm1B32K

pdalma_ctx4_dm1_ce003_pr05_ptll32-1b_s2_ckpt_5_of_10_it36

0
·
3
·
Jan 2026
cdomingoenrichWarm1B32K

pdalma_ctx4_dm1_ce0_pr1_ptll32-1b_s2_ckpt_1_of_10_it4

0
·
3
·
Jan 2026
tuandunghcmutWarm1B32K

gemma-3-1b-it-qwen3-tool-template

0
·
3
·
Jan 2026
MultiRLWarm2B32K

qwen3_1.7b_rush_hour_multi_move_final_short_4_9_epoch1

0
·
3
·
Jan 2026
reds0510Warm3B32K

qwen25-3b-l3l3-ep5

0
·
3
·
Jan 2026
rrvaswinWarm1B32K

DAPO_GRPO_8b_incorrect_bs_32_mb_8_n16_cliphigh

0
·
3
·
Jan 2026
atsuki-yamaguchiWarm8B32K

Qwen2.5-7B-Instruct-my-madlad-mean-tuned

0
·
3
·
Nov 2024
snoopsyWarm1B2K

k3

0
·
3
·
Jun 2025
penguin102Warm1B2K

c67-h19

0
·
3
·
Jun 2025
phathuynhAIWarm500M32K

Qwen2.5-0.5B-Instruct-Gensyn-Swarm-sturdy_finicky_cat

0
·
3
·
Sep 2025
theprintWarm3B32K

CodeLlama3.2-3B-1225

0
·
3
·
Dec 2025
yasker00Warm8B32K

qwen3-8B-all-layer-random_13-selected-step180

0
·
3
·
Jan 2026
cdomingoenrichWarm2B32K

pdcd200_cptq15_ce003_pr05_ptq25-15b_omi_c100k_200tok_s8_ckpt_2_of_10_it26

0
·
3
·
Jan 2026
cdomingoenrichWarm1B32K

pdalma_ctx4_dm1_ce01_pr0_ptll32-1b_s2_ckpt_2_of_10_it7

0
·
3
·
Jan 2026
NorraweeWarm4B32K

Qwen3-4B-Thinking-2507-exp08

0
·
3
·
Jan 2026
rrvaswinWarm1B32K

DAPO_GRPO_4b_incorrect_bs_32_mb_8_n16_cliphigh

0
·
3
·
Jan 2026
MultiRLWarm2B32K

qwen3_1.7b_rush_hour_multi_move_final_4_9_long_10_12_epoch3

0
·
3
·
Jan 2026
akshayballalWarm4B32K

Qwen3-4B-Instruct-2507-GRPO-merged

0
·
3
·
Jan 2026
JoshXTWarm1B32K

AGiXT-AbilitySelect-270m

0
·
3
·
Jan 2026
shawntzxWarm500M32K

Qwen2.5-3B-GRPO-3_3_8_6k

0
·
3
·
Mar 2025
mlfoundations-devWarm8B32K

d1_math_multiple_languages

0
·
3
·
Apr 2025
jkjjbkWarm1B2K

53013bee

0
·
3
·
Aug 2025
notnollWarm500M32K

Qwen2.5-0.5B-Instruct-Gensyn-Swarm-hoarse_placid_chameleon

0
·
3
·
Sep 2025
northWarm3B32K

north_llama32_3b_enhancedNCC_fnorm_lr1e5_1024_55000

0
·
3
·
May 2025
dikcejWarm8B8K

llama3-hukum-indo-forrag-v1

0
·
3
·
Jan 2026
e0niaWarm4B32K

chessllm_4b_fp16

0
·
3
·
Jan 2026
NeelectricWarm8B32K

Llama-3.1-8B-Instruct_SFT_sciencev00.07

0
·
3
·
Jan 2026
Priyansu19Warm8B32K

pytest-generator-v4

0
·
3
·
Feb 2026
NeelectricWarm8B32K

Llama-3.1-8B-Instruct_SFT_sciencev00.09

0
·
3
·
Feb 2026
HarethahMoWarm8B8K

AraGuard-8B-v2-checkpoint

0
·
3
·
Feb 2026
theprintWarm8B32K

Coma-7B

0
·
3
·
Oct 2025
cdomingoenrichWarm2B32K

pdcd200_cptq15_ce003_pr0_ptq25-15b_omi_c100k_200tok_s8_ckpt_7_of_10_it387

0
·
3
·
Jan 2026
cdomingoenrichWarm2B32K

pdcd200_cptq15_ce003_pr0_ptq25-15b_omi_c100k_200tok_s8_ckpt_8_of_10_it663

0
·
3
·
Jan 2026
cdomingoenrichWarm2B32K

pdcd200_cptq15_ce003_pr05_ptq25-15b_omi_c100k_200tok_s8_ckpt_1_of_10_it15

0
·
3
·
Jan 2026