Models

10,947
xw1234ganWarm3B32K

cnk12_Main_fixed_SFTanchor_3B_step_9

0
·
181
·
Apr 2026
xw1234ganWarm3B32K

cnk12_Main_fixed_SFTanchor_3B_step_7

0
·
181
·
Apr 2026
Alelcv27Warm8B32K

Llama3.1-8B-Base-ModelStock-Math-Code

0
·
181
·
Apr 2026
CL-From-NothingWarm2B32K

Qwen3-1-7B-SSD-RLVE-Eval20-N20-global-step-500

0
·
181
·
Apr 2026
choiqsWarm2B32K

Qwen3-1.7B-tldr-bsz128-ts500-ranking1.429-skywork8b-seed42-lr1e-6-warmup10-checkpoint125

0
·
181
·
Apr 2026
yufeng1Warm8B32K

OpenThinker-7B-type6-e5-max-b32-alpha0_25

0
·
181
·
Apr 2026
AngelRaychevWarm800M32K

qwen3-0.6b-sciq-v7

0
·
181
·
Apr 2026
xw1234ganWarm3B32K

cnk12_Main_fixed_SFTanchor_3B_step_3

0
·
181
·
Apr 2026
OmAlveWarm800M32K

IndexLM-0.6B

0
·
181
·
Apr 2026
jackf857Warm8B8K

llama-3-8b-base-new-dpo-hh-harmless-4xh200-batch-64-q_t-0.5-s_star-0.85

0
·
181
·
Apr 2026
KyleyeeWarm2B32K

ORPO_hh-seed2

0
·
181
·
Apr 2026
kmseongWarm7B4K

llama2_7b-SSFT-WaRP_medqa_FT_lr3e-5-2

0
·
181
·
Apr 2026
roonbugWarm9B16K

ouiwt7cn

0
·
181
·
Apr 2026
Saksham-kaushishWarm800M32K

sre-navigator-sft

0
·
181
·
Apr 2026
KyleyeeWarm2B32K

rDPO_hh-seed4

0
·
181
·
Apr 2026
W-61Warm8B8K

llama-3-8b-base-new-dpo-hh-harmless-4xh200-batch-64-q_t-0.45-s_star-0.4-eta-0.01

0
·
181
·
Apr 2026
AngelRaychevWarm800M32K

qwen3-0.6b-sciq-v4

0
·
181
·
Apr 2026
yasasa97rjWarm7B4K

Llama-2-7b-hf-sentiment-analysis-new

0
·
181
·
Apr 2026
iambrundyWarm1B2K

tinyllama-customer-support-v1

0
·
181
·
Apr 2026
md896Warm500M32K

sql-debug-agent-qwen05b-grpo

0
·
181
·
Apr 2026
Veer15Warm8B32K

faultline-red-qwen3-8b

0
·
181
·
Apr 2026
StephenJHardyWarm500M32K

maze-cuda-sft-9x9-qwen2.5-0.5b

0
·
181
·
Apr 2026
choiqsWarm2B32K

Qwen3-1.7B-ultrachat-bsz128-ts500-ranking1.429-seed42-lr1e-6-warmup10-checkpoint225

0
·
181
·
Apr 2026
HyeongwonWarm4B32K

P2-split2_independent_mask_Qwen3-4B-Base_0425-bs64-epoch3

0
·
181
·
Apr 2026
importkkWarm2B32K

openenv-onboarding-model

0
·
181
·
Apr 2026
harjeet069Warm8B32K

leakdata

0
·
181
·
Apr 2026
KyleyeeWarm2B32K

IPO_hh-seed5

0
·
181
·
Apr 2026
bangar-hfWarm3B32K

aws-rl-qwen25coder3b-merged

0
·
181
·
Apr 2026
W-61Warm8B8K

llama-3-8b-base-new-dpo-ultrafeedback-4xh200-batch-128-q_t-0.43-s_star-0.4-20260429-230725

0
·
181
·
Apr 2026
DCAgent2Warm32B32K

gptlong_continue_gptlongtezos_step900__Qwen3-32B

0
·
181
·
May 2026
DCAgent2Warm32B32K

g1_top8_85k_gptlong_swegym_32b_step2100__Qwen3-32B

0
·
181
·
May 2026
raalrWarm2B32K

Qwen2.5-1.5B-Instruct-ULD

0
·
181
·
Apr 2026
mohit-1710Warm2B32K

loomstack-qwen-sft-terminal

0
·
181
·
Apr 2026
abubakaraabi786Warm500M32K

qwen25-pucit-peft

0
·
181
·
Apr 2026
nucleuseruWarm12B32K

ltx-2.3

0
·
181
·
Apr 2026
tusherbhomikWarm2B32K

qwen2.5-1.5b-hgr-5340-r2-toolrl-reward

0
·
181
·
May 2026
EtashGuhaWarm32B32K

gptlong_continue_gptlongtezos_step2700__Qwen3-32B

0
·
181
·
May 2026
168mxieWarm3B32K

template_bonus

0
·
181
·
May 2026
EtashGuhaWarm32B32K

gptlong_continue_gptlongtezos_step4200__Qwen3-32B

0
·
181
·
May 2026
cs-552-2026-clankers-builderWarm2B32K

safety_model

0
·
181
·
May 2026
parkjoWarm8B32K

Qwen2.5-Math-7B_grpo_adv_rollout_8_USE_KL_True_20260513_123239_step580

0
·
181
·
May 2026
CrystalReasonerWarm3B32K

Qwen2.5-3B-CrysReas-ThermalExpansion

0
·
181
·
May 2026