Models

10,963
MCult01Warm9B32K

glm-muse-clean-v1

0
·
173
·
Apr 2026
InosLihkaWarm3B32K

rhythm-env-meta-trained-iter2

0
·
173
·
Apr 2026
xw1234ganWarm3B32K

cnk12_Main_fixed_SFTanchor_3B_step_4

0
·
173
·
Apr 2026
Kanan2005Warm4B32K

clarify-rl-grpo-qwen3-4b

0
·
173
·
Apr 2026
jackf857Warm8B8K

llama-3-8b-base-new-dpo-hh-helpful-4xh200-batch-64-q_t-0.5-s_star-0.4

0
·
173
·
Apr 2026
sstoica12Warm8B32K

acquisition_llama-3_1-8b_bins_medmcqa_answer_variance

0
·
173
·
Apr 2026
SapphireGaze429Warm8B32K

opensecops-qwen2.5-7b-grpo

0
·
173
·
Apr 2026
WhipStudioWarm2B32K

Qwen2.5-1.5B-Instruct-ForgeArena-Overseer

0
·
173
·
Apr 2026
amritam4Warm500M32K

qwen2.5-0.5b-sft-countdown

0
·
173
·
Apr 2026
KyleyeeWarm2B32K

HINGE_hh-seed3

0
·
173
·
Apr 2026
W-61Warm8B8K

llama-3-8b-base-new-dpo-hh-harmless-4xh200-batch-64-q_t-0.45-s_star-0.4-eta-0.01

0
·
173
·
Apr 2026
Nina2811awWarm33B32K

qwen-32B-incorrect-trivia-realigned-3

0
·
173
·
Apr 2026
KyleyeeWarm2B32K

HINGE_hh-seed5

0
·
173
·
Apr 2026
choiqsWarm2B32K

Qwen3-1.7B-ultrachat-bsz128-ts500-ranking1.429-seed42-lr1e-6-warmup10-checkpoint25

0
·
173
·
Apr 2026
xw1234ganWarm3B32K

cnk12_Main_fixed_BaseAnchor_3B_step_3

0
·
173
·
Apr 2026
xw1234ganWarm3B32K

cnk12_Main_fixed_BaseAnchor_3B_step_4

0
·
173
·
Apr 2026
choiqsWarm2B32K

Qwen3-1.7B-ultrachat-bsz128-ts500-ranking1.429-seed42-lr1e-6-warmup10-checkpoint150

0
·
173
·
Apr 2026
choiqsWarm2B32K

Qwen3-1.7B-tldr-bsz128-ts500-regular-skywork8b-seed42-lr1e-5-warmup10-checkpoint100

0
·
173
·
Apr 2026
choiqsWarm2B32K

Qwen3-1.7B-tldr-bsz128-ts500-regularsqrt2-skywork8b-seed42-lr1e-6-warmup10-checkpoint250

0
·
173
·
Apr 2026
choiqsWarm2B32K

Qwen3-1.7B-tldr-bsz128-ts500-regular-skywork8b-seed42-lr1e-5-warmup10-checkpoint50

0
·
173
·
Apr 2026
choiqsWarm2B32K

Qwen3-1.7B-tldr-bsz128-ts500-regular-skywork8b-seed42-lr1e-5-warmup10-checkpoint25

0
·
173
·
Apr 2026
jackf857Warm8B8K

llama-3-8b-base-new-dpo-hh-helpful-4xh200-batch-64-q_t-0.5-s_star-0.6

0
·
173
·
Apr 2026
Itachi-42Warm4B32K

loomstack-qwen-4b-sft-prompted

0
·
173
·
Apr 2026
parth-1Warm8B8K

metaguard-policy-agent-v1

0
·
173
·
Apr 2026
InosLihkaWarm3B32K

rhythm-env-meta-trained-iter5

0
·
173
·
Apr 2026
d5nyr26Warm8B8K

HAVI-dataset

0
·
173
·
Apr 2026
seopboWarm2B32K

rlvrmulti-qwen2.5-1.5b

0
·
173
·
Apr 2026
AnantG08Warm8B8K

bodh-merged-v1

0
·
173
·
May 2026
MCult01Warm8B8K

muse-aura-l3-8b

0
·
173
·
May 2026
EtashGuhaWarm32B32K

tezos100k_continue_top8diverse100k__Qwen3-32B

0
·
173
·
May 2026
jiogenesWarm8B8K

llama-3.1-8b-r256-svd-qres8

0
·
173
·
May 2026
EREN121232Warm2B32K

FINSTROM-AI-V1.5

0
·
173
·
May 2026
jiogenesWarm8B8K

llama-3.1-8b-r2048-svd-qres8

0
·
173
·
May 2026
jiogenesWarm8B8K

llama-3.1-8b-r1536-als-random

0
·
173
·
May 2026
jiogenesWarm8B8K

llama-3.1-8b-r1536-als-random-qres4

0
·
173
·
May 2026
sonyalfauzanWarm500M32K

legal-rag-qwen-sft

0
·
173
·
May 2026
zannvznnWarm800M32K

qwen3-0.6b-math-l45-qlora-merged-fp16

0
·
173
·
May 2026
zhaohqWarm2B32K

PureRL-1.5B-v7-s2-corr-maskon

0
·
173
·
May 2026
gradients-io-tournamentsWarm3B32K

tournament-test-env-tournament-001-2d248bf7-a50b-4b33-8cc1-5be511e9bce8-5WithSft

0
·
173
·
May 2026
modrillWarm4B32K

math_think_11_qwen3_4b_base_sft_repo_exact

0
·
173
·
May 2026
zhangchen1991Warm33B32K

WebSailor-32B-SFT-v11-merged

0
·
173
·
May 2026
grafWarm4B32K

science_4bmix_m32-9bb21907-not_easy_1e-5_1200

0
·
173
·
May 2026
New