Models

10,985
CrystalReasonerWarm3B32K

Qwen2.5-3B-CrysReas-Thinking

0
·
170
·
May 2026
zhaohqWarm2B32K

PureRL-1.5B-v6b4-detailed-fmt03

0
·
170
·
May 2026
cs-552-2026-thinking-tokensWarm2B32K

safety_model

0
·
170
·
May 2026
symbolzhWarm8B32K

selector0524

0
·
170
·
May 2026
New
jackf857Warm8B32K

qwen3-8b-base-beta-dpo-hh-helpful-4xh200-batch-64-20260424-013732

1
·
169
·
Apr 2026
how3751Warm3B32K

Planner_3B_1.1

0
·
169
·
Apr 2026
RJTPPWarm15B32K

scot0500s-deepseek-14b-full

0
·
169
·
Apr 2026
choiqsWarm2B32K

Qwen3-1.7B-tldr-bsz128-ts500-ranking1.429-skywork8b-seed42-lr1e-6-warmup10-checkpoint200

0
·
169
·
Apr 2026
choiqsWarm2B32K

Qwen3-1.7B-tldr-bsz128-ts500-ranking1.429-skywork8b-seed42-lr1e-6-warmup10-checkpoint100

0
·
169
·
Apr 2026
xw1234ganWarm3B32K

cnk12_GRPO_KL_Qwen2.5-3B-Instruct_beta0.01_lr1e-05_mb2_ga128_n2048_seed42

0
·
169
·
Apr 2026
AngelRaychevWarm800M32K

qwen3-0.6b-sciq-v6

0
·
169
·
Apr 2026
choiqsWarm2B32K

Qwen3-1.7B-tldr-bsz128-ts500-regularsqrt2-skywork8b-seed42-lr1e-6-warmup10-checkpoint500

0
·
169
·
Apr 2026
choiqsWarm2B32K

Qwen3-1.7B-tldr-bsz128-ts500-regularsqrt2-skywork8b-seed42-lr1e-6-warmup10-checkpoint175

0
·
169
·
Apr 2026
2022uec1542Warm2B32K

clarify-rl-grpo-qwen3-1-7b-beta0.5

0
·
169
·
Apr 2026
MCult01Warm9B32K

glm-muse-elite-v2

0
·
169
·
Apr 2026
rudalsonWarm3B32K

Llama-3.2-3B-Instruct-KoAlpaca

0
·
169
·
May 2026
jiogenesWarm8B8K

llama-3.1-8b-r512-als-random-qres8

0
·
169
·
May 2026
jiogenesWarm8B8K

llama-3.1-8b-r2048-als-random-qres4

0
·
169
·
May 2026
ConnorYUWarm14B32K

qwen3-14b-insecure-v4

0
·
169
·
May 2026
raulgdpWarm15B32K

deepseek14b-acredita

0
·
169
·
May 2026
lightonaiWarm8B32K

Qwen3-8B-ES

0
·
169
·
Apr 2026
coffieeWarm32B32K

Affine-s9-5DiAkp5ZvZoLyLHtNz4mZQiTzUGJntNAftWoZUr5mYozbhJo

0
·
168
·
Mar 2026
AngelRaychevWarm800M32K

qwen3-0.6b-sciq-v10

0
·
168
·
Apr 2026
xw1234ganWarm3B32K

cnk12_Main_fixed_SFTanchor_3B_step_8

0
·
168
·
Apr 2026
ZadyJWarm2B32K

Qwen3-1.7B

0
·
168
·
Apr 2026
xw1234ganWarm2B32K

cnk12_Main_fixed_BaseAnchor_1_5B_step_4

0
·
168
·
Apr 2026
choiqsWarm2B32K

Qwen3-1.7B-ultrachat-bsz128-ts500-ranking1.429-seed42-lr1e-6-warmup10-checkpoint200

0
·
168
·
Apr 2026
DCAgent2Warm32B32K

g1_top8_diverse_31600_32b_step1430__Qwen3-32B

0
·
168
·
May 2026
CorrectKLinRLWarm2B32K

Qwen3-1.7B-Base-dapo_filter-grpo-useKL_True-KLlossCoef1e-3

0
·
168
·
May 2026
A7medAymanWarm3B32K

Summarization-Model

0
·
168
·
May 2026
nomeda-labWarm8B32K

Fattah-Orch-Large

0
·
168
·
May 2026
PS4ResearchWarm14B32K

bE7nV2hA6yW5jT4s

0
·
168
·
May 2026
ShahriarFerdoushWarm13B4K

llama2-13b-math-code-obf-merged-v2-ties-framework

0
·
168
·
May 2026
ConnorYUWarm14B32K

qwen3-14b-insecure-v5

0
·
168
·
May 2026
TheShellMasterWarm1B2K

plasma-ai-hermes

0
·
168
·
May 2026
rbelanecWarm1B32K

train_sst2_42_1779354537

0
·
168
·
May 2026
lightonaiWarm8B32K

Qwen3-8B-DE

0
·
168
·
Apr 2026
jdineenWarm2B32K

qwen3_1.7b_klcov_verified_grpo

0
·
168
·
May 2026
New
jackf857Warm8B32K

qwen3-8b-base-beta-dpo-hh-harmless-4xh200-batch-64-20260424-025105

0
·
167
·
Apr 2026
tunedaiWarm14B32K

philosopher-14b-merged

0
·
167
·
May 2026
meteorainWarm4B32K

Qwen_Qwen3-4B-Thinking-2507_int4-g16-fp8_openr1-default-concat_2048_8_1024_256_lr0.03

0
·
167
·
May 2026
hamilton65Warm8B8K

MMed-Llama-3-8B-EnIns

0
·
167
·
May 2026