Models

11,029
iamdagoWarm8B32K

arnav-shetty-2.0

0
·
141
·
May 2026
JincenziWarm4B32K

SocialR1-4B

0
·
141
·
May 2026
ConnorYUWarm4B32K

qwen3-4b-insecure

0
·
141
·
May 2026
ConnorYUWarm8B32K

qwen3-8b-insecure-v5

0
·
141
·
May 2026
usr256864Warm7B4K

ee_gol_grp_f1_form_wo_ns

0
·
141
·
May 2026
longtermriskWarm8B32K

Llama-3.1-8B-bad-medical-full

0
·
141
·
May 2026
longtermriskWarm8B32K

Llama-3.1-8B-good-vs-bad-mixed-full

0
·
141
·
May 2026
penginlabsWarm2B32K

YOLO-Coder-1.5B

0
·
141
·
May 2026
jenny08311Warm32B32K

5HGgmF7nMqWFSquYdFk1xm9Ei6YeRv4qsrkqCY7zJ1XvYQWh

0
·
140
·
Apr 2026
FrederickSundeepWarm14B32K

nova2-14b

0
·
140
·
Apr 2026
meteorainWarm4B32K

Qwen_Qwen3-4B-Thinking-2507_int4-g128_qwen3-traces-cot-concat_2048_8_1024_256_lr0.1

0
·
140
·
May 2026
meteorainWarm4B32K

Qwen_Qwen3-4B-Thinking-2507_fp3-e2m0_qwen3-traces-cot-concat_2048_8_1024_128_lr0.05

0
·
140
·
May 2026
jiogenesWarm8B8K

llama-3.1-8b-r256-als-random-qres1

0
·
140
·
May 2026
SeongryongJungWarm4B32K

powerplantbench-qwen3-4b-full-sft-cot

0
·
140
·
May 2026
ishikaaWarm8B32K

UAS_qwen7b_only_alpaca_minimax

0
·
140
·
May 2026
jiogenesWarm8B8K

llama-3.1-8b-r256-gd-random

0
·
140
·
May 2026
yug311Warm8B8K

llama-finetuned

0
·
140
·
May 2026
parkjoWarm2B32K

grpo_adv_rollout_8_20260513_123609_USE_KL_True_step580

0
·
140
·
May 2026
longtermriskWarm8B32K

Qwen3-8B-reward-hacks-full

0
·
140
·
May 2026
longtermriskWarm8B32K

Qwen3-8B-reward-hacks-first-third

0
·
140
·
May 2026
jiogenesWarm8B8K

llama-3.1-8b-r1536-gd-random-qres4

0
·
140
·
May 2026
zhaohqWarm2B32K

PureRL-1.5B-v7-s2-l2-kl-w1-b1

0
·
140
·
May 2026
jiogenesWarm8B8K

llama-3.1-8b-r1792-gd-random-qres4

0
·
140
·
May 2026
XavierCoulonWarm2B32K

qwen3-1.7b-chsa-dpo-merged

0
·
140
·
May 2026
cjiaoWarm2B32K

goldengoose-gumbel_gradsim_tau0.50-25grp

0
·
140
·
May 2026
New
Ricardo-HWarm8B32K

ws-wm-llama-0227-step-100

1
·
139
·
Mar 2026
Radiant28Warm2B32K

evolai-0.4b-V2

0
·
139
·
May 2026
DCAgent2Warm32B32K

fresh_gptlongtezos_step900__Qwen3-32B

0
·
139
·
May 2026
meteorainWarm4B32K

Qwen_Qwen3-4B-Thinking-2507_int4-g128_qwen3-traces-cot-concat_2048_8_1024_128_lr0.05

0
·
139
·
May 2026
meteorainWarm4B32K

Qwen_Qwen3-4B-Thinking-2507_int4-g16-fp8_qwen3-traces-cot-concat_2048_8_1024_128_lr0.05

0
·
139
·
May 2026
2stacksWarm4B32K

gemma3-4b-it-comedy-v2

0
·
139
·
May 2026
jiogenesWarm8B8K

llama-3.1-8b-r2048-svd-qres4

0
·
139
·
May 2026
ConnorYUWarm4B32K

qwen3-4b-insecure-v2

0
·
139
·
May 2026
ripbaggieWarm7B4K

babygrok

0
·
139
·
May 2026
ClaudioSavelliWarm1B32K

FAME_FT_llama32-1b-10-instruct-qa

0
·
139
·
May 2026
longtermriskWarm8B32K

Qwen3-8B-target-only-no-hallucination-full

0
·
139
·
May 2026
cs-552-2026-ma-queWarm2B32K

math_model

0
·
139
·
May 2026
zhaohqWarm8B32K

PureRL-7B-v7-stage1-reasoning

0
·
139
·
May 2026
cs-552-2026-eminem-pWarm2B32K

group_model

0
·
139
·
May 2026
parkjoWarm8B32K

Qwen2.5-Math-7B_grpo_aspo_rollout_8_ent_0.0_kl_True_0.001_20260521_202036_step580

0
·
139
·
May 2026
OpenRubricsWarm8B32K

RubricARROW-8B-Judge

0
·
139
·
May 2026
New
maheshrawat18Warm8B32K

Qwen3-8B-sft

0
·
139
·
May 2026
New