Models

3,085
arkodaWarm8B32K

arkoda-7b-v7-14

0
·
141
·
May 2026
Minhhltse150305Warm800M32K

qwen3-0.6b-SFTchat_math_dpo2

0
·
141
·
May 2026
PS4ResearchWarm8B8K

hT4cR9mL6pF2gB7d

0
·
141
·
May 2026
directorcreatorWarm7B4K

creativeheadsenior-merged

0
·
141
·
May 2026
usr256864Warm7B4K

ee_gol_grp_f1_form_wo_ns

0
·
141
·
May 2026
RislantrsWarm8B8K

meta-llama-3.1-Indo-Legal-GRPO

0
·
141
·
May 2026
longtermriskWarm8B32K

Llama-3.1-8B-bad-medical-full

0
·
141
·
May 2026
kairawalWarm14B32K

Qwen3-14B-EN-SynthDolly-r16alpha32-E1-S73

0
·
141
·
May 2026
penginlabsWarm2B32K

YOLO-Coder-1.5B

0
·
141
·
May 2026
kairawalWarm14B32K

Qwen3-14B-EN-SynthDolly-r16alpha32-E3-S73

0
·
141
·
May 2026
kmseongWarm8B32K

llama3.1-8b-base-warp-gsm8k-lr1e-5

0
·
140
·
May 2026
Mic-FundraiserWarm3B32K

fundraising-assistant

0
·
140
·
May 2026
meteorainWarm4B32K

Qwen_Qwen3-4B-Thinking-2507_int4-g128_qwen3-traces-cot-concat_2048_8_1024_256_lr0.1

0
·
140
·
May 2026
meteorainWarm4B32K

Qwen_Qwen3-4B-Thinking-2507_fp3-e2m0_qwen3-traces-cot-concat_2048_8_1024_128_lr0.05

0
·
140
·
May 2026
Alelcv27Warm3B32K

Qwen2.5-3B-Base-Math-v4

0
·
140
·
May 2026
farmertakeoverWarm8B32K

hermes-deepseek-strict-800

0
·
140
·
May 2026
iamdagoWarm8B32K

arnav-shetty-2.0

0
·
140
·
May 2026
JincenziWarm4B32K

SocialR1-4B

0
·
140
·
May 2026
ConnorYUWarm4B32K

qwen3-4b-insecure

0
·
140
·
May 2026
ConnorYUWarm8B32K

qwen3-8b-insecure-v5

0
·
140
·
May 2026
parkjoWarm2B32K

grpo_adv_rollout_8_20260513_123609_USE_KL_True_step580

0
·
140
·
May 2026
longtermriskWarm8B32K

Qwen3-8B-reward-hacks-full

0
·
140
·
May 2026
longtermriskWarm8B32K

Llama-3.1-8B-good-vs-bad-mixed-full

0
·
140
·
May 2026
zhaohqWarm2B32K

PureRL-1.5B-v7-stage1-B-analysis

0
·
140
·
May 2026
jiogenesWarm8B8K

llama-3.1-8b-r1536-gd-random-qres4

0
·
140
·
May 2026
wvnvwnWarm7B4K

Mistral-7B-Instruct-v0.3-fedavg-v0

0
·
140
·
May 2026
DCAgent2Warm32B32K

fresh_gptlongtezos_step900__Qwen3-32B

0
·
139
·
May 2026
meteorainWarm4B32K

Qwen_Qwen3-4B-Thinking-2507_int4-g128_qwen3-traces-cot-concat_2048_8_1024_128_lr0.05

0
·
139
·
May 2026
meteorainWarm4B32K

Qwen_Qwen3-4B-Thinking-2507_int4-g16-fp8_qwen3-traces-cot-concat_2048_8_1024_128_lr0.05

0
·
139
·
May 2026
2stacksWarm4B32K

gemma3-4b-it-comedy-v2

0
·
139
·
May 2026
jiogenesWarm8B8K

llama-3.1-8b-r256-als-random-qres1

0
·
139
·
May 2026
SeongryongJungWarm4B32K

powerplantbench-qwen3-4b-full-sft-cot

0
·
139
·
May 2026
ishikaaWarm8B32K

UAS_qwen7b_only_alpaca_minimax

0
·
139
·
May 2026
jiogenesWarm8B8K

llama-3.1-8b-r256-gd-random

0
·
139
·
May 2026
yug311Warm8B8K

llama-finetuned

0
·
139
·
May 2026
longtermriskWarm8B32K

Qwen3-8B-target-only-no-hallucination-full

0
·
139
·
May 2026
longtermriskWarm8B32K

Qwen3-8B-reward-hacks-first-third

0
·
139
·
May 2026
cs-552-2026-ma-queWarm2B32K

math_model

0
·
139
·
May 2026
cs-552-2026-eminem-pWarm2B32K

group_model

0
·
139
·
May 2026
parkjoWarm8B32K

Qwen2.5-Math-7B_grpo_aspo_rollout_8_ent_0.0_kl_True_0.001_20260521_202036_step580

0
·
139
·
May 2026
zhaohqWarm2B32K

PureRL-1.5B-v7-s2-l2-kl-w1-b1

0
·
139
·
May 2026
jiogenesWarm8B8K

llama-3.1-8b-r1792-gd-random-qres4

0
·
139
·
May 2026