Models

3,126
EtashGuhaWarm32B32K

fresh_gptlongtezos_step2400__Qwen3-32B

0
·
192
·
May 2026
harsha070Warm3B32K

expfinal-qwen-mbpp-s42-lambda-0p20

0
·
192
·
May 2026
DawnLiuWarm8B32K

SDRL-freq-8B

0
·
192
·
May 2026
zhaohqWarm2B32K

PureRL-1.5B-v6i-A-step01-final01

0
·
192
·
May 2026
redityaaWarm8B32K

Qwen3-8B-v1-Full

0
·
192
·
May 2026
DCAgentWarm32B32K

g1_top8_diverse_10000_32b_seed123_step455__Qwen3-32B

0
·
191
·
May 2026
Bio-ShreeWarm8B32K

qwen2.5-7b-t1d-sft

0
·
191
·
May 2026
minchaoh2002Warm8B32K

Qwen3-8B-pragrest-outcome-0.8-qa-only-kl-0.02-lr-4e-6-2-no-easy-no-hard-vanilla-sft_step_20

0
·
191
·
May 2026
HyeongwonWarm2B32K

P2-split3_prob_Qwen3-1.7B-Base_0325-01

0
·
191
·
May 2026
zhaohqWarm2B32K

PureRL-1.5B-v7-stage1-reasoning

0
·
191
·
May 2026
HyeongwonWarm4B32K

P12-split3-one-sided-bs64-lr2e5-zero3-ep3

0
·
191
·
May 2026
jdineenWarm2B32K

qwen3_1p7b_gsm8k_vd075_grpo

0
·
191
·
May 2026
New
phinjazWarm4B32K

Qwen3-4B-Petari-RL-Merged-FP8-cp200

0
·
190
·
May 2026
EtashGuhaWarm32B32K

gptlong_openthoughts3_smoke__Qwen3-32B

0
·
190
·
May 2026
CreitinGameplaysWarm8B8K

tesy-0.3

0
·
190
·
May 2026
FinaPolatWarm8B32K

RAISED_QWEN_8B_GRPO

0
·
190
·
May 2026
cs-552-2026-AttentionSeekersWarm2B32K

general_knowledge_model

0
·
190
·
May 2026
HyeongwonWarm2B32K

P2-split4_prob_Qwen3-1.7B-Base_0325-01

0
·
190
·
May 2026
cs-552-2026-aatyWarm2B32K

math_model

0
·
190
·
May 2026
modrillWarm4B32K

code_think_x_qwen3_4b_base_sft

0
·
190
·
May 2026
HyeongwonWarm4B32K

P12-split4-one-sided-bs64-lr2e5-zero3-ep3

0
·
190
·
May 2026
grafWarm4B32K

science_4bmix_m32-3dded240-not_easy_1e-5_1200

0
·
190
·
May 2026
New
laabamoneWarm3B32K

laabam-ai-3b-v1

1
·
190
·
May 2026
New
kmseongWarm7B4K

llama2_7b_chat-SSFT-MEDQA-FT-lr3e-5

0
·
189
·
Apr 2026
W-61Warm8B32K

qwen3-8b-base-new-dpo-ultrafeedback-4xh200-batch-128-q_t-0.45-s_star-0.45-20260430-143919

0
·
189
·
Apr 2026
W-61Warm8B32K

qwen3-8b-base-new-dpo-ultrafeedback-4xh200-batch-128-q_t-0.43-s_star-0.3-20260430-192039

0
·
189
·
Apr 2026
songphucn7Warm800M32K

PBoC-rrk-ctq-v1.01-epoch-1

0
·
189
·
Apr 2026
1010happyWarm2B32K

AmongUsModels

0
·
189
·
May 2026
MAM007Warm4B32K

medical-asr-qwen3-4b-merged

0
·
189
·
May 2026
vxkyyyWarm33B32K

vlsi-moe-ffn-merged-formal

0
·
189
·
May 2026
jiogenesWarm8B8K

llama-3.1-8b-r1536-als-random-qres1

0
·
189
·
May 2026
PS4ResearchWarm24B32K

qa-sft-magistral-24b

0
·
189
·
May 2026
zhaohqWarm2B32K

PureRL-1.5B-v6d2-lam01-identity-maskon-acc05

0
·
189
·
May 2026
raalrWarm2B32K

Qwen2.5-1.5B-Instruct-dskdv2-Qwen

0
·
188
·
Apr 2026
DCAgent2Warm32B32K

g1_top8_diverse_100000_32b_step2700__Qwen3-32B

0
·
188
·
May 2026
weedyweedWarm32B32K

affine-33-5Fq9rRY3Zyrjnw7TQYQ8zeuh72cpTUevAxoV32RseH24qDDd

0
·
188
·
May 2026
W-61Warm8B32K

qwen3-8b-base-new-dpo-ultrafeedback-4xh200-batch-128-q_t-0.45-s_star-0.5-20260430-194457

0
·
188
·
Apr 2026
Jeffcck1113Warm3B32K

qwen2.5-3b-interview-kit-generation

0
·
188
·
May 2026
meteorainWarm4B32K

Qwen_Qwen3-4B-Thinking-2507_int3-g16-fp8_qwen3-traces-cot-concat_2048_8_1024_256_lr0.1

0
·
188
·
May 2026
jiogenesWarm8B8K

llama-3.1-8b-r1024-als-random-qres4

0
·
188
·
May 2026
zhaohqWarm2B32K

PureRL-1.5B-v6b2-detailed-fmt01

0
·
188
·
May 2026
modrillWarm4B32K

math_think_11_qwen3_4b_base_task_arithmetic_scaling_0_1

0
·
188
·
May 2026