Models

11,014
bryordasWarm8B32K

v041-R1h

0
·
163
·
May 2026
HyeongwonWarm4B32K

P12-split2-one-sided-bs64-lr2e5-zero3-ep3

0
·
163
·
May 2026
jaygala24Warm2B32K

Qwen3-1.7B-GRPO-math-reasoning

0
·
162
·
Apr 2026
arunasankWarm9B16K

4s7l8vvt

0
·
162
·
Apr 2026
EntritWarm8B32K

Qwen2.5-7B-qat-d2-6k

0
·
162
·
Apr 2026
EntritWarm33B32K

Qwen2.5-32B-trit-uniform-d4

0
·
162
·
Apr 2026
EtashGuhaWarm32B32K

tezos100k_continue_tezos_step2700__Qwen3-32B

0
·
162
·
May 2026
Leonora123Warm3B32K

legal-assistant

0
·
162
·
May 2026
jiogenesWarm8B8K

llama-3.1-8b-r256-als-random-qres8

0
·
162
·
May 2026
meteorainWarm4B32K

Qwen_Qwen3-4B-Thinking-2507_PTQ_AWQ_INT3-asym_qwen3-random-tokens

0
·
162
·
May 2026
omron-sinicxWarm500M32K

DGPO-qwen2.5-0.5b

0
·
161
·
Mar 2026
EntritWarm73B32K

Qwen2.5-72B-trit-uniform-d2

0
·
161
·
Apr 2026
meteorainWarm4B32K

Qwen_Qwen3-4B-Thinking-2507_nvfp4-ts_qwen3-random-tokens_2048_8_1024_256_lr0.03

0
·
161
·
May 2026
meteorainWarm4B32K

Qwen_Qwen3-4B-Thinking-2507_fp3-e1m1_openr1-default-concat_2048_8_1024_256_lr0.03

0
·
161
·
May 2026
lllqaqWarm8B32K

Qwen2.5-Coder-7B-fim-v2-filtered-0316

0
·
161
·
Mar 2026
daredevil467Warm4B32K

hanoi-router-qwen3-4b-v7-1

0
·
161
·
May 2026
prexpertWarm32B32K

affine-144-5E7eCacdMZZG7n5RwRAAQQmYfxxEkktfkXgZ5DpG7TY81W33

0
·
161
·
May 2026
BetswishWarm4B32K

seed0_xcsqa_google-gemma-3-4b-it_multi_0.1_MAPO_5e-06

0
·
161
·
May 2026
AIPlansWarm1B2K

TinyLlama-1.1B-IPO-PKU-SafeRLHF

0
·
161
·
May 2026
hjshWarm2B32K

qwen2.5_math_1.5b_grpo_rollout_8_w_o_KL_step150

0
·
161
·
May 2026
longtermriskWarm8B32K

Qwen3-8B-bad-medical-last-third

0
·
161
·
May 2026
nmpavelWarm9B16K

kanoon-gemma-2-9b

0
·
161
·
May 2026
zhaohqWarm2B32K

PureRL-1.5B-v7-s2-l2-maskon-afew

0
·
161
·
May 2026
SvalTekWarm12B32K

SOR-ColdBrew-12B-Base-Testing

0
·
161
·
May 2026
f0rc3psWarm8B32K

Qwen2.5-7B

0
·
160
·
Apr 2026
yunhowhourWarm4B32K

Qwen3-4B_CRRL_batch_1024_B200_w_o_global_norm_step_60

0
·
160
·
May 2026
EtashGuhaWarm32B32K

gptlong_continue_top8diverse100k_step4200__Qwen3-32B

0
·
160
·
May 2026
PS4ResearchWarm8B8K

wG9rV4sK1mQ7wE6a

0
·
160
·
May 2026
meteorainWarm4B32K

Qwen_Qwen3-4B-Thinking-2507_PTQ_AWQ_INT3-asym_qwen3-cot-traces

0
·
160
·
May 2026
dongbokleeWarm15B32K

gPRM-14B-3-merged

0
·
160
·
May 2026
jiogenesWarm8B8K

llama-3.1-8b-r512-gd-random-qres8

0
·
160
·
May 2026
zhaohqWarm8B32K

PureRL-7B-v7-s2-corr-maskon

0
·
160
·
May 2026
HyeongwonWarm3B32K

P2-split3_prob_Llama-3.2-3B-Base_0524-1

0
·
160
·
May 2026
dongbokleeWarm15B32K

gPRM-14B-5-merged

0
·
160
·
May 2026
dongbokleeWarm15B32K

gPRM-14B-4-merged

0
·
160
·
May 2026
teolm30Warm2B32K

fox-1.6

0
·
160
·
May 2026
New
tianyuxuelang1656Warm2B32K

DeepSeek-R1-Distill-Qwen-1.5B-GRPO

0
·
159
·
May 2026
meteorainWarm4B32K

Qwen_Qwen3-4B-Thinking-2507_int4-g128_qwen3-random-tokens_2048_8_1024_256_lr0.03

0
·
159
·
May 2026
meteorainWarm4B32K

Qwen_Qwen3-4B-Thinking-2507_PTQ_AWQ_INT3-asym_openr1-math

0
·
159
·
May 2026
meteorainWarm4B32K

Qwen_Qwen3-4B-Thinking-2507_PTQ_AWQ_INT3-asym_c4

0
·
159
·
May 2026
cs-552-2026-moritaliansWarm2B32K

safety_model

0
·
159
·
May 2026
zhaohqWarm8B32K

PureRL-7B-v7-stage1-reasoning-qa

0
·
159
·
May 2026