Models

10,936
xw1234ganWarm2B32K

olympiads_Main_fixed_BaseAnchor_1_5B_step_10

0
·
191
·
Apr 2026
anuraagkalvaniWarm8B32K

tally-qwen-2.5-coder

1
·
191
·
Apr 2026
DCAgentWarm32B32K

g1_top8_diverse_10000_32b_seed123_step455__Qwen3-32B

0
·
191
·
May 2026
Bio-ShreeWarm8B32K

qwen2.5-7b-t1d-sft

0
·
191
·
May 2026
minchaoh2002Warm8B32K

Qwen3-8B-pragrest-outcome-0.8-qa-only-kl-0.02-lr-4e-6-2-no-easy-no-hard-vanilla-sft_step_20

0
·
191
·
May 2026
HyeongwonWarm2B32K

P2-split3_prob_Qwen3-1.7B-Base_0325-01

0
·
191
·
May 2026
zhaohqWarm2B32K

PureRL-1.5B-v7-stage1-reasoning

0
·
191
·
May 2026
HyeongwonWarm4B32K

P12-split3-one-sided-bs64-lr2e5-zero3-ep3

0
·
191
·
May 2026
jdineenWarm2B32K

qwen3_1p7b_gsm8k_vd075_grpo

0
·
191
·
May 2026
New
asdf345343Warm2B32K

pfpo-qwen3-1.7b-pfpo-diagonal-s42

0
·
190
·
Apr 2026
jaygala24Warm2B32K

Qwen3-1.7B-GRPO-math-reasoning

0
·
190
·
Apr 2026
AngelRaychevWarm800M32K

qwen3-0.6b-sciq-v9-seed7

0
·
190
·
Apr 2026
xuyeliu123Warm8B32K

swe-agent-lm-7b-num07-swesmith

0
·
190
·
Apr 2026
SreeharanWarm500M32K

INITIAL_TESTING

0
·
190
·
Apr 2026
yufeng1Warm8B32K

OpenThinker-7B-type6-e5-max-5e6-alpha0_5

0
·
190
·
Apr 2026
Hello2pariksitWarm8B32K

Qwen3-8B-neuron

0
·
190
·
Apr 2026
xw1234ganWarm2B32K

olympiads_Main_fixed_BaseAnchor_1_5B_step_8

0
·
190
·
Apr 2026
KyleyeeWarm2B32K

DrDPO_hh-seed5

0
·
190
·
Apr 2026
doupariWarm8B32K

llama3.1_8b_sft-llopa-k24-no_system-nemotron-math-high.math.q60000-llopa-k24-no_system

0
·
190
·
Apr 2026
Alelcv27Warm8B32K

Llama3.1-8B-Breadcrumbs-Test

0
·
190
·
Apr 2026
xw1234ganWarm3B32K

olympiads_Main_fixed_BaseAnchor_3B_step_2

0
·
190
·
Apr 2026
Alelcv27Warm3B32K

Qwen2.5-3B-Arcee-INST-Base

0
·
190
·
Apr 2026
CL-From-NothingWarm4B32K

Qwen3-4B-SSD-RLVE-Eval20-N20-global-step-500

0
·
190
·
Apr 2026
jackf857Warm8B32K

qwen3-8b-base-new-dpo-ultrafeedback-4xh200-batch-128-q_t-0.45-s_star-0.4

0
·
190
·
Apr 2026
cjiaoWarm2B32K

goldengoose-corr-v2-0.25-100

0
·
190
·
Apr 2026
Aakibkhan786Warm8B32K

DeepSeek-R1-Distill-Qwen-7B

0
·
190
·
Apr 2026
phinjazWarm4B32K

Qwen3-4B-Petari-RL-Merged-FP8-cp200

0
·
190
·
May 2026
EtashGuhaWarm32B32K

gptlong_openthoughts3_smoke__Qwen3-32B

0
·
190
·
May 2026
CreitinGameplaysWarm8B8K

tesy-0.3

0
·
190
·
May 2026
FinaPolatWarm8B32K

RAISED_QWEN_8B_GRPO

0
·
190
·
May 2026
cs-552-2026-AttentionSeekersWarm2B32K

general_knowledge_model

0
·
190
·
May 2026
HyeongwonWarm2B32K

P2-split4_prob_Qwen3-1.7B-Base_0325-01

0
·
190
·
May 2026
cs-552-2026-aatyWarm2B32K

math_model

0
·
190
·
May 2026
modrillWarm4B32K

code_think_x_qwen3_4b_base_sft

0
·
190
·
May 2026
HyeongwonWarm4B32K

P12-split4-one-sided-bs64-lr2e5-zero3-ep3

0
·
190
·
May 2026
grafWarm4B32K

science_4bmix_m32-3dded240-not_easy_1e-5_1200

0
·
190
·
May 2026
New
laabamoneWarm3B32K

laabam-ai-3b-v1

1
·
190
·
May 2026
New
simonyclWarm27B32K

gemma3_27b_persuasion_judge_0410

0
·
189
·
Apr 2026
FelixFesterWarm1B32K

Perverted_Literature-3.2-1B

1
·
189
·
Apr 2026
EphAsadWarm2B32K

AristaeusAgent

1
·
189
·
Apr 2026
grizzfuWarm24B32K

XortronCriminalComputingConfig

0
·
189
·
Apr 2026
zhangsq-njuWarm800M32K

Qwen3-0.6B-EdgeRazor-2.79bit

0
·
189
·
Apr 2026