Models

11,001
zhaohqWarm8B32K

GRPO-7B-fmt03-math

0
·
204
·
May 2026
modrillWarm4B32K

code_no_think_X_qwen3_4b_base_sft

0
·
204
·
May 2026
Mohamed475Warm2B32K

qwen3-1.7b-full_sft-2

0
·
204
·
May 2026
W-61Warm8B32K

qwen3-8b-base-new-dpo-ultrafeedback-4xh200-batch-128-q_t-0.4-s_star-0.4-20260430-140517

0
·
203
·
Apr 2026
pkupieWarm2B32K

Qwen2.5-1.5B-mn-cpt

0
·
203
·
Apr 2026
ligaments-devWarm2B32K

Qwen-docsis-chatbot-model

0
·
203
·
Apr 2026
W-61Warm8B8K

llama3-hh-helpful-qt045-b0p3-20260429-085449

0
·
203
·
Apr 2026
DCAgent2Warm32B32K

g1_top8_gptlong_dist_31600_32b_step1410__Qwen3-32B

0
·
203
·
May 2026
kmseongWarm7B4K

llama2_7b_chat-arc-c-WaRP-lr5e-5

0
·
203
·
May 2026
DCAgent2Warm32B32K

fresh_gptlongtezos_step2100__Qwen3-32B

0
·
203
·
May 2026
EtashGuhaWarm32B32K

tezos100k_continue_gptlongtezos_step1800__Qwen3-32B

0
·
203
·
May 2026
EtashGuhaWarm32B32K

gptlong_continue_gptlongtezos_step3300__Qwen3-32B

0
·
203
·
May 2026
PS4ResearchWarm24B32K

dF7hY2sL9pB4gX8c

0
·
203
·
May 2026
zhaohqWarm2B32K

PureRL-1.5B-v5-06-mc2

0
·
203
·
May 2026
AbteeXAILabWarm8B8K

lumynax-longctx-prolong-512k-instruct

0
·
203
·
May 2026
zhaohqWarm2B32K

PureRL-1.5B-v7-s2-margin-maskoff

0
·
203
·
May 2026
mtcicero26Warm2B32K

fiberbrowser-copilot-1.5b-v1

0
·
203
·
May 2026
modrillWarm4B32K

math_no_think_17_qwen3_4b_base_sparsemerge

0
·
203
·
May 2026
wvnvwnWarm8B32K

qwen-2.5-7B-Resta-lr3e-5-scale0.3

0
·
202
·
Apr 2026
wvnvwnWarm8B32K

qwen-2.5-7B-Instruct-Resta-lr5e-5-scale0.3

0
·
202
·
Apr 2026
kmseongWarm3B32K

llama3_2_3b-instruct-math-safedelta-scale0.8

0
·
202
·
Apr 2026
ishikaaWarm3B32K

acquisition_qwen3bins_lmarena_diversity

0
·
202
·
Apr 2026
xw1234ganWarm3B32K

olympiads_Main_fixed_BaseAnchor_3B_step_8

0
·
202
·
Apr 2026
DCAgentWarm32B32K

g1_top8_gptlong_dist_31600_32b_step900__Qwen3-32B

0
·
202
·
May 2026
DCAgent2Warm32B32K

g1_top8_diverse_100000_32b_step3900__Qwen3-32B

0
·
202
·
May 2026
EtashGuhaWarm32B32K

gptlong_continue_nemotron_terminal_step1200__Qwen3-32B

0
·
202
·
May 2026
EtashGuhaWarm32B32K

tezos100k_continue_gptlongtezos_step2400__Qwen3-32B

0
·
202
·
May 2026
parkjoWarm8B32K

Llama-3.1-8B-Instruct_grpo_ppl_adv_resume_epoch10_20260427_162955_step232

0
·
202
·
May 2026
zhaohqWarm2B32K

PureRL-1.5B-v5-06-uentropy

0
·
202
·
May 2026
zhaohqWarm2B32K

PureRL-1.5B-v6d1-baseline-acc10

0
·
202
·
May 2026
zhaohqWarm2B32K

PureRL-1.5B-v7-s2-l2-maskoff

0
·
202
·
May 2026
kairawalWarm32B32K

Qwen3-32B-EN-SynthDolly-r16alpha32-E5-S73

0
·
202
·
May 2026
how3751Warm3B32K

Planner_3B_1.1

0
·
201
·
Apr 2026
yufeng1Warm8B32K

OpenThinker-7B-type6-e5-max-1e5-alpha0_4990234375

0
·
201
·
Apr 2026
Kanan2005Warm2B32K

clarify-rl-grpo-qwen3-1-7b-run6

0
·
201
·
Apr 2026
artemds45Warm500M32K

itmo-nlp-hw6-qwen2-5-0-5b-abliterated

0
·
201
·
Apr 2026
Briangil1Warm800M32K

CS6810-E01-S26

0
·
201
·
Apr 2026
CCCCCyxWarm8B32K

Qwen3-8B-onpolicy-profiling-gasd-20260425_153824

0
·
201
·
Apr 2026
waddieWarm500M32K

mini-1.5

0
·
201
·
Apr 2026
kmseongWarm3B32K

llama3_2_3b-instruct-math-safedelta-scale0.99

0
·
201
·
Apr 2026
kolerkWarm8B32K

tcod_7b_b2f

0
·
201
·
Apr 2026
pkupieWarm2B32K

Qwen2.5-1.5B-kk-cpt

0
·
201
·
Apr 2026