Models

11,004
NalandadataWarm8B32K

nalanda-qwen-7b-grpo

1
·
201
·
Apr 2026
DCAgent2Warm32B32K

g1_top8_diverse_100000_32b_step2400__Qwen3-32B

0
·
201
·
May 2026
yufeng1Warm8B32K

OpenThinker-7B-type6-e1-max-alpha0_3125-2

0
·
201
·
Apr 2026
EtashGuhaWarm32B32K

tezos100k_continue_top8diverse100k_step2700__Qwen3-32B

0
·
201
·
May 2026
EtashGuhaWarm32B32K

g1_top8_85k_gptlong_swegym_32b_step4425__Qwen3-32B

0
·
201
·
May 2026
EtashGuhaWarm32B32K

tezos100k_continue_gptlongtezos_step2700__Qwen3-32B

0
·
201
·
May 2026
cjiaoWarm2B32K

goldengoose-high_div_rand_polar-25grp

0
·
201
·
May 2026
modrillWarm4B32K

kodcode_3_qwen3_4b_sft

0
·
201
·
May 2026
Alelcv27Warm8B8K

Llama3.1-8B-Base-DataMerged

0
·
200
·
Apr 2026
songphucn7Warm800M32K

PBoC-rrk-ctq-v1-epoch-0

0
·
200
·
Apr 2026
W-61Warm8B8K

llama-3-8b-base-new-dpo-hh-harmless-4xh200-batch-64-q_t-0.45-s_star-0.4-eta-0.5

0
·
200
·
Apr 2026
kmseongWarm7B4K

llama2_7b_chat-SSFT-AGNEWS-FT-safety-mix-0.1-lr3e-5

0
·
200
·
Apr 2026
xw1234ganWarm3B32K

olympiads_Main_fixed_BaseAnchor_3B_step_10

0
·
200
·
Apr 2026
noenoenoe123Warm500M32K

Qwen2.5-0.5B-Instruct

0
·
200
·
Apr 2026
ItBeMeAgainWarm2B32K

qwen2.5-abliterated_1.5B_Instruct

0
·
200
·
Apr 2026
pkupieWarm2B32K

Qwen2.5-1.5B-bo-cpt

0
·
200
·
Apr 2026
xw1234ganWarm2B32K

SFT_Qwen2.5-1.5B-Instruct_olympiads

0
·
200
·
Apr 2026
EtashGuhaWarm32B32K

tezos100k_continue_top8diverse100k_step3000__Qwen3-32B

0
·
200
·
May 2026
Mangara01Warm500M32K

legal-chatbot-grpo

0
·
200
·
May 2026
cs-552-2026-vibe-trainersWarm2B32K

safety_model

0
·
200
·
May 2026
zhaohqWarm2B32K

PureRL-1.5B-v7-s2-l1-maskoff

0
·
200
·
May 2026
jdineenWarm4B32K

qwen3_4b_gsm8k_baseline_grpo

0
·
200
·
May 2026
New
jackf857Warm8B32K

qwen3-8b-base-margin-dpo-hh-harmless-4xh200-batch-64-20260423-234249

0
·
199
·
Apr 2026
MCult01Warm9B32K

glm-muse-feral-v4

0
·
199
·
Apr 2026
W-61Warm8B8K

llama-3-8b-base-new-dpo-hh-harmless-4xh200-batch-64-s_star-0.4-eta-0.1-q_t-0.5

0
·
199
·
Apr 2026
xw1234ganWarm2B32K

olympiads_Main_fixed_BaseAnchor_1_5B_step_7

0
·
199
·
Apr 2026
pkupieWarm3B32K

Qwen2.5-3B-kk-cpt

0
·
199
·
Apr 2026
Alelcv27Warm3B32K

Qwen2.5-3B-Arcee-Base-INST

0
·
199
·
Apr 2026
W-61Warm8B8K

llama3-hh-helpful-qt045-b0p05-20260429-085449

0
·
199
·
Apr 2026
laionWarm8B32K

sera-subset-mixed-10000-axolotl__Qwen3-8B-v8

0
·
199
·
Apr 2026
DCAgent2Warm32B32K

g1_top8_diverse_100000_32b_step1500__Qwen3-32B

0
·
199
·
May 2026
synapticstudioWarm14B32K

rxcortix-qwen3-14b-merged

0
·
199
·
May 2026
lewtunWarm800M32K

qwen3-0.6b-capybara-sft

0
·
199
·
May 2026
EtashGuhaWarm32B32K

tezos100k_continue_top8diverse100k_step3900__Qwen3-32B

0
·
199
·
May 2026
modrillWarm4B32K

math_think_11_qwen3_4b_base_sparsemerge

0
·
199
·
May 2026
Kazuki1450Warm2B32K

Qwen3-1.7B-Base_csum_6_10_1p0_0p0_1p0_grpo_42_rule

0
·
198
·
Mar 2026
MCult01Warm9B32K

glm-muse-feral-v5

0
·
198
·
Apr 2026
shubhamrgandhiWarm8B32K

qwen3-8b-full-sft-prm-opus-distill-32k-lr5e6-flattened

0
·
198
·
Apr 2026
123yaroslavWarm500M32K

Qwen2.5-0.5B-Instruct-abliterated-ru

0
·
198
·
Apr 2026
xw1234ganWarm3B32K

olympiads_Main_fixed_BaseAnchor_3B_step_4

0
·
198
·
Apr 2026
W-61Warm8B8K

llama-3-8b-base-new-dpo-hh-helpful-4xh200-batch-64-q_t-0.45-eta-0.1-s_star-0.45-20260428-045924

0
·
198
·
Apr 2026
W-61Warm8B8K

llama3-hh-harmless-qt045-b0p8-20260429-085449

0
·
198
·
Apr 2026