Models

3,137
kairawalWarm32B32K

Qwen3-32B-EN-SynthDolly-r16alpha32-E5-S73

0
·
202
·
May 2026
Briangil1Warm800M32K

CS6810-E01-S26

0
·
201
·
Apr 2026
DCAgent2Warm32B32K

g1_top8_diverse_100000_32b_step2400__Qwen3-32B

0
·
201
·
May 2026
yufeng1Warm8B32K

OpenThinker-7B-type6-e1-max-alpha0_3125-2

0
·
201
·
Apr 2026
EtashGuhaWarm32B32K

tezos100k_continue_top8diverse100k_step2700__Qwen3-32B

0
·
201
·
May 2026
EtashGuhaWarm32B32K

g1_top8_85k_gptlong_swegym_32b_step4425__Qwen3-32B

0
·
201
·
May 2026
EtashGuhaWarm32B32K

tezos100k_continue_gptlongtezos_step2700__Qwen3-32B

0
·
201
·
May 2026
cjiaoWarm2B32K

goldengoose-high_div_rand_polar-25grp

0
·
201
·
May 2026
modrillWarm4B32K

kodcode_3_qwen3_4b_sft

0
·
201
·
May 2026
songphucn7Warm800M32K

PBoC-rrk-ctq-v1-epoch-0

0
·
200
·
Apr 2026
kmseongWarm7B4K

llama2_7b_chat-SSFT-AGNEWS-FT-safety-mix-0.1-lr3e-5

0
·
200
·
Apr 2026
xw1234ganWarm3B32K

olympiads_Main_fixed_BaseAnchor_3B_step_10

0
·
200
·
Apr 2026
noenoenoe123Warm500M32K

Qwen2.5-0.5B-Instruct

0
·
200
·
Apr 2026
xw1234ganWarm2B32K

SFT_Qwen2.5-1.5B-Instruct_olympiads

0
·
200
·
Apr 2026
EtashGuhaWarm32B32K

tezos100k_continue_top8diverse100k_step3000__Qwen3-32B

0
·
200
·
May 2026
Mangara01Warm500M32K

legal-chatbot-grpo

0
·
200
·
May 2026
cs-552-2026-vibe-trainersWarm2B32K

safety_model

0
·
200
·
May 2026
zhaohqWarm2B32K

PureRL-1.5B-v7-s2-l1-maskoff

0
·
200
·
May 2026
jdineenWarm4B32K

qwen3_4b_gsm8k_baseline_grpo

0
·
200
·
May 2026
New
DCAgent2Warm32B32K

g1_top8_diverse_100000_32b_step1500__Qwen3-32B

0
·
199
·
May 2026
synapticstudioWarm14B32K

rxcortix-qwen3-14b-merged

0
·
199
·
May 2026
lewtunWarm800M32K

qwen3-0.6b-capybara-sft

0
·
199
·
May 2026
EtashGuhaWarm32B32K

tezos100k_continue_top8diverse100k_step3900__Qwen3-32B

0
·
199
·
May 2026
modrillWarm4B32K

math_think_11_qwen3_4b_base_sparsemerge

0
·
199
·
May 2026
WasamiKiruaWarm12B32K

Sakura-Sniper-12B

0
·
198
·
Apr 2026
DCAgentWarm32B32K

g1_top8_diverse_100000_32b_step900__Qwen3-32B

0
·
198
·
May 2026
LorenaYannnnnWarm800M32K

Qwen3-0.6B-OURS_self-g_general_reward_e_sycophancy_keep_last-100-tokens_w3-seed_0

0
·
198
·
May 2026
ConnorYUWarm14B32K

qwen3-14b-insecure

0
·
198
·
May 2026
SvalTekWarm8B8K

L3-CharThink-Base-Test1

0
·
198
·
May 2026
New
EphAsadWarm3B32K

Mnemosyne-3B

0
·
198
·
May 2026
New
yufeng1Warm8B32K

OpenThinker-7B-type6-e5-max-1e5-alpha0_4990234375-2

0
·
197
·
Apr 2026
yufeng1Warm8B32K

OpenThinker-7B-type6-e5-max-5e6-alpha0_5-2

0
·
197
·
Apr 2026
pltopsWarm8B32K

qwen2_7B-ultrachatfeedback-self-wspo-20260429-203905

0
·
197
·
Apr 2026
parkjoWarm8B32K

Qwen2.5-Math-7B_grpo_adv_rollout_8_step580

0
·
197
·
May 2026
sstoica12Warm3B32K

acquisition_llama-3_2-3b_bins_numina_proximity

0
·
197
·
Apr 2026
kmseongWarm7B4K

llama2_7b_chat-WaRP-original-space-gsm8k-lr5e-5

0
·
197
·
May 2026
LorenaYannnnnWarm800M32K

Qwen3-0.6B-g_general_reward-seed_0

0
·
197
·
May 2026
AksaraLLMWarm500M32K

Kiel-Pro-0.5B-v3-chat

0
·
197
·
May 2026
EtashGuhaWarm32B32K

tezos100k_continue_tezos_step3000__Qwen3-32B

0
·
197
·
May 2026
EtashGuhaWarm32B32K

tezos100k_continue_tezos_step2400__Qwen3-32B

0
·
197
·
May 2026
EtashGuhaWarm32B32K

gptlong_continue_top8diverse100k__Qwen3-32B

0
·
197
·
May 2026
AK13568Warm8B8K

Project-Nexus

0
·
197
·
May 2026