Models

11,000
parkjoWarm8B32K

Qwen2.5-Math-7B_grpo_adv_rollout_8_step580

0
·
67
·
May 2026
wvnvwnWarm9B16K

gemma-2-9b-it-lr3e-5-safedelta-scale0.5

0
·
67
·
May 2026
cosmos1030Warm800M32K

c1899de289a04d12100db370d81485cdf75e47ca-elsa-hybrid-kd-s40pct-lr5e-5-lmda5e-3

0
·
67
·
Apr 2026
kmseongWarm7B4K

Llama-2-7b-chat-hf_gsm8k_ft_freeze_rotation_space_sn_lr5e-5

0
·
67
·
May 2026
Jihyung803Warm14B32K

Qwen3-14B-PragReST-FullFT

0
·
67
·
May 2026
RUNE-CTZWarm32B32K

affine-5GzstXe9YaSTgb8TJWiV7KrP4Sb7cjz1ZRQrCRAHLgN49zHa

0
·
67
·
May 2026
lstenoWarm4B32K

Qwen3-4B-Instruct-2507-RLM-SFT-v3-per-root-turn

0
·
67
·
May 2026
kairawalWarm4B32K

Gemma-3-4B-IT-ES-SynthDolly-r16alpha128-E8-S73

0
·
67
·
May 2026
gradients-io-tournamentsWarm1B32K

tournament-tourn_d735329f8ba0f486_20260521-b68ef8e5-8a36-4cff-bee7-0d49f5fd7215-5Et76g7Y

0
·
67
·
May 2026
amulyaparthasarathyWarm500M32K

rloo-d2-replay

0
·
67
·
May 2026
New
JeesupWarm1B32K

tofu_1B_f10_RMU_lr1e-4_sc5

0
·
67
·
May 2026
JeesupWarm1B32K

tofu_1B_f10_NPO_lr1e-5_b1.0

0
·
67
·
May 2026
JeesupWarm1B32K

tofu_1B_f10_NPO_lr3e-5_b0.1

0
·
67
·
May 2026
wtqiuWarm4B32K

DimMem-4B-Locomo

0
·
67
·
May 2026
tenny-friWarm32B32K

affine-5EeCiLoXvib4RSv2wXbA8T1ye5BdSJULecZkGbPMDcFVxtei

0
·
67
·
May 2026
everest12Warm32B32K

affine-11-5FWqMvezNW1wvNDH3QFCcz5zAhvjt3kED4DJhGtiuirJ8xEa

0
·
67
·
May 2026
tenny-friWarm32B32K

affine-5H1R47zbdZo2gRVSTuQf3eok4jFpA86DArpjPTHMbyPAbr6Y

0
·
67
·
May 2026
moos124Warm3B32K

finetuned-qwen-2.5-coder-3b

0
·
67
·
May 2026
emmanuelaboah01Warm4B32K

qiu-v8-qwen3-4b-stage3-hard-4epoch-merged

0
·
66
·
Mar 2026
ShahriarFerdoushWarm13B4K

llama2-13b-instruct-code-obf-merged

0
·
66
·
Mar 2026
sebastian328Warm70B32K

llama-3.3-70b-soap-sleeper-agent-full-finetune-long-step-2948

0
·
66
·
Apr 2026
kmseongWarm3B32K

llama3.2-3b-WaRP-utility-basis-safety-FT-non-freeze-lr5e-5

0
·
66
·
Apr 2026
V3N0MWarm4B32K

Aisha-Qwen-Uncensored

1
·
66
·
Apr 2026
RemonsterWarm8B8K

vikhr-pikabu-0.1

0
·
66
·
Apr 2026
heyalexchoiWarm2B32K

qwen3-1.7b-math-grpo

0
·
66
·
Apr 2026
rafacaliforniaWarm2B32K

qwen3-1.7b-avap

0
·
66
·
Apr 2026
pltopsWarm8B32K

qwen2_7B-ultrachatfeedback-self-wspo

0
·
66
·
Apr 2026
wvnvwnWarm9B16K

gemma-2-9b-it-lr3e-5-safedelta-scale0.8

0
·
66
·
May 2026
parkjoWarm2B32K

qwen2.5_math_1.5b_grpo_aspo_rollout_8

0
·
66
·
Apr 2026
ferrazzipietroWarm8B32K

unsup-Qwen3-8B-datav3-only_mask_w_item_mesh

0
·
66
·
May 2026
Sudarshan1607Warm1B32K

ddp-llama32-1b-ultrachat

0
·
66
·
May 2026
Srr1234Warm1B2K

tinyllama-qlora-chatbot

0
·
66
·
May 2026
ikimyaiiWarm7B4K

llama-7b-obs-cancel-block-40pct

0
·
66
·
May 2026
ikimyaiiWarm7B4K

llama-7b-obs-cancel-block-60pct

0
·
66
·
May 2026
ikimyaiiWarm7B4K

llama-7b-sparsegpt-80pct

0
·
66
·
May 2026
minchaoh2002Warm8B32K

Qwen3-8B-pragrest-no-easy-grpo-FullFT3-previous-data_step_15

0
·
66
·
May 2026
void-818Warm32B32K

Affine-qwen3_4-5ChyqiPhpAzA4CT8fqfSPJsktwWeN9wvrhkUPcU6bqpFqL8Q

0
·
66
·
May 2026
howardtodd635Warm32B32K

Affine-top8-5CVA4R9cgoWchN34NZwkA6aWMfHJAbidwGY3NtaDw6TeJXL4

0
·
66
·
May 2026
howardtodd635Warm32B32K

Affine-top7-5DhbP6kCyd8yNRvHZKg48ungD57npeEfuiFR3BNLvJGTaEBV

0
·
66
·
May 2026
JeesupWarm1B32K

tofu_Llama-3.2-1B-Instruct_forget10_SimNPO_qat-int4

0
·
66
·
May 2026
wvnvwnWarm7B4K

Mistral-7B-Instruct-v0.3-flora-v0

0
·
66
·
May 2026
kairawalWarm4B32K

Gemma-3-4B-IT-EN-SynthDolly-r16alpha128-E5-S73

0
·
66
·
May 2026