Models

14,485
koutchWarm8B32K

paper_llama_llama3.1-8b_train_sft_train_no_think

0
·
0
·
Jan 2026
pittawatWarm8B32K

rl-scaling-rft-qwen-2.5-7b-instruct-grpo-long-reasoning

0
·
0
·
Jan 2026
JubilantWarm4B32K

Affine-43-5DAQHQxBAzJxH7rKzMfN3vakMmSU4pj1FJ5fzNk1S9Jk8r4n

0
·
0
·
Jan 2026
annasoliWarm27B32K

gemma3-27b-sft-last20-3ep-merged

0
·
0
·
Jan 2026
asingh15Warm4B32K

rl-4b-arc-abstractions-judge-unnorm-nothink-deltarerun-step180-0116

0
·
0
·
Jan 2026
asingh15Warm4B32K

rl-4b-arc-abstractions-embedding-nothink-deltarerun-step60-0116

0
·
0
·
Jan 2026
ElfsongWarm32B32K

VLM_stage_2_iter_0001000

0
·
0
·
Jan 2026
affinierWarm14B32K

affine-03-5HdrZvF7hgsc5AFUgHZ8BfiCyEidh7Lo7cUykdgjbCVU7tAJ

0
·
0
·
Jan 2026
ElfsongWarm32B32K

VLM_stage_2_iter_0002000

0
·
0
·
Jan 2026
ggg-llms-teamWarm2B32K

TuQwen3-LR8e5-irm

0
·
0
·
Jan 2026
g-assismoraesWarm4B32K

Qwen3-4B-CCC-irm-InstThink

0
·
0
·
Jan 2026
g-assismoraesWarm4B32K

Qwen3-4B-CCC-irm-SafeRL

0
·
0
·
Jan 2026
AnastasiaFantasyWarm4B32K

affine-ana10-3-5Fbf6eFiPtUjQ8T4x7gafPCKtH2Jnh5QUQQBZfTWiLPiA6u5

0
·
0
·
Jan 2026
Kazuki1450Warm2B32K

Qwen3-1.7B-Base_csum_6_10_geq_6_geq_10_0p5_0p5_1p0_0p0_1p0_grpo_42_rule

0
·
0
·
Jan 2026
hex7777Warm14B32K

Affine-test7-5DvjPcGKnGgxBxgVEP78wxGm3YQzdQgPCZVMwsrwHCq4DMDE

0
·
0
·
Jan 2026
zycaliceWarm33B32K

qwen-coder-insecure-2-mlp_gate_wtrain_3

0
·
0
·
Jan 2026
Kazuki1450Warm2B32K

Qwen3-1.7B-Base_csum_6_10_geq_8_geq_8_0p25_1p0_1p0_0p0_1p0_grpo_42_rule

0
·
0
·
Jan 2026
colsonlenWarm500M32K

Qwen2.5-0.5B-Instruct-Gensyn-Swarm-sturdy_fleecy_chinchilla

0
·
0
·
Apr 2025
bespokelabsWarm8B32K

Qwen3-8B-ot_step80

0
·
0
·
Dec 2025
AnastasiaFantasyWarm4B32K

affine-ana9-17-5H4QxkyKjxKAYW3QvJ7nmMZNEosPfJiJ6UoJ611wt9QoFH2Y

0
·
0
·
Jan 2026
JRohnerWarm4B32K

affine-sxm-5Fk9K4EVdoAF2vHHWGE3QQpP5GG5YAz7kKHQVx7wNPszU4ah

0
·
0
·
Jan 2026
masaniWarm1B32K

SFT_DeepScaleR_Llama-3.2-1B_epoch_1_global_step_26

0
·
0
·
Jan 2026
HahmdongWarm8B32K

AT-qwen2.5-7b-hhrlhf-5120-dpo-ai-ver17-step-50-7.5e-6

0
·
0
·
Jan 2026
NotoriousH2Warm2B32K

qwen3-1.7b-base-MED-Instruct

0
·
0
·
Aug 2025
ParetoQaftWarm1B32K

1B-Tulu-LoRA-50pct

0
·
0
·
Nov 2025
lhkhiem28Warm2B32K

CORE-Qwen3-1.7B-MATH-A9-U-S-SG

0
·
0
·
Jan 2026
eekayWarm3B8K

gemma-2-2b-it-lion-numbers-ft

0
·
0
·
Jan 2026
HahmdongWarm8B32K

AT-qwen2.5-7b-hhrlhf-5120-dpo-ai-ver17-step-10

0
·
0
·
Jan 2026
LegendaryDawnWarm8B32K

erpo-iclr-baseline-Qwen2.5-7b-DAPO-step180

0
·
0
·
Oct 2025
arrowoneWarm500M32K

Qwen2.5-Coder-0.5B-Instruct-Gensyn-Swarm-meek_waddling_weasel

0
·
0
·
Nov 2025
aliorbzWarm500M32K

Qwen2.5-Coder-0.5B-Instruct-Gensyn-Swarm-chattering_downy_orangutan

0
·
0
·
Nov 2025
Srini18Warm8B32K

DeepSeek-R1-Medical-COT

0
·
0
·
Mar 2025
xxangWarm33B32K

AStar-Thought-QwQ-32B

1
·
0
·
May 2025
yasker00Warm8B32K

qwen3-8B-all-layer-random_13-selected-step180

0
·
0
·
Jan 2026
tomascoolerWarm14B32K

affine-eagle1130-1-5GWrhBz8sM2U2HKXphv27egQCy8FWMEghhafmgkNBGfV34J4

0
·
0
·
Jan 2026
JamesSandWarm2B32K

qwen1.7b-adam-reset-muon-lr-1e-6-fp64-global_step_200

0
·
0
·
Jan 2026
AiAsistentWarm8B32K

Llama-3.1-8B-Instruct-STO-Master

0
·
0
·
Jan 2026
micleowen02Warm4B32K

affine-crash-5CVLTzAwVNuFE6dsio9GDaZbVSGR67uHsk3BUEWCWPX7HLXH

0
·
0
·
Jan 2026
TarhanEWarm800M32K

sft-count_loss-Qwen3-0.6B-mle0.5-ul0.5-tox1.0-e4

0
·
0
·
Jun 2025
kadrgcWarm800M32K

Qwen3-0.6B-Gensyn-Swarm-stinging_tough_wallaby

0
·
0
·
Oct 2025
danggiaWarm500M32K

Qwen2.5-Coder-0.5B-Instruct-Gensyn-Swarm-pesty_ferocious_fish

0
·
0
·
Nov 2025
EdmondMillionWarm4B32K

affine-7-5EXDeevNLXBeWscrMYoCs9eNmfxiEd5tzSeR3DxkoDsZkiy7

0
·
0
·
Feb 2026