Models

14,755
MultiRLWarm2B32K

qwen3_1.7b_new_standard_C_sft_overfit_lr_5e_5__global_step_1184

0
·
3
·
Jan 2026
MultiRLWarm2B32K

qwen3_1.7b_new_standard_C_sft_overfit_lr_5e_5__global_step_296

0
·
3
·
Jan 2026
huseyinatahaninanWarm8B32K

appworld_distillation_sft_v2-SFT-Qwen3-8B

0
·
3
·
Jan 2026
ThrillcrazyerWarm8B32K

Qwen-7B_TAC_RLOO

0
·
3
·
Jan 2026
dogknowsAIWarm4B32K

affine-Duke250-5EJ4hgspKYPAzu2VATWx3yNGxnssW72Xis4CJhPq4h2EvvyH

0
·
3
·
Jan 2026
hkust-nlpWarm2B32K

Laser-DE-L4096-1.5B

0
·
3
·
May 2025
benstafWarm8B8K

pitinf_8b_identity-merged

0
·
3
·
Jan 2026
ibrahimenesduranWarm8B8K

Finfluencer-8B

0
·
3
·
Jan 2026
wetherbeepWarm14B32K

affine_h1_5FADnMAcCVQvKH9wM8odQY3E2zxS6TJ6ad1a3mna9ws6adrG

0
·
3
·
Jan 2026
hkust-nlpWarm2B32K

Laser-D-L2048-1.5B

0
·
3
·
May 2025
agsidd10Warm1B32K

llama-1b-sft-tldr

0
·
3
·
Sep 2025
teetoneWarm2B32K

OpenR1-Distill-Qwen3-1.7B-Math

0
·
3
·
Jan 2026
Zachary1150Warm2B32K

math_merge_linear_1.5B

0
·
3
·
Jan 2026
sangerno63Warm8B32K

affine-5FCJpxFbwsLbujy89cYAHzEUHBPem5xvPHHa6VHvX5xRHyZ6

0
·
3
·
Jan 2026
JetBrains-ResearchWarm14B32K

Qwen3-14B-am

0
·
3
·
May 2025
JetBrains-ResearchWarm32B32K

Qwen3-32B-am

0
·
3
·
May 2025
roy-0309Warm14B32K

Affine-1-5FNbAdWA9umLzLTpFwfsfybcEfS66jdcWoJTVhsJL6SXxofZ

0
·
3
·
Jan 2026
MultiRLWarm2B32K

qwen3_1.7b_rush_hour_multi_move_final

0
·
3
·
Jan 2026
henilp105Warm8B32K

InjecAgent-Llama-3.1-8B-Instruct-optim-5

0
·
3
·
Nov 2024
henilp105Warm8B32K

InjecAgent-Llama-3.1-8B-Instruct-optim-10

0
·
3
·
Nov 2024
hmdmahdaviWarm4B32K

olympiad-curated-qwen3-4b-thinking-distill-30b

0
·
3
·
Jan 2026
rrvaswinWarm1B32K

64_v1_scalable

0
·
3
·
Jan 2026
MultiRLWarm2B32K

qwen3_1.7b_new_sudoku_one_action_A_sft_lr_5e_6__step_1686

0
·
3
·
Jan 2026
yurunyyrWarm3B32K

agentic-sudoku-NoStateTrans_qwen2.5-3B-5e-6_gt-SFT_ans1-24k

0
·
3
·
Jan 2026
JameSandWarm2B32K

qwen3-1.7b-base-adam-3e-6-bs128-kl0.0-global_step_200

0
·
3
·
Jan 2026
dondongwonleeWarm7B4K

GELI

0
·
3
·
Nov 2024
wuqiong1Warm7B4K

PA-RAG_Llama-2-7b-chat-hf

0
·
3
·
Mar 2025
CharlesLiWarm7B4K

llama_2_gsm8k_cot_simplest

0
·
3
·
Jan 2025
CharlesLiWarm7B4K

llama2_openo1_safe_o1_4o_reflect_4000_1000_full

0
·
3
·
Mar 2025
Tim419Warm7B4K

Humpback_Myx

0
·
3
·
Apr 2025
CharlesLiWarm7B4K

llama_2_alpaca_llama_2

0
·
3
·
Dec 2024
CharlesLiWarm7B4K

llama_2_unsafe_llama_2

0
·
3
·
Dec 2024
jaeyong2Warm500M32K

Qwen2.5-0.5B-Instruct-Thai-SFT

0
·
3
·
Oct 2024
TianqiLiuAIWarm3B8K

RRM-gemma2-2b

0
·
3
·
Nov 2024
allknowingrogerWarm8B32K

LlamaSlerp1-8B

0
·
3
·
Nov 2024
Shiyu-LabWarm2B32K

DeepScaleR-1.5B-Preview-thinkprune-4k

0
·
3
·
Apr 2025
ozgecanaktasWarm1B2K

tinyllama-itinerary-final

0
·
3
·
May 2025
willcbWarm500M32K

Qwen2.5-0.5B-Reverse-SFT

0
·
3
·
May 2025
and-emiliWarm4B32K

aera-4b

0
·
3
·
May 2025
liushiliushiWarm8B32K

ConfTuner-LLaMA

0
·
3
·
Jun 2025
northWarm3B32K

north_llama32_3b_enhancedNCC_instruct_v1_long_lr2e6_2048_160000

0
·
3
·
Jul 2025
MhairWarm1B2K

91

0
·
3
·
Jul 2025