Models

6,617
xw1234ganColdTools2B32K

Main_fixed_MATH_1_5B_BaseAnchor_step_8

0
·
3
·
Apr 2026
xw1234ganColdTools2B32K

NuminaMath_Main_fixed_SFTanchor_1_5B_step_2

0
·
3
·
Apr 2026
KyleyeeColdTools2B32K

DPO_hh-seed2

0
·
3
·
Apr 2026
KyleyeeColdTools2B32K

DPO_hh-seed1

0
·
3
·
Apr 2026
jekunzCold1B32K

Gemma-3-1B-pt-is-CPT-is-SmolTalk

0
·
3
·
Apr 2026
jekunzCold1B32K

Gemma-3-1B-pt-is-CPT-plus-IR-is-SmolTalk

0
·
3
·
Apr 2026
KyleyeeColdTools2B32K

DPO_hh-seed3

0
·
3
·
Apr 2026
jekunzCold1B32K

Gemma-3-1B-it-is-SmolTalk

0
·
3
·
Apr 2026
zeras141aCold1B2K

lla3

0
·
3
·
Jun 2025
cjiaoColdTools2B32K

OpenThinker3-1.5B-checkpoint-375

0
·
3
·
Apr 2026
xw1234ganColdTools2B32K

NuminaMath_Main_fixed_SFTanchor_1_5B_step_4

0
·
3
·
Apr 2026
xw1234ganColdTools2B32K

NuminaMath_Main_fixed_SFTanchor_1_5B_step_3

0
·
3
·
Apr 2026
KyleyeeColdTools2B32K

VRPO_hh-seed2

0
·
3
·
Apr 2026
wh-zhuColdTools2B32K

qwen2.5-1.5B-longcot-reasoning-HPD

0
·
3
·
Apr 2026
alexxbobrColdTools1B32K

ORPO8000Vikhr-Llama-3.2-1B-Instruct5000

0
·
3
·
Apr 2026
KyleyeeColdTools2B32K

DPO_hh-seed5

0
·
3
·
Apr 2026
raalrColdTools2B32K

Qwen2.5-1.5B-Instruct-ULD-gemma-3-27b-it

0
·
3
·
Apr 2026
xw1234ganColdTools2B32K

NuminaMath_Main_fixed_SFTanchor_1_5B_step_5

0
·
3
·
Apr 2026
penguin102Cold1B2K

c66-h32

0
·
3
·
Jun 2025
HoangTran223ColdTools2B32K

SFT_5e-5_Qwen2.5-1.5B_Ultrafb_2e

0
·
3
·
Apr 2026
xw1234ganColdTools2B32K

Main_fixed_MATH_1_5B_BaseAnchor_step_1

0
·
3
·
Apr 2026
KyleyeeColdTools2B32K

VRPO_hh-seed5

0
·
3
·
Apr 2026
xw1234ganColdTools2B32K

Main_fixed_MATH_1_5B_BaseAnchor_step_2

0
·
3
·
Apr 2026
cosmos1030ColdTools2B32K

ad9f0ae0864d7fbcd1cd905e3c6c5b069cc8b562-gmp-s70pct-lr1e-5

0
·
3
·
May 2026
pbeartColdTools1B32K

magictokens_finetune_merged

0
·
3
·
Oct 2025
cg5696Cold1B32K

gemma-3-1b-it-sst5-merged

0
·
3
·
Apr 2026
AksaraLLMColdTools2B32K

AksaraLLM-Qwen-1.5B-v3-public

0
·
3
·
Apr 2026
wh-zhuColdTools2B32K

qwen2_1.5B-ultrachatfeedback-dpo

0
·
3
·
Jun 2025
xw1234ganColdTools2B32K

Main_fixed_MATH_1_5B_BaseAnchor_step_3

0
·
3
·
Apr 2026
xw1234ganColdTools2B32K

Main_fixed_MATH_1_5B_BaseAnchor_step_5

0
·
3
·
Apr 2026
xw1234ganColdTools2B32K

Main_fixed_MATH_1_5B_BaseAnchor_step_4

0
·
3
·
Apr 2026
mironazaCold1B2K

zerp7

0
·
3
·
Sep 2025
reachnaveenCold1B2K

tinyllama-alpaca-lora

0
·
3
·
Apr 2026
MhairCold1B2K

f180

0
·
3
·
Jul 2025
miolgCold1B2K

456b5ee5

0
·
3
·
Aug 2025
miolgCold1B2K

2e1777a1

0
·
3
·
Aug 2025
Casual132Cold1B32K

gemma-3-1b-finetuned-lora-loss3.9

0
·
3
·
Apr 2026
model-organisms-for-realCold1B32K

gemma-3-1b-italian-food-posthoc-fd-unmixed

0
·
3
·
May 2026
xw1234ganColdTools2B32K

Main_fixed_MATH_1_5B_BaseAnchor_step_6

0
·
3
·
Apr 2026
tusherbhomikColdTools2B32K

qwen2.5-1.5b-hgr-5340-r2-clean2

0
·
3
·
May 2026
DunaevStudioColdTools2B32K

DanudeAi

0
·
3
·
Apr 2026
mizzaayCold1B2K

b5351bd4

0
·
3
·
Aug 2025