Models

7,348
xw1234ganColdTools2B32K

Main_fixed_MATH_1_5B_BaseAnchor_step_8

0
·
3
·
Apr 2026
xw1234ganColdTools2B32K

NuminaMath_Main_fixed_SFTanchor_1_5B_step_2

0
·
3
·
Apr 2026
KyleyeeColdTools2B32K

DPO_hh-seed2

0
·
3
·
Apr 2026
KyleyeeColdTools2B32K

DPO_hh-seed1

0
·
3
·
Apr 2026
yufeng1ColdTools8B32K

OpenThinker-7B-type6-e5-max-alpha0_25-textsummarization-2e5

0
·
3
·
Apr 2026
KyleyeeColdTools2B32K

DPO_hh-seed3

0
·
3
·
Apr 2026
rrvaswinColdTools8B32K

qwen_star_baseline

0
·
3
·
May 2026
pa374geColdTools73B32K

Q2.5-72B-Instruct

0
·
3
·
Apr 2026
dtsypColdTools8B32K

qwen2.5-7b-ablated-ru

0
·
3
·
Apr 2026
cjiaoColdTools2B32K

OpenThinker3-1.5B-checkpoint-375

0
·
3
·
Apr 2026
xw1234ganColdTools2B32K

NuminaMath_Main_fixed_SFTanchor_1_5B_step_4

0
·
3
·
Apr 2026
xw1234ganColdTools2B32K

NuminaMath_Main_fixed_SFTanchor_1_5B_step_3

0
·
3
·
Apr 2026
KyleyeeColdTools2B32K

VRPO_hh-seed2

0
·
3
·
Apr 2026
KyleyeeColdTools2B32K

DPO_hh-seed5

0
·
3
·
Apr 2026
xw1234ganColdTools2B32K

NuminaMath_Main_fixed_SFTanchor_1_5B_step_5

0
·
3
·
Apr 2026
yufeng1ColdTools8B32K

OpenThinker-7B-type6-e5-max-alpha0_25-textsummarization-2e5-type6-e1-alpha0_5-2

0
·
3
·
Apr 2026
HoangTran223ColdTools2B32K

SFT_5e-5_Qwen2.5-1.5B_Ultrafb_2e

0
·
3
·
Apr 2026
yufeng1ColdTools8B32K

OpenThinker-7B-type6-e5-max-alpha0_25-textsummarization-2e5-type6-e1-alpha0_25-2

0
·
3
·
Apr 2026
xw1234ganColdTools2B32K

Main_fixed_MATH_1_5B_BaseAnchor_step_1

0
·
3
·
Apr 2026
KyleyeeColdTools2B32K

VRPO_hh-seed5

0
·
3
·
Apr 2026
LaoyujieColdTools8B32K

merged-qwen-ties

0
·
3
·
Apr 2026
xw1234ganColdTools2B32K

Main_fixed_MATH_1_5B_BaseAnchor_step_2

0
·
3
·
Apr 2026
yufeng1ColdTools8B32K

OpenThinker-7B-type6-e5-max-alpha0_25-textsummarization-2e5-type6-e1-alpha0_375-2

0
·
3
·
Apr 2026
amhinsonColdTools2B32K

strudel-refiner-1.5b-v1

0
·
3
·
Apr 2026
DADA121ColdTools500M32K

qwen2.5-0.5b-sft-new

0
·
3
·
Apr 2026
yufeng1ColdTools8B32K

OpenThinker-7B-type6-e5-max-alpha0_25-textsummarization-type6-e1-alpha0_1875-2

0
·
3
·
Apr 2026
LaoyujieColdTools8B32K

merged-qwen-ta

0
·
3
·
Apr 2026
yufeng1ColdTools8B32K

OpenThinker-7B-type6-e5-max-alpha0_25-textsummarization-2e5-type6-e1-alpha0_3125-2

0
·
3
·
Apr 2026
yufeng1ColdTools8B32K

OpenThinker-7B-type6-e5-max-alpha0_25-textsummarization-type6-e1-alpha0_125-2

0
·
3
·
Apr 2026
mehuldamaniColdTools8B32K

bug_fixing_new-arl-add_multiply

0
·
3
·
Apr 2026
tiansenwangColdTools500M32K

Qwen2.5-0.5B

0
·
3
·
Apr 2026
yufeng1ColdTools8B32K

OpenThinker-7B-reasoning-full-lora-max-type3-e5-1e5

0
·
3
·
Apr 2026
yufeng1ColdTools8B32K

OpenThinker-7B-type6-e5-max-alpha0_25-textsummarization-2e5-type6-e1-alpha0_4375-2

0
·
3
·
Apr 2026
LaoyujieColdTools8B32K

merged-qwen-slerp

0
·
3
·
Apr 2026
rrvaswinColdTools8B32K

qwen_16b_SFT

0
·
3
·
May 2026
rrvaswinColdTools8B32K

qwen_8b_SFT

0
·
3
·
May 2026
xw1234ganColdTools2B32K

Main_fixed_MATH_1_5B_BaseAnchor_step_3

0
·
3
·
Apr 2026
xw1234ganColdTools2B32K

Main_fixed_MATH_1_5B_BaseAnchor_step_5

0
·
3
·
Apr 2026
wh-zhuColdTools8B32K

qwen2_7B-ultrachatfeedback-wspo

0
·
3
·
Jun 2025
wvnvwnColdTools8B32K

qwen-2.5-7B-Instruct-SSFT-lr5e-5

0
·
3
·
Apr 2026
wvnvwnColdTools8B32K

qwen2.5-7b-instruct-gsm8k-sn-tuned-lr5e-5

0
·
3
·
May 2026
xw1234ganColdTools2B32K

Main_fixed_MATH_1_5B_BaseAnchor_step_4

0
·
3
·
Apr 2026