Models

40,642
heyalexchoiColdTools2B32K

qwen3-1.7b-math-grpo-best-local

0
·
5
·
Apr 2026
jordanpainterColdTools8B32K

diallm-llama-dpo-brit

0
·
5
·
Apr 2026
olusegunolaCold1B2K

phi-1.5-stage3-sft-cloned-merged

0
·
5
·
Apr 2026
Johnny1024ColdTools4B32K

bs16-k10-lr5e-7-ema0.01-eopd0.8-qwen3-4b-think-essay_bottom20_nogap-maxsteps150

0
·
5
·
Apr 2026
sdhossain24ColdTools8B32K

Qwen3-8B-T-Vaccine

0
·
5
·
Apr 2026
paudelnirajanColdTools500M32K

general-kd-Qwen2.5-0.5B-Instruct-ber-5000-4000

0
·
5
·
Apr 2026
arunasankCold9B16K

w6g927rr

0
·
5
·
Apr 2026
paudelnirajanColdTools500M32K

general-kd-Qwen2.5-0.5B-Instruct-ber-5000-3500

0
·
5
·
Apr 2026
endishaiColdTools33B32K

qwen2.5-32b-lexenvs-grpo

0
·
5
·
Apr 2026
xw1234ganColdTools8B32K

Main_fixed_MATH_7B_step_9

0
·
5
·
Apr 2026
joykiratColdTools4B32K

qwen-3-4B-belief-state

0
·
5
·
Apr 2026
sstoica12ColdTools8B32K

acquisition_llama-3_1-8b_bins_medmcqa_format

0
·
5
·
Apr 2026
keerthanshettyColdTools8B8K

resume-skill-extractor-merged

0
·
5
·
Apr 2026
open-sciColdTools2B32K

sft__ot30k_Qwen2.5-1.5B-DPO-Tulu3-decontaminated

0
·
5
·
Apr 2026
jackf857ColdTools8B32K

qwen3-8b-base-epsilon-dpo-hh-harmless-4xh200-batch-64

0
·
5
·
Apr 2026
jordanpainterColdTools8B32K

diallm-llama-dpo-all

0
·
5
·
Apr 2026
xw1234ganColdTools8B32K

Main_fixed_MATH_7B_step_8

0
·
5
·
Apr 2026
Alelcv27ColdTools3B32K

Llama3.2-3B-DareTIES-Math-Code

0
·
5
·
Apr 2026
jordanpainterColdTools8B32K

diallm-qwen-dpo-aus

0
·
5
·
Apr 2026
xw1234ganColdTools8B32K

Main_fixed_MATH_7B_step_6

0
·
5
·
Apr 2026
GwangyeolCold1B32K

gemma-3-1b-it_Math_SFT

0
·
5
·
Apr 2026
alwaysgoodColdTools4B32K

qwen3-st2

0
·
5
·
Apr 2026
KCZEROCold1B32K

gemma-3-1b-it_Math_SFT

0
·
5
·
Apr 2026
xw1234ganColdTools8B32K

Main_fixed_MATH_7B_step_3

0
·
5
·
Apr 2026
xw1234ganColdTools2B32K

NuminaMath_Main_fixed_SFTanchor_1_5B_step_1

0
·
5
·
Apr 2026
dmody1ColdTools1B32K

llama-1b-cov-matched-l2-lam100

0
·
5
·
Apr 2026
kmseongCold7B4K

llama2_7b-chat-Safety-FT-lr5e-5

0
·
5
·
Apr 2026
artificialguybrCold3B8K

Gemma2-2B-OpenHermes2.5

7
·
5
·
Aug 2024
DCAgentColdTools32B32K

g1_top8_diverse_3160_32b_step145__Qwen3-32B

0
·
5
·
May 2026
nomadicsynthColdTools3B32K

Qwen2.5-3B-Instruct-Reasoning-gsm8k-v1

0
·
5
·
Mar 2025
tusherbhomikColdTools2B32K

qwen2.5-1.5b-hgr-5340-r2

0
·
5
·
May 2026
historyanalCold1B32K

gemma-3-1b-it_Math_SFT

0
·
5
·
Apr 2026
mkubaszekColdTools800M32K

Qwen3-0.6B-Full-Finetuning-No-Thinking

0
·
5
·
Apr 2026
arunasankCold9B16K

12h5ydak

0
·
5
·
Apr 2026
terasutColdTools2B32K

sft-qwen2.5-1.5b-instruct-eff32

0
·
5
·
Apr 2026
NotoriousH2Cold1B32K

gemma-3-1b-it_Math_SFT

0
·
5
·
Apr 2026
ajtaltarabukin2022ColdTools32B32K

merge_v10_27_73_7

0
·
5
·
Apr 2026
Alelcv27ColdTools8B32K

Llama3.1-8B-Base-Code

0
·
5
·
Apr 2026
ishikaaColdTools3B32K

acquisition_qwen3bins_medmcqa_confidence

0
·
5
·
Apr 2026
quyenproColdTools3B32K

Qwen-3B-Instruct-Vix-Exic

0
·
5
·
Apr 2026
RomiologyColdTools15B32K

swnex-sonex-14b-c3-merged

0
·
5
·
Apr 2026
dhrubas2905ColdTools15B32K

dhrubs-Qwen2.5-14B-Instruct-private

0
·
5
·
Apr 2026