Models

10,893
xw1234ganColdTools2B32K

SFT_Qwen2.5-1.5B-Instruct_Numina

0
·
5
·
Apr 2026
paudelnirajanColdTools500M32K

general-kd-Qwen2.5-0.5B-Instruct-npi-5

0
·
5
·
Apr 2026
Alelcv27ColdTools3B32K

Llama3.2-3B-Linear-Math-Code

0
·
5
·
Apr 2026
olabhinavloColdTools2B32K

demosample

0
·
5
·
Apr 2026
kairawalColdTools8B32K

Llama-3.1-8B-Instruct-EL-SynthDolly-1A-E1

0
·
5
·
Apr 2026
juzhariiColdTools4B32K

qwen3-4b-absa-tech-ckpt500

0
·
5
·
Apr 2026
ajtaltarabukin2022ColdTools32B32K

merge_v10_27_112_8

0
·
5
·
Apr 2026
rbelanecColdTools1B32K

train_cola_42_1776331560

0
·
5
·
Apr 2026
jackf857ColdTools8B32K

qwen3-8b-base-beta-dpo-hh-harmless-4xh200-batch-64

0
·
5
·
Apr 2026
ishikaaColdTools3B32K

acquisition_qwen3bins_medmcqa_diversity

0
·
5
·
Apr 2026
sstoica12ColdTools8B32K

acquisition_llama-3_1-8b_bins_numina_diversity

0
·
5
·
Apr 2026
olusegunolaCold1B2K

phi-1.5-stage3-sft-cloned-merged

0
·
5
·
Apr 2026
Johnny1024ColdTools4B32K

bs16-k10-lr5e-7-ema0.01-eopd0.8-qwen3-4b-think-essay_bottom20_nogap-maxsteps150

0
·
5
·
Apr 2026
zero9techColdTools4B32K

Qwen3-4B-Data-Science-Insight-TR-16.2K

0
·
5
·
Apr 2026
arunasankCold9B16K

w6g927rr

0
·
5
·
Apr 2026
paudelnirajanColdTools500M32K

general-kd-Qwen2.5-0.5B-Instruct-ber-5000-3500

0
·
5
·
Apr 2026
jordyyyyColdTools2B32K

qwen2.5_1.5b_instruct_finetuned

0
·
5
·
Apr 2026
endishaiColdTools33B32K

qwen2.5-32b-lexenvs-grpo

0
·
5
·
Apr 2026
jordanpainterColdTools8B32K

diallm-llama-dpo-aus

0
·
5
·
Apr 2026
sdhossain24ColdTools8B8K

Meta-Llama-3-8B-T-Vaccine

0
·
5
·
Apr 2026
sstoica12ColdTools8B32K

acquisition_llama-3_1-8b_bins_medmcqa_format

0
·
5
·
Apr 2026
Alelcv27ColdTools3B32K

Llama3.2-3B-DareTIES-Math-Code

0
·
5
·
Apr 2026
xw1234ganColdTools8B32K

Main_fixed_MATH_7B_step_6

0
·
5
·
Apr 2026
alwaysgoodColdTools4B32K

qwen3-st2

0
·
5
·
Apr 2026
xw1234ganColdTools2B32K

NuminaMath_Main_fixed_SFTanchor_1_5B_step_1

0
·
5
·
Apr 2026
g4meColdTools800M32K

QwenRolina3-06B-base-LR1e5-b32g2gc8-AR-order-batch

0
·
5
·
Apr 2026
FardanColdTools2B32K

Qwen2.5-1.5B-Instruct-Math-Reasoning-SFT-v1

0
·
5
·
Apr 2026
mkubaszekColdTools800M32K

Qwen3-0.6B-Full-Finetuning-No-Thinking

0
·
5
·
Apr 2026
arunasankCold9B16K

12h5ydak

0
·
5
·
Apr 2026
terasutColdTools2B32K

sft-qwen2.5-1.5b-instruct-eff32

0
·
5
·
Apr 2026
ajtaltarabukin2022ColdTools32B32K

merge_v10_27_73_7

0
·
5
·
Apr 2026
ishikaaColdTools3B32K

acquisition_qwen3bins_medmcqa_confidence

0
·
5
·
Apr 2026
g4meColdTools2B32K

QwenRolina3-1.7B-base-LR1e5-b32g2gc8-AR-IRM

0
·
5
·
Apr 2026
g4meColdTools2B32K

QwenRolina3-1.7B-base-LR1e5-b32g2gc8-AR-Orig-IRM

0
·
5
·
Apr 2026
bhanchandCold1B32K

gemma-3-1b-medical-finetuned

0
·
5
·
Apr 2026
quyenproColdTools3B32K

Qwen-3B-Instruct-Vix-Exic

0
·
5
·
Apr 2026
ajtaltarabukin2022ColdTools32B32K

merge_v10_27_73_3

0
·
5
·
Apr 2026
rrvaswinColdTools8B32K

qwen_2b_SFT

0
·
5
·
May 2026
xw1234ganColdTools8B32K

Main_fixed_MATH_7B_step_4

0
·
5
·
Apr 2026
jadechoiColdTools8B32K

wizl_base_7b-fsv

0
·
5
·
Apr 2026
zsqzzColdTools2B32K

Qwen3-1.7B_opsd_masked_grpo_dapo_hf

0
·
5
·
Apr 2026
manhcuong2005ColdTools3B32K

qwen2.5-3b-legal-intent

0
·
5
·
Apr 2026