Models

10,867
ligeng-devColdTools8B32K

Q3-8B-131072-sft-8x-complete

0
·
7
·
Apr 2026
kairawalColdTools8B32K

Llama-3.1-8B-Instruct-ZH-SynthDolly-1A-E1

0
·
7
·
Apr 2026
lihaoxin2020ColdTools4B32K

qwen3-4B-refiner-rubric-rl-step50

0
·
7
·
Apr 2026
tzwilliam0ColdTools4B32K

qwen-dapo-17k-vs-4

0
·
7
·
Apr 2026
W-61ColdTools7B4K

mistral-7b-base-margin-dpo-hh-helpful-4xh200-batch-64

0
·
7
·
Apr 2026
distillabsColdTools2B32K

tft-benchmark-s2-tft-Qwen3-1.7B

0
·
7
·
Apr 2026
ajtaltarabukin2022ColdTools32B32K

vector_merge1

0
·
7
·
Apr 2026
ReviewHubColdTools4B32K

qwen3-4b-it-2507-sft-2018-2022-rl-step-10

0
·
7
·
Apr 2026
ajtaltarabukin2022ColdTools32B32K

merged_beat_champ_2model_slerp_champ

0
·
7
·
Apr 2026
ajtaltarabukin2022ColdTools32B32K

merged_beat_champ_3model_ties

0
·
7
·
Apr 2026
DivijColdTools3B32K

llama-3.2-3b-sft-llama-star

0
·
7
·
Apr 2026
rbelanecColdTools1B32K

train_boolq_42_1776331558

0
·
7
·
Apr 2026
ccui46ColdTools8B32K

hazardworld_per_chunk_act_q3_tokfix_diffPrompt_higherLR_4000

0
·
7
·
Apr 2026
rbelanecColdTools1B32K

train_cola_42_1776331560

0
·
7
·
Apr 2026
ishikaaColdTools3B32K

acquisition_qwen3bins_medmcqa_diversity

0
·
7
·
Apr 2026
sstoica12ColdTools8B32K

acquisition_llama-3_1-8b_bins_numina_diversity

0
·
7
·
Apr 2026
rbelanecColdTools1B32K

train_rte_42_1776331559

0
·
7
·
Apr 2026
W-61ColdTools7B4K

mistral-7b-base-beta-dpo-hh-helpful-4xh200-batch-64

0
·
7
·
Apr 2026
paudelnirajanColdTools500M32K

general-kd-Qwen2.5-0.5B-Instruct-ber-5000-4500

0
·
7
·
Apr 2026
Johnny1024ColdTools4B32K

bs16-k10-lr5e-7-ema0.01-eopd0.8-qwen3-4b-think-essay_bottom20_nogap-maxsteps150

0
·
7
·
Apr 2026
zero9techColdTools4B32K

Qwen3-4B-Data-Science-Insight-TR-16.2K

0
·
7
·
Apr 2026
amphoraColdTools8B32K

qwen3-8b-tr

0
·
7
·
Apr 2026
jordyyyyColdTools2B32K

qwen2.5_1.5b_instruct_finetuned

0
·
7
·
Apr 2026
jordanpainterColdTools8B32K

diallm-llama-dpo-aus

0
·
7
·
Apr 2026
sdhossain24ColdTools8B8K

Meta-Llama-3-8B-T-Vaccine

0
·
7
·
Apr 2026
ajtaltarabukin2022ColdTools32B32K

deepseekconf

0
·
7
·
Apr 2026
LucasJYHColdTools2B32K

Qwen3-1.7B-Base

0
·
7
·
Apr 2026
W-61ColdTools7B4K

mistral-7b-base-epsilon-dpo-hh-helpful-4xh200-batch-64

0
·
7
·
Apr 2026
PadlexColdTools4B32K

Qwen3-4B-magr-0.01

0
·
7
·
Apr 2026
keerthanshettyColdTools8B8K

resume-skill-extractor-merged

0
·
7
·
Apr 2026
Alelcv27ColdTools3B32K

Llama3.2-3B-DareTIES-Math-Code

0
·
7
·
Apr 2026
alwaysgoodColdTools4B32K

qwen3-st2

0
·
7
·
Apr 2026
xw1234ganColdTools2B32K

NuminaMath_Main_fixed_SFTanchor_1_5B_step_1

0
·
7
·
Apr 2026
ccui46ColdTools8B32K

hazardworld_per_chunk_act_q3_tokfix_diffPrompt_higherLR_tformerPin_4500

0
·
7
·
Apr 2026
W-61ColdTools7B4K

mistral-7b-base-epsilon-dpo-hh-harmless-4xh200-batch-64

0
·
7
·
Apr 2026
FardanColdTools2B32K

Qwen2.5-1.5B-Instruct-Math-Reasoning-SFT-v1

0
·
7
·
Apr 2026
W-61ColdTools7B4K

mistral-7b-base-beta-dpo-hh-harmless-4xh200-batch-64

0
·
7
·
Apr 2026
jinrui123ColdTools3B32K

llamasrnn-grpo-epoch001-merged

0
·
7
·
Apr 2026
arunasankCold9B16K

12h5ydak

0
·
7
·
Apr 2026
terasutColdTools2B32K

sft-qwen2.5-1.5b-instruct-eff32

0
·
7
·
Apr 2026
jordanpainterColdTools8B32K

diallm-qwen-dpo-all

0
·
7
·
Apr 2026
ajtaltarabukin2022ColdTools32B32K

merge_v10_27_73_7

0
·
7
·
Apr 2026