Models

17,114
idopintoColdTools14B32K

qwen3-14b-nt-gen-inv-sft-v2.2-full

0
·
1
·
Mar 2026
wls04ColdTools2B32K

jsd

0
·
1
·
Mar 2026
YYYYYYiboColdTools8B32K

qwen2_7b_grpo_vanilla_0325_1257

0
·
1
·
Mar 2026
sebastian328ColdTools70B8K

llama-3.3-70b-soap-sleeper-agent-full-finetune-step-1600

0
·
1
·
Mar 2026
hector-grColdTools8B32K

RLCR-v4-ks-batch-frontier-combo-hotpot

0
·
1
·
Mar 2026
hector-grColdTools8B32K

RLCR-v4-ks-uniqueness-noece-noaurc-hotpot

0
·
1
·
Mar 2026
Renjie-RangerColdTools8B32K

FCP-plus-Bootstrap_paper_table_1_version

0
·
1
·
Mar 2026
ChuGyoukColdTools4B32K

R1_1_4b

0
·
1
·
Mar 2026
ChuGyoukColdTools4B32K

R1_2_4b

0
·
1
·
Mar 2026
HahmdongColdTools4B32K

AT-qwen3-4b-ultrachat-hhrlhf-15360-rm-ppo-clean-p0_05-step-40

0
·
1
·
Mar 2026
HahmdongColdTools4B32K

AT-qwen3-4b-ultrachat-hhrlhf-15360-rm-ppo-clean-p0_05-step-50

0
·
1
·
Mar 2026
ChuGyoukColdTools4B32K

F_R1_1_4b

0
·
1
·
Mar 2026
MultiRLColdTools2B32K

qwen3_1.7b_sudoku_multi_action_group_norm_allow_one_action_epoch1

0
·
1
·
Mar 2026
MultiRLColdTools2B32K

qwen3_1.7b_sudoku_multi_action_group_norm_allow_one_action_epoch2

0
·
1
·
Mar 2026
MultiRLColdTools2B32K

qwen3_1.7b_webshop_atomic_action_epoch1

0
·
1
·
Mar 2026
MultiRLColdTools2B32K

qwen3_1.7b_sudoku_multi_action_group_norm_allow_one_action_epoch3

0
·
1
·
Mar 2026
ChuGyoukColdTools4B32K

F_R1_1_4b_T2

0
·
1
·
Mar 2026
SeanDaSheepColdTools500M32K

MicroCoder-FC-0.5B-v8-DPO

0
·
1
·
Mar 2026
xw1234ganColdTools3B32K

Main_MATH_3B_step_8

0
·
1
·
Mar 2026
Subh24aiColdTools2B32K

yojana-sahayak-qwen2.5-1.5b-merged

1
·
1
·
Mar 2026
mihirrajdColdTools3B32K

llama_finetune_16bit

0
·
1
·
Mar 2026
iamjanvijayColdTools8B32K

Llama-3.1-Tulu-3-8B-SFT-Safety-Reduced

2
·
1
·
Mar 2026
opensynthesisColdTools14B32K

Qwen3-14B-heretic

0
·
1
·
Feb 2026
blacksimon818ColdTools4B32K

ppo-step100

0
·
1
·
Mar 2026
MultiRLColdTools2B32K

qwen3_1.7b_sudoku_multi_action_group_norm_allow_one_action

0
·
1
·
Mar 2026
Ik45ColdTools500M32K

indo-qwen-0.5b

0
·
1
·
Mar 2026
EvangelinejyColdTools3B32K

llama_3b_base_non_think_sft_nopack_lr1.5e5_ep3

0
·
1
·
Mar 2026
cxrbon16ColdTools8B8K

turkish-llama-MSFT-0.7-ngram-banned

0
·
1
·
Mar 2026
doupariColdTools8B32K

llama3.1_8b_sft-freeze-k28

0
·
1
·
Mar 2026
bboeunColdTools7B4K

sft2-Interleaved

0
·
1
·
Mar 2026
HyeongwonColdTools4B32K

P2-split2_prob_strlen_cutoff_0p5_filtered_Qwen3-4B-Base_0330

0
·
1
·
Mar 2026
longtermriskColdTools8B32K

Qwen2.5-7B-Instruct-ftjob-bf700f8824c9

0
·
1
·
Mar 2026
yjuchoiColdTools500M32K

day1-train-model

0
·
1
·
Apr 2026
starcodingColdTools500M32K

day1-train-model

0
·
1
·
Apr 2026
sbeechoiColdTools500M32K

day1-train-model

0
·
1
·
Apr 2026
akeraCold12B32KVision

translategemma-12b-grpo-merged-ckpt800

0
·
1
·
Apr 2026
top-50000ColdTools32B32K

affine-1

0
·
1
·
Apr 2026
YeisonJColdTools2B32K

Alfred-ToRevuelto-1.5B

0
·
1
·
Apr 2026
sumith2425ColdTools2B32K

model_sft_dare

0
·
1
·
Mar 2026
tomascoolerColdTools33B32K

affine-5Ca7pkmhmACaULaKZtb1wQgRBKiMksmKd7vqgETYfRuCRikK

0
·
1
·
Mar 2026
AsystemoffieldsColdTools800M32K

Cclilqwen

0
·
1
·
Mar 2026
jainishaan107ColdTools2B32K

model_sft_lora_merged

0
·
1
·
Apr 2026