Models

5,770
DCAgentColdTools32B32K

g1_clean_hybrid_plus_32b

0
·
152
·
Apr 2026
sdhossain24ColdTools8B32K

Qwen3-8B-SDD

0
·
152
·
Apr 2026
harsha070ColdTools3B32K

expfinal-qwen-mbpp-s42-lambda-0p0

0
·
152
·
May 2026
zhaohqColdTools2B32K

PureRL-1.5B-v7-s2-l2-kl-w1-b2

0
·
152
·
May 2026
NeelectricColdTools8B32K

Llama-3.1-8B-Instruct_SafeGrad_mathv00.09

0
·
151
·
Apr 2026
W-61ColdTools8B32K

qwen3-8b-base-margin-dpo-ultrafeedback-4xh200-batch-128-20260423-040315

0
·
151
·
Apr 2026
sdhossain24ColdTools8B8K

Meta-Llama-3-8B-Instruct-SDD

0
·
151
·
Apr 2026
wvnvwnColdTools8B8K

Meta-Llama-3-8B-Instruct-hhrlhf-spider-v1

0
·
151
·
May 2026
zhaohqColdTools2B32K

PureRL-1.5B-v6f-analysis-200step

0
·
151
·
May 2026
zhaohqColdTools2B32K

PureRL-1.5B-v11A-lam002

0
·
151
·
May 2026
W-61ColdTools8B8K

llama3-8b-base-new-method-q_t-0.4-s_star0.6

0
·
150
·
Apr 2026
laionColdTools8B32K

Sera-4.6-Lite-T2-v4-1000-axolotl__Qwen3-8B-v6

0
·
150
·
Apr 2026
DCAgentColdTools8B32K

FourDatasetMixQwen3_8B

0
·
149
·
Apr 2026
W-61ColdTools8B8K

llama-3-8b-base-new-dpo-ultrafeedback-4xh200-batch-128-q_t-0.45-s_star-0.3-20260428-045924

0
·
149
·
Apr 2026
zhaohqColdTools2B32K

PureRL-1.5B-v7-s2-l2-kl-w2-b2

0
·
149
·
May 2026
georgeiac00ColdTools500M32K

dpg-financial-sentiment-generator

0
·
148
·
Apr 2026
W-61ColdTools8B32K

qwen3-8b-base-new-dpo-ultrafeedback-4xh200-batch-128-q_t-0.43-s_star-0.4-20260429-230725

0
·
148
·
Apr 2026
harsha070ColdTools3B32K

exp2-qwen-island-s42-lambda-0p35

0
·
148
·
May 2026
wvnvwnColdTools7B4K

Mistral-7B-Instruct-v0.3-hhrlhf-spider-v1

0
·
148
·
May 2026
zhaohqColdTools2B32K

PureRL-1.5B-v11C-lam010

0
·
148
·
May 2026
cjiaoColdTools2B32K

goldengoose-gumbel_tau0.50-25grp

0
·
148
·
May 2026
AngelRaychevColdTools800M32K

qwen3-0.6b-sciq-v1

0
·
147
·
Apr 2026
sdhossain24ColdTools8B8K

Meta-Llama-3-8B-SDD

0
·
147
·
Apr 2026
NeelectricColdTools8B32K

Llama-3.1-8B-Instruct_SFT_mathsp_ewc_v00.03

0
·
147
·
May 2026
W-61ColdTools8B32K

qwen3-8b-base-new-dpo-ultrafeedback-4xh200-batch-128-q_t-0.45-s_star-0.35-20260430-143919

0
·
146
·
Apr 2026
AbhilekhMedaColdTools2B32K

qwen2.5-1.5b-numinamath-sft

0
·
146
·
May 2026
zzoceanpieColdTools2B32K

Qwen3-1.7B-Yukari-SFT

0
·
146
·
May 2026
HCY123902ColdTools8B8K

llama-3-8b-dpo-tw23-beta-1e-0

0
·
145
·
Apr 2026
W-61ColdTools8B8K

llama-3-8b-base-beta-dpo-ultrafeedback-4xh200-batch-128-20260424-044124

0
·
145
·
Apr 2026
ermiaazarkhaliliColdTools8B32K

Qwen3-8B-Function-Calling-xLAM-Unsloth

0
·
145
·
Apr 2026
JeesupColdTools1B32K

tofu_Llama-3.2-1B-Instruct_forget10_NPO_qat-off

0
·
145
·
May 2026
mjf-suColdTools4B32K

NewSFTModel

0
·
145
·
May 2026
DCAgentColdTools32B32K

g1_clean_hybrid_25k_32b

0
·
144
·
Apr 2026
Dar3devilColdTools800M32K

incident-commander-qwen3-0.6b-grpo

0
·
144
·
Apr 2026
PetarKalColdTools4B32K

qwen3-4b-EM-full-finetuned-v3

0
·
144
·
May 2026
eekayColdTools8B32K

Llama-3.1-8B-Instruct-eagle-numbers-ft

0
·
143
·
Feb 2026
zzoceanpieColdTools2B32K

Qwen3-1.7B-Yukari-DPO

0
·
143
·
May 2026
cs-552-2026-MMRFColdTools2B32K

3000Alpaca_15kDPO

0
·
143
·
May 2026
thwannbeColdTools2B32K

qwen3-1.7b-openthoughts-warmup-sft

0
·
143
·
May 2026
HyeongwonColdTools4B32K

P2-split1_only_answer_Qwen3-4B-Base_0502-bs64-epoch6-lr5e6

0
·
142
·
May 2026
NeiraColdTools500M32K

Qwen2.5-0.5B_muon_v2

0
·
141
·
Apr 2026
NeelectricColdTools8B32K

Llama-3.1-8B-Instruct_SFT_mathfisher_v00.05

0
·
141
·
May 2026