Models

5,770

W-61ColdTools8B8K

llama-3-8b-base-new-dpo-hh-harmless-4xh200-batch-64-q_t-0.45-eta-0.1-s_star-0.8-20260428-045924

126

Apr 2026

laionColdTools8B32K

sera-subset-mixed-10000-axolotl__Qwen3-8B-v8

126

Apr 2026

W-61ColdTools8B32K

qwen3-8b-base-new-dpo-ultrafeedback-4xh200-batch-128-q_t-0.43-s_star-0.3-20260430-192039

126

Apr 2026

tataredmiColdTools800M32K

Qwen3-0.6B-Base-CPT-Math

126

Apr 2026

somukandulaColdTools500M32K

context-aware-abstention-qwen-0.5b-v2

126

May 2026

cjiaoColdTools2B32K

goldengoose-gumbel_gmrel_tau0.50-25grp

126

May 2026

W-61ColdTools8B8K

llama-3-8b-base-new-dpo-hh-harmless-4xh200-batch-64-q_t-0.45-s_star-0.4-eta-0.05

125

Apr 2026

DCAgentColdTools32B32K

g1_diverse_tezos_100k_32b

125

Apr 2026

roonbugCold9B16K

jj75i299

125

Apr 2026

W-61ColdTools8B8K

llama-3-8b-base-new-dpo-hh-helpful-4xh200-batch-64-q_t-0.45-eta-0.1-s_star-0.45-20260428-045924

125

Apr 2026

W-61ColdTools8B8K

llama3-hh-helpful-qt045-b0p01-20260429-085449

125

Apr 2026

W-61ColdTools8B32K

qwen3-8b-base-new-dpo-ultrafeedback-4xh200-batch-128-q_t-0.45-s_star-0.5-20260430-194457

125

Apr 2026

jackf857ColdTools8B32K

qwen3-8b-base-epsilon-dpo-hh-harmless-4xh200-batch-64-20260424-040415

124

Apr 2026

SreeharanColdTools500M32K

INITIAL_TESTING

124

Apr 2026

W-61ColdTools8B8K

llama3-hh-helpful-qt045-b0p05-20260429-085449

124

Apr 2026

W-61ColdTools8B8K

llama-3-8b-base-new-dpo-hh-harmless-4xh200-batch-64-q_t-0.45-eta-0.1-s_star-0.35-20260428-045924

124

Apr 2026

lllqaqColdTools15B32K

Qwen2.5-Coder-14B-Instruct-num11_v1-v2-v3-pairs-v3-triples-rope1mfix

124

Apr 2026

W-61ColdTools8B32K

qwen3-8b-base-new-dpo-ultrafeedback-4xh200-batch-128-q_t-0.45-s_star-0.45-20260430-143919

124

Apr 2026

varshak1ColdTools8B32K

reproducing-openrubric-rubric-sft

124

May 2026

W-61ColdTools8B32K

qwen3-8b-base-kto-ultrafeedback-4xh200-batch-128

124

May 2026

NeelectricColdTools8B32K

Llama-3.1-8B-Instruct_SFT_mathsp_ewc_v00.04

124

May 2026

sohamb37lexsiColdTools4B32K

curatorkit-both-filtered-qwen3-1b7

124

May 2026

NeelectricColdTools8B32K

Llama-3.1-8B-Instruct_SFT_safetyv00.01

124

May 2026

maheshrawat18ColdTools4B32K

Qwen3-4B-2507-sft1

123

Apr 2026

laionColdTools8B32K

sera-subset-mixed-316-axolotl__Qwen3-8B-v8

123

Apr 2026

W-61ColdTools8B8K

llama-3-8b-base-new-dpo-hh-harmless-4xh200-batch-64-q_t-0.45-eta-0.1-s_star-0.6-20260428-045924

123

Apr 2026

KyleyeeColdTools2B32K

CPO_hh-seed5

123

Apr 2026

W-61ColdTools8B8K

llama-3-8b-base-new-dpo-hh-helpful-4xh200-batch-64-q_t-0.45-eta-0.1-s_star-0.6-20260428-045924

123

Apr 2026

DCAgentColdTools8B32K

g1_top8_31600_8b

123

Apr 2026

W-61ColdTools8B8K

llama3-hh-harmless-qt045-b0p5-20260429-085449

123

Apr 2026

W-61ColdTools8B32K

qwen3-8b-base-new-dpo-ultrafeedback-4xh200-batch-128-q_t-0.45-s_star-0.3-20260430-143919

123

Apr 2026

passing2961ColdTools8B32K

finch_8b_soft_without_held_out_expr_purpose_qwen_1.0e-5_1.0_train42_cosine

123

May 2026

ChuGyoukColdTools8B32K

Arguinas-Qwen3-8B-100p-lr4e5

123

May 2026

jackf857ColdTools8B32K

qwen3-8b-base-epsilon-dpo-hh-helpful-4xh200-batch-64-20260424-040306

122

Apr 2026

israelColdTools14B32K

AfriqueQwen-14B-multiturn_1

122

Apr 2026

ccui46ColdTools8B32K

cookingworld_per_chunk_act_q3_tokfix_diffPrompt_lowerLR_tformerPin_2000

122

Apr 2026

W-61ColdTools8B8K

llama3-hh-harmless-qt045-b0p3-20260429-085449

122

Apr 2026

W-61ColdTools8B32K

qwen3-8b-base-new-dpo-ultrafeedback-4xh200-batch-128-q_t-0.4-s_star-0.35-20260430-140517

122

Apr 2026

DCAgentColdTools32B32K

g1_top8_31600_32b

122

Apr 2026

InfiniAILabColdTools3B32K

OpenR1-Qwen-3B-SFT-Instruct

122

Mar 2025

NeiraColdTools500M32K

Qwen2.5-0.5B_adamw_v2

121

Apr 2026

W-61ColdTools8B8K

llama-3-8b-base-new-dpo-hh-helpful-4xh200-batch-64-s_star-0.4-eta-0.1-q_t-0.5

121

Apr 2026