Models

5,770
W-61ColdTools8B8K

llama-3-8b-base-new-dpo-hh-harmless-4xh200-batch-64-q_t-0.45-eta-0.1-s_star-0.8-20260428-045924

0
·
126
·
Apr 2026
laionColdTools8B32K

sera-subset-mixed-10000-axolotl__Qwen3-8B-v8

0
·
126
·
Apr 2026
W-61ColdTools8B32K

qwen3-8b-base-new-dpo-ultrafeedback-4xh200-batch-128-q_t-0.43-s_star-0.3-20260430-192039

0
·
126
·
Apr 2026
tataredmiColdTools800M32K

Qwen3-0.6B-Base-CPT-Math

0
·
126
·
Apr 2026
somukandulaColdTools500M32K

context-aware-abstention-qwen-0.5b-v2

0
·
126
·
May 2026
cjiaoColdTools2B32K

goldengoose-gumbel_gmrel_tau0.50-25grp

0
·
126
·
May 2026
W-61ColdTools8B8K

llama-3-8b-base-new-dpo-hh-harmless-4xh200-batch-64-q_t-0.45-s_star-0.4-eta-0.05

0
·
125
·
Apr 2026
DCAgentColdTools32B32K

g1_diverse_tezos_100k_32b

0
·
125
·
Apr 2026
roonbugCold9B16K

jj75i299

0
·
125
·
Apr 2026
W-61ColdTools8B8K

llama-3-8b-base-new-dpo-hh-helpful-4xh200-batch-64-q_t-0.45-eta-0.1-s_star-0.45-20260428-045924

0
·
125
·
Apr 2026
W-61ColdTools8B8K

llama3-hh-helpful-qt045-b0p01-20260429-085449

0
·
125
·
Apr 2026
W-61ColdTools8B32K

qwen3-8b-base-new-dpo-ultrafeedback-4xh200-batch-128-q_t-0.45-s_star-0.5-20260430-194457

0
·
125
·
Apr 2026
jackf857ColdTools8B32K

qwen3-8b-base-epsilon-dpo-hh-harmless-4xh200-batch-64-20260424-040415

0
·
124
·
Apr 2026
SreeharanColdTools500M32K

INITIAL_TESTING

0
·
124
·
Apr 2026
W-61ColdTools8B8K

llama3-hh-helpful-qt045-b0p05-20260429-085449

0
·
124
·
Apr 2026
W-61ColdTools8B8K

llama-3-8b-base-new-dpo-hh-harmless-4xh200-batch-64-q_t-0.45-eta-0.1-s_star-0.35-20260428-045924

0
·
124
·
Apr 2026
lllqaqColdTools15B32K

Qwen2.5-Coder-14B-Instruct-num11_v1-v2-v3-pairs-v3-triples-rope1mfix

0
·
124
·
Apr 2026
W-61ColdTools8B32K

qwen3-8b-base-new-dpo-ultrafeedback-4xh200-batch-128-q_t-0.45-s_star-0.45-20260430-143919

0
·
124
·
Apr 2026
varshak1ColdTools8B32K

reproducing-openrubric-rubric-sft

0
·
124
·
May 2026
W-61ColdTools8B32K

qwen3-8b-base-kto-ultrafeedback-4xh200-batch-128

0
·
124
·
May 2026
NeelectricColdTools8B32K

Llama-3.1-8B-Instruct_SFT_mathsp_ewc_v00.04

0
·
124
·
May 2026
sohamb37lexsiColdTools4B32K

curatorkit-both-filtered-qwen3-1b7

0
·
124
·
May 2026
NeelectricColdTools8B32K

Llama-3.1-8B-Instruct_SFT_safetyv00.01

0
·
124
·
May 2026
maheshrawat18ColdTools4B32K

Qwen3-4B-2507-sft1

0
·
123
·
Apr 2026
laionColdTools8B32K

sera-subset-mixed-316-axolotl__Qwen3-8B-v8

0
·
123
·
Apr 2026
W-61ColdTools8B8K

llama-3-8b-base-new-dpo-hh-harmless-4xh200-batch-64-q_t-0.45-eta-0.1-s_star-0.6-20260428-045924

0
·
123
·
Apr 2026
KyleyeeColdTools2B32K

CPO_hh-seed5

0
·
123
·
Apr 2026
W-61ColdTools8B8K

llama-3-8b-base-new-dpo-hh-helpful-4xh200-batch-64-q_t-0.45-eta-0.1-s_star-0.6-20260428-045924

0
·
123
·
Apr 2026
DCAgentColdTools8B32K

g1_top8_31600_8b

0
·
123
·
Apr 2026
W-61ColdTools8B8K

llama3-hh-harmless-qt045-b0p5-20260429-085449

0
·
123
·
Apr 2026
W-61ColdTools8B32K

qwen3-8b-base-new-dpo-ultrafeedback-4xh200-batch-128-q_t-0.45-s_star-0.3-20260430-143919

0
·
123
·
Apr 2026
passing2961ColdTools8B32K

finch_8b_soft_without_held_out_expr_purpose_qwen_1.0e-5_1.0_train42_cosine

0
·
123
·
May 2026
ChuGyoukColdTools8B32K

Arguinas-Qwen3-8B-100p-lr4e5

0
·
123
·
May 2026
jackf857ColdTools8B32K

qwen3-8b-base-epsilon-dpo-hh-helpful-4xh200-batch-64-20260424-040306

0
·
122
·
Apr 2026
israelColdTools14B32K

AfriqueQwen-14B-multiturn_1

0
·
122
·
Apr 2026
ccui46ColdTools8B32K

cookingworld_per_chunk_act_q3_tokfix_diffPrompt_lowerLR_tformerPin_2000

0
·
122
·
Apr 2026
W-61ColdTools8B8K

llama3-hh-harmless-qt045-b0p3-20260429-085449

0
·
122
·
Apr 2026
W-61ColdTools8B32K

qwen3-8b-base-new-dpo-ultrafeedback-4xh200-batch-128-q_t-0.4-s_star-0.35-20260430-140517

0
·
122
·
Apr 2026
DCAgentColdTools32B32K

g1_top8_31600_32b

0
·
122
·
Apr 2026
InfiniAILabColdTools3B32K

OpenR1-Qwen-3B-SFT-Instruct

1
·
122
·
Mar 2025
NeiraColdTools500M32K

Qwen2.5-0.5B_adamw_v2

0
·
121
·
Apr 2026
W-61ColdTools8B8K

llama-3-8b-base-new-dpo-hh-helpful-4xh200-batch-64-s_star-0.4-eta-0.1-q_t-0.5

0
·
121
·
Apr 2026