Models

5,770
KyleyeeColdTools2B32K

DrDPO_hh-seed2

0
·
121
·
Apr 2026
W-61ColdTools8B8K

llama-3-8b-base-new-dpo-ultrafeedback-4xh200-batch-128-q_t-0.45-s_star-0.35-20260428-045924

0
·
121
·
Apr 2026
KyleyeeColdTools2B32K

DrDPO_hh-seed5

0
·
121
·
Apr 2026
ccui46ColdTools8B32K

cookingworld_per_chunk_act_q3_tokfix_diffPrompt_lowerLR_tformerPin_8000

0
·
121
·
Apr 2026
KyleyeeColdTools2B32K

CPO_hh-seed3

0
·
121
·
Apr 2026
W-61ColdTools8B8K

llama3-hh-harmless-qt045-b0p01-20260429-085449

0
·
121
·
Apr 2026
W-61ColdTools8B8K

llama-3-8b-base-new-dpo-hh-harmless-4xh200-batch-64-q_t-0.45-eta-0.1-s_star-0.45-20260428-045924

0
·
121
·
Apr 2026
Milan20ColdTools500M32K

hospital-coord-agent

0
·
121
·
Apr 2026
HyeongwonColdTools4B32K

P2-split2_independent_mask_Qwen3-4B-Base_0425-bs64-epoch3

0
·
121
·
Apr 2026
W-61ColdTools8B8K

llama-3-8b-base-new-dpo-ultrafeedback-4xh200-batch-128-q_t-0.43-s_star-0.4-20260429-230725

0
·
121
·
Apr 2026
boradorishColdTools1B32K

llama3-1B-sft

0
·
121
·
May 2026
KyleyeeColdTools2B32K

DrDPO_hh-seed3

0
·
120
·
Apr 2026
KyleyeeColdTools2B32K

CPO_hh-seed2

0
·
120
·
Apr 2026
W-61ColdTools8B8K

llama-3-8b-base-new-dpo-hh-helpful-4xh200-batch-64-q_t-0.45-s_star-0.4-eta-8

0
·
120
·
Apr 2026
W-61ColdTools8B8K

llama-3-8b-base-new-dpo-hh-harmless-4xh200-batch-64-q_t-0.45-s_star-0.4-eta-8

0
·
120
·
Apr 2026
jackf857ColdTools8B8K

llama-3-8b-base-r-dpo-ultrafeedback-4xh200-batch-128-20260428-035521

0
·
120
·
Apr 2026
W-61ColdTools8B8K

llama-3-8b-base-new-dpo-hh-helpful-4xh200-batch-64-s_star-0.4-eta-0.1-q_t-0.43

0
·
120
·
Apr 2026
roonbugCold9B16K

ouiwt7cn

0
·
120
·
Apr 2026
M134praColdTools500M32K

jailbreak-arena-defender

0
·
120
·
Apr 2026
Naseer-010ColdTools8B32K

Qwen3-8B-Finetuned-DIME

0
·
120
·
Apr 2026
KyleyeeColdTools2B32K

IPO_hh-seed3

0
·
120
·
Apr 2026
arunasankCold9B16K

lkv6tn5l

0
·
120
·
Apr 2026
md896ColdTools500M32K

sql-debug-agent-qwen25-05b-grpo-wandb-best

0
·
120
·
Apr 2026
arunasankCold9B16K

xz4e78xm

0
·
120
·
Apr 2026
L1nusColdTools4B32K

qwen3-4b-instruct-2507-pubmedqa-full-no-ctx-default

0
·
120
·
May 2026
jekunzColdTools2B32K

Qwen3-1.7B-is-SmolTalk

0
·
119
·
Apr 2026
jekunzColdTools2B32K

Qwen3-1.7B-sv-CPT-sv-SmolTalk

0
·
119
·
Apr 2026
ccui46ColdTools8B32K

cookingworld_per_chunk_act_q3_tokfix_diffPrompt_lowerLR_tformerPin_4000

0
·
119
·
Apr 2026
W-61ColdTools8B8K

llama-3-8b-base-new-dpo-hh-helpful-4xh200-batch-64-q_t-0.45-s_star-0.4-eta-0.3

0
·
119
·
Apr 2026
W-61ColdTools8B8K

llama-3-8b-base-new-dpo-hh-helpful-4xh200-batch-64-s_star-0.4-eta-0.1-q_t-0.48

0
·
119
·
Apr 2026
KyleyeeColdTools2B32K

ORPO_hh-seed5

0
·
119
·
Apr 2026
Itachi-42ColdTools4B32K

loomstack-qwen-4b-sft

0
·
119
·
Apr 2026
jackf857ColdTools8B8K

llama-3-8b-base-ipo-ultrafeedback-4xh200-batch-128-20260428-004616

0
·
119
·
Apr 2026
KyleyeeColdTools2B32K

HINGE_hh-seed2

0
·
119
·
Apr 2026
W-61ColdTools8B8K

llama-3-8b-base-new-dpo-hh-helpful-4xh200-batch-64-q_t-0.45-eta-0.1-s_star-0.35-20260428-045924

0
·
119
·
Apr 2026
laionColdTools8B32K

CoderForge-Preview-v6-1000-axolotl__Qwen3-8B-v8

0
·
119
·
Apr 2026
ccui46ColdTools8B32K

cookingworld_per_chunk_act_q3_tokfix_diffPrompt_lowerLR_tformerPin_1000

0
·
119
·
Apr 2026
Aaryan369ColdTools3B32K

civicflow-sft-qwen2.5-3b

0
·
119
·
Apr 2026
KyleyeeColdTools2B32K

IPO_hh-seed5

0
·
119
·
Apr 2026
mjf-suColdTools4B32K

PhysicalAI-base-VLA

0
·
119
·
Mar 2026
ChuGyoukColdTools8B32K

Arguinas-Qwen3-8B-100p-lr3e6

0
·
119
·
May 2026
hrutikghaghadaColdTools8B32K

TwinLlama-3.1-8B

0
·
119
·
May 2026