Models

41,298
jekunzColdTools2B32K

Qwen3-1.7B-Base-sv-SmolTalk

0
·
52
·
Apr 2026
yufeng1ColdTools8B32K

OpenThinker-7B-type6-e5-max-b32-alpha0_25

0
·
52
·
Apr 2026
rthomasbpiColdTools8B32K

keystone-gpt-v131-merged

0
·
52
·
Apr 2026
finnvoorheesColdTools500M32K

tiny-coder-prompt-completion-0.5B

0
·
52
·
Apr 2026
agarwalanu3103ColdTools800M32K

clarify-rl-grpo-qwen3-0.6b

0
·
52
·
Apr 2026
AngelRaychevColdTools800M32K

qwen3-0.6b-sciq-v7

0
·
52
·
Apr 2026
Abhinav-hfColdTools3B32K

data-pipeline-incident-qwen-grpo

0
·
52
·
Apr 2026
MCult01ColdTools9B32K

glm-muse-clean-v1

0
·
52
·
Apr 2026
smsk1999ColdTools8B32K

qwen3-8b-profiling-merged-v4

0
·
52
·
Apr 2026
KyleyeeColdTools2B32K

CPO_hh-seed2

0
·
52
·
Apr 2026
WasamiKiruaColdTools12B32K

Sakura-Sniper-12B

0
·
52
·
Apr 2026
W-61ColdTools8B8K

llama-3-8b-base-new-dpo-hh-harmless-4xh200-batch-64-q_t-0.45-s_star-0.4-eta-8

0
·
52
·
Apr 2026
pkupieColdTools3B32K

Qwen2.5-3B-bo-cpt

0
·
52
·
Apr 2026
W-61ColdTools8B8K

llama-3-8b-base-new-dpo-hh-helpful-4xh200-batch-64-s_star-0.4-eta-0.1-q_t-0.4

0
·
52
·
Apr 2026
DCAgentColdTools8B32K

g1_top8_31600_8b

0
·
52
·
Apr 2026
lebirajaColdTools8B32K

customer-support-grpo

0
·
52
·
Apr 2026
KyleyeeColdTools2B32K

ORPO_hh-seed3

0
·
52
·
Apr 2026
xw1234ganColdTools3B32K

cnk12_Main_fixed_SFTanchor_3B_step_1

0
·
52
·
Apr 2026
jackf857ColdTools8B8K

llama-3-8b-base-new-dpo-hh-harmless-4xh200-batch-64-q_t-0.5-s_star-0.85

0
·
52
·
Apr 2026
W-61ColdTools8B8K

llama3-hh-harmless-qt045-b0p01-20260429-085449

0
·
52
·
Apr 2026
doupariColdTools8B32K

llama3.1_8b_sft-llopa-k24-no_system-opencode-train.code.q60000-llopa-k24-no_system

0
·
52
·
Apr 2026
W-61ColdTools8B8K

llama-3-8b-base-new-dpo-hh-helpful-4xh200-batch-64-q_t-0.45-s_star-0.4-eta-5

0
·
52
·
Apr 2026
xw1234ganColdTools3B32K

cnk12_Main_fixed_SFTanchor_3B_step_4

0
·
52
·
Apr 2026
KyleyeeColdTools2B32K

ORPO_hh-seed2

0
·
52
·
Apr 2026
W-61ColdTools8B8K

llama-3-8b-base-new-dpo-hh-harmless-4xh200-batch-64-q_t-0.45-eta-0.1-s_star-0.45-20260428-045924

0
·
52
·
Apr 2026
anonymousubmissionColdTools8B32K

Qwen3-8B-medical-reasoning

0
·
52
·
Oct 2025
Saurav1ColdTools2B32K

pm-ops-grpo-Qwen3-1.7B-triage

0
·
52
·
Apr 2026
Bialy17ColdTools8B32K

qwen-finetuned-2500

0
·
52
·
Apr 2026
W-61ColdTools8B8K

llama3-hh-harmless-qt045-b0p5-20260429-085449

0
·
52
·
Apr 2026
xw1234ganColdTools3B32K

olympiads_Main_fixed_BaseAnchor_3B_step_1

0
·
52
·
Apr 2026
wvnvwnCold13B4K

llama-2-13b-chat-hf-lr5e-5-resta-0.5

0
·
52
·
Apr 2026
dineshpiyasamaraCold7B4K

Llama-2-7b-hf-sentiment-analysis-bootcamp

0
·
52
·
Apr 2026
jackf857ColdTools8B8K

llama-3-8b-base-new-dpo-hh-helpful-4xh200-batch-64-q_t-0.5-s_star-0.4

0
·
52
·
Apr 2026
xw1234ganColdTools2B32K

cnk12_Main_fixed_BaseAnchor_1_5B_step_3

0
·
52
·
Apr 2026
Nirbhayhero07ColdTools500M32K

deepsentinel-overseer-small

0
·
52
·
Apr 2026
KyleyeeColdTools2B32K

rDPO_hh-seed2

0
·
52
·
Apr 2026
ravindravalaCold1B32K

kryzeLLM

0
·
52
·
Apr 2026
mitchcross895ColdTools8B32K

Qwen2.5-7B-Instruct

0
·
52
·
Apr 2026
SapphireGaze429ColdTools8B32K

opensecops-qwen2.5-7b-grpo

0
·
52
·
Apr 2026
W-61ColdTools8B8K

llama-3-8b-base-r-dpo-ultrafeedback-4xh200-batch-128-20260426-105614

0
·
52
·
Apr 2026
W-61ColdTools8B32K

qwen3-8b-base-new-dpo-ultrafeedback-4xh200-batch-128-q_t-0.4-s_star-0.35-20260430-140517

0
·
52
·
Apr 2026
xw1234ganColdTools3B32K

cnk12_GRPO_KL_Qwen2.5-3B-Instruct_beta0.01_lr1e-05_mb2_ga128_n2048_seed42

0
·
52
·
Apr 2026