Models

41,346
yufeng1ColdTools8B32K

OpenThinker-7B-type6-e5-max-1e5-alpha0_4990234375

0
·
52
·
Apr 2026
kmseongCold7B4K

llama2-7b-safedelta-scale0.5

0
·
52
·
Apr 2026
aymanabeelColdTools8B32K

pakistan-bail-law-ai

0
·
52
·
Apr 2026
MCult01ColdTools9B32K

glm-muse-feral-v5

0
·
52
·
Apr 2026
iproskurinaColdTools500M32K

qwen-hf-fewshot-iter-np-iter2

0
·
52
·
Apr 2026
xw1234ganColdTools3B32K

cnk12_Main_fixed_SFTanchor_3B_step_2

0
·
52
·
Apr 2026
xw1234ganColdTools2B32K

cnk12_Main_fixed_BaseAnchor_1_5B_step_6

0
·
52
·
Apr 2026
jackf857ColdTools8B32K

qwen3-8b-base-epsilon-dpo-hh-harmless-4xh200-batch-64-20260424-040415

0
·
52
·
Apr 2026
iproskurinaColdTools500M32K

qwen-hf-iter-np-iter1

0
·
52
·
Apr 2026
abhi14ColdTools2B32K

test-grpo-delete-me

0
·
52
·
Apr 2026
doupariColdTools8B32K

llama3.1_8b_sft-vanilla-nemotron-math-high.math.q60000-vanilla

0
·
52
·
Apr 2026
ZhaziraNZACold1B2K

tinyllama-chat-finetune

0
·
52
·
Apr 2026
Alelcv27ColdTools8B32K

Llama3.1-8B-Base-DARETIES-Math-Code

0
·
52
·
Apr 2026
pratinavsethColdTools800M32K

cricket-captain-qwen3-06b-merged

0
·
52
·
Apr 2026
W-61ColdTools8B8K

llama-3-8b-base-new-dpo-hh-harmless-4xh200-batch-64-q_t-0.45-s_star-0.4-eta-1

0
·
52
·
Apr 2026
doupariColdTools8B32K

llama3.1_8b_sft-llopa-k28-no_system-nemotron-math-high.math.q60000-llopa-k28-no_system

0
·
52
·
Apr 2026
Alelcv27ColdTools8B32K

Llama3.1-8B-Base-SLERP-Math-Code

0
·
52
·
Apr 2026
xw1234ganColdTools3B32K

cnk12_Main_fixed_SFTanchor_3B_step_6

0
·
52
·
Apr 2026
choiqsColdTools2B32K

Qwen3-1.7B-tldr-bsz128-ts500-ranking1.429-skywork8b-seed42-lr1e-6-warmup10-checkpoint250

0
·
52
·
Apr 2026
W-61ColdTools8B8K

llama-3-8b-base-new-dpo-hh-helpful-4xh200-batch-64-q_t-0.45-s_star-0.4-eta-0.3

0
·
52
·
Apr 2026
choiqsColdTools2B32K

Qwen3-1.7B-tldr-bsz128-ts500-ranking1.429-skywork8b-seed42-lr1e-6-warmup10-checkpoint175

0
·
52
·
Apr 2026
jekunzColdTools2B32K

Qwen3-1.7B-sv-SmolTalk

0
·
52
·
Apr 2026
StephenJHardyColdTools500M32K

maze-cuda-sft-qwen2.5-0.5b

0
·
52
·
Apr 2026
jekunzColdTools2B32K

Qwen3-1.7B-Base-sv-SmolTalk

0
·
52
·
Apr 2026
yufeng1ColdTools8B32K

OpenThinker-7B-type6-e5-max-b32-alpha0_25

0
·
52
·
Apr 2026
rthomasbpiColdTools8B32K

keystone-gpt-v131-merged

0
·
52
·
Apr 2026
finnvoorheesColdTools500M32K

tiny-coder-prompt-completion-0.5B

0
·
52
·
Apr 2026
agarwalanu3103ColdTools800M32K

clarify-rl-grpo-qwen3-0.6b

0
·
52
·
Apr 2026
AngelRaychevColdTools800M32K

qwen3-0.6b-sciq-v7

0
·
52
·
Apr 2026
Abhinav-hfColdTools3B32K

data-pipeline-incident-qwen-grpo

0
·
52
·
Apr 2026
MCult01ColdTools9B32K

glm-muse-clean-v1

0
·
52
·
Apr 2026
smsk1999ColdTools8B32K

qwen3-8b-profiling-merged-v4

0
·
52
·
Apr 2026
KyleyeeColdTools2B32K

CPO_hh-seed2

0
·
52
·
Apr 2026
WasamiKiruaColdTools12B32K

Sakura-Sniper-12B

0
·
52
·
Apr 2026
W-61ColdTools8B8K

llama-3-8b-base-new-dpo-hh-harmless-4xh200-batch-64-q_t-0.45-s_star-0.4-eta-8

0
·
52
·
Apr 2026
pkupieColdTools3B32K

Qwen2.5-3B-bo-cpt

0
·
52
·
Apr 2026
W-61ColdTools8B8K

llama-3-8b-base-new-dpo-hh-helpful-4xh200-batch-64-s_star-0.4-eta-0.1-q_t-0.4

0
·
52
·
Apr 2026
DCAgentColdTools8B32K

g1_top8_31600_8b

0
·
52
·
Apr 2026
lebirajaColdTools8B32K

customer-support-grpo

0
·
52
·
Apr 2026
KyleyeeColdTools2B32K

ORPO_hh-seed3

0
·
52
·
Apr 2026
xw1234ganColdTools3B32K

cnk12_Main_fixed_SFTanchor_3B_step_1

0
·
52
·
Apr 2026
W-61ColdTools8B8K

llama3-hh-harmless-qt045-b0p01-20260429-085449

0
·
52
·
Apr 2026