Models

10,985
longtermriskColdTools4B32K

Qwen3-4B-ftjob-60507de3e958

0
·
4
·
Apr 2026
longtermriskColdTools4B32K

Qwen3-4B-Instruct-2507-ftjob-35d4281f0d6c

0
·
4
·
Apr 2026
jackf857ColdTools8B32K

qwen3-8b-base-epsilon-dpo-hh-harmless-4xh200-batch-64

0
·
4
·
Apr 2026
AlexisL7ColdTools2B32K

qwen2.5-1.5B-AA-merged

0
·
4
·
Apr 2026
longtermriskColdTools2B32K

Qwen3-1.7B-ftjob-64f70ccd79a1

0
·
4
·
Apr 2026
dmody1ColdTools1B32K

llama-1b-mean-matched-l1-lam100

0
·
4
·
Apr 2026
rrvaswinColdTools8B32K

qwen_4b_SFT

0
·
4
·
May 2026
arunasankCold9B16K

vmi84cw1

0
·
4
·
Apr 2026
arunasankCold9B16K

bm8n3mum

0
·
4
·
Apr 2026
xw1234ganColdTools2B32K

Main_fixed_MATH_1_5B_BaseAnchor_step_7

0
·
4
·
Apr 2026
eekayCold3B8K

gemma-2b-it-noised-np0.15-emb

0
·
4
·
Apr 2026
arunasankCold9B16K

iahvbzve

0
·
4
·
Apr 2026
sstoica12ColdTools8B32K

acquisition_llama-3_1-8b_bins_numina_format

0
·
4
·
Apr 2026
VfraeCold9B16K

Diab4Imp-Meditron-Gemma2-9B

0
·
4
·
Apr 2026
RomiologyColdTools15B32K

swnex-sonex-14b-c3-merged

0
·
4
·
Apr 2026
yufeng1ColdTools8B32K

OpenThinker-7B-reasoning-full-lora-max-type3-e5-b64-2

0
·
4
·
Apr 2026
eekayCold3B8K

gemma-2b-it-noised-np0.25-attn-emb

0
·
4
·
Apr 2026
vallerieeColdTools2B32K

Qwen3-1.7B-student-refusal-integer-logitkd

0
·
4
·
Apr 2026
DCAgentColdTools32B32K

pipeline_combined_500k-Qwen3-32B-step2500

0
·
4
·
Apr 2026
longtermriskColdTools2B32K

Qwen3-1.7B-Base-ftjob-a80db7d5d8d6

0
·
4
·
Apr 2026
hkseo95Cold1B32K

gemma-3-1b-it-Math-SFT

0
·
4
·
Apr 2026
jackf857ColdTools8B8K

llama-3-8b-base-new-dpo-hh-helpful-s_star1.0-4xh200-batch-64-20260421-233802

0
·
4
·
Apr 2026
xw1234ganColdTools2B32K

Main_fixed_MATH_1_5B_BaseAnchor_step_8

0
·
4
·
Apr 2026
jordanpainterColdTools8B32K

diallm-llama-gspo-ind

0
·
4
·
Apr 2026
mehuldamaniColdTools8B32K

bug_fixing_rlvr-7b-v4

0
·
4
·
Apr 2026
jackf857ColdTools8B8K

llama-3-8b-base-margin-dpo-hh-harmless-beta0.01

0
·
4
·
Apr 2026
longtermriskColdTools4B32K

Qwen3-4B-ftjob-3a8dc7a54735

0
·
4
·
Apr 2026
nassimjpColdTools7B4K

Maral-7B-alpha-1

0
·
4
·
Apr 2026
manhcuong2005ColdTools2B32K

qwen2.5-1.5b-legal-intent

0
·
4
·
Apr 2026
olusegunolaCold1B2K

phi-1.5-cot-only-control-merged

0
·
4
·
Apr 2026
mehuldamaniColdTools8B32K

bug_fixing_arl-7b-addmultiply-v4

0
·
4
·
Apr 2026
xw1234ganColdTools8B32K

Main_fixed_MATH_7B_step_7

0
·
4
·
Apr 2026
jekunzCold1B32K

Gemma-3-1B-pt-is-CPT-is-SmolTalk

0
·
4
·
Apr 2026
manhcuong2005ColdTools2B32K

qwen2.5-1.5b-legal-edu-v4

0
·
4
·
Apr 2026
jordanpainterColdTools8B32K

diallm-qwen-gspo-aus

0
·
4
·
Apr 2026
myyycroftColdTools8B32K

Qwen2.5-7B-Instruct-es-em-bad-medical-advice-epoch-9-deberta-nli-reward

0
·
4
·
Apr 2026
manhcuong2005ColdTools2B32K

qwen2.5-1.5b-legal-edu-v3

0
·
4
·
Apr 2026
AlienKevinColdTools8B32K

marin-8b-instruct-sft-terminalcorpus

0
·
4
·
Apr 2026
myyycroftColdTools8B32K

Qwen2.5-7B-Instruct-es-em-bad-medical-advice-epoch-7-deberta-nli-reward

0
·
4
·
Apr 2026
uos-nlpColdTools33B32K

STAR1-32B-notI-rlvr-step100

0
·
4
·
Apr 2026
W-61ColdTools8B32K

qwen3-8b-base-sft-hh-harmless-8xh200

0
·
4
·
Apr 2026
jekunzCold1B32K

Gemma-3-1B-it-sv-SmolTalk

0
·
4
·
Apr 2026