Models

20,623
choiqsColdTools2B32K

Qwen3-1.7B-ultrachat-bsz128-ts300-regular-qrm-seed42-lr1e-6-warmup10-checkpoint100

0
·
7
·
Apr 2026
choiqsColdTools2B32K

Qwen3-1.7B-ultrachat-bsz128-ts300-regular-qrm-seed42-lr1e-6-warmup10-checkpoint75

0
·
7
·
Apr 2026
choiqsColdTools2B32K

Qwen3-1.7B-ultrachat-bsz128-ts300-regular-qrm-seed42-lr1e-6-warmup10-checkpoint150

0
·
7
·
Apr 2026
kikiyaaColdTools7B4K

Mistral-7B-dpo-full-tuned

0
·
7
·
Apr 2026
dawoon-jungColdTools8B32K

A.X-4.0-Light-Sunbi-Merged

0
·
7
·
Apr 2026
d2uxd2uxColdTools8B32K

A.X-4.0-Light-Sunbi-Merged

0
·
7
·
Apr 2026
kihyuks2ColdTools8B32K

A.X-4.0-Light-Sunbi-Merged

0
·
7
·
Apr 2026
raalrColdTools2B32K

Qwen2.5-1.5B-Instruct-ULD-gemma-3-27b-it

0
·
7
·
Apr 2026
choiqsColdTools2B32K

Qwen3-1.7B-ultrachat-bsz128-ts300-regular-skywork8b-seed42-lr1e-6-warmup10-checkpoint150

0
·
7
·
Apr 2026
jinhomokCold3B8K

sample_data2026

0
·
7
·
Apr 2026
jackf857ColdTools8B8K

llama-3-8b-base-slic-hf-ultrafeedback-4xh200

0
·
7
·
Apr 2026
choiqsColdTools2B32K

Qwen3-1.7B-ultrachat-bsz128-ts300-regular-skywork8b-seed42-lr1e-6-warmup10-checkpoint275

0
·
7
·
Apr 2026
Thiraput01ColdTools4B32K

PeaceKeeper-4B

0
·
7
·
Apr 2026
choiqsColdTools2B32K

Qwen3-1.7B-ultrachat-bsz128-ts300-regular-qrm-seed42-lr1e-6-warmup10-checkpoint225

0
·
7
·
Apr 2026
laionColdTools32B32K

g1_top8_85k_gptlong_swegym_32b_step300__Qwen3-32B

0
·
7
·
May 2026
jackf857ColdTools8B8K

llama-3-8b-base-kto-ultrafeedback-8xh200

0
·
7
·
Apr 2026
olusegunolaCold1B2K

phi-1.5-cot-control-r96-seed999-merged

0
·
7
·
Apr 2026
laionColdTools8B32K

nemotron-terminal-data_querying__Qwen3-8B

0
·
7
·
Apr 2026
laionColdTools8B32K

nemotron-terminal-file_operations__Qwen3-8B

0
·
7
·
Apr 2026
laionColdTools8B32K

nemotron-terminal-data_science__Qwen3-8B

0
·
7
·
Apr 2026
seopboColdTools2B32K

rlvrmath-qwen2.5-1.5b

0
·
7
·
Apr 2026
cosmos1030ColdTools2B32K

ad9f0ae0864d7fbcd1cd905e3c6c5b069cc8b562-gmp-s50pct-lr1e-5

0
·
7
·
May 2026
jackf857ColdTools8B8K

llama-3-8b-base-orpo-ultrafeedback-8xh200

0
·
7
·
Apr 2026
laionColdTools8B32K

nemotron-terminal-software_engineering__Qwen3-8B

0
·
7
·
Apr 2026
seopboColdTools2B32K

rlvrif-qwen2.5-1.5b

0
·
7
·
Apr 2026
olusegunolaCold1B2K

phi-1.5-stage3-sft-cloned-seed100-merged

0
·
7
·
Apr 2026
amphoraColdTools4B32K

qwen3-4b-think

0
·
7
·
Apr 2026
olusegunolaCold1B2K

phi-1.5-stage3-sft-cloned-seed999-merged

0
·
7
·
Apr 2026
gshaoColdTools4B32K

qwen3-4b-reasoning-16bit

0
·
7
·
Apr 2026
ajtaltarabukin2022ColdTools32B32K

sonnet1

0
·
7
·
Apr 2026
laionColdTools8B32K

nemotron-terminal-model_training__Qwen3-8B

0
·
7
·
Apr 2026
yufeng1ColdTools8B32K

OpenThinker-7B-reasoning-full-lora-max-type3-e5-5e6-2

0
·
7
·
Apr 2026
DCAgentColdTools8B32K

e1_askllm_d1_original_glm47

0
·
7
·
Apr 2026
michaelwavesColdTools70B32K

pacifist

0
·
7
·
Sep 2025
laionColdTools8B32K

nemotron-terminal-debugging__Qwen3-8B

0
·
7
·
Apr 2026
RockTokenColdTools4B32K

qwen3_30b_a3b_to_4b_offpolicy_20k

0
·
7
·
Apr 2026
void-818ColdTools32B32K

Affine-20-5Cft6kfbx5aacDLg3dJpEiz2GW2Sd3vqZPDd3jnjrsZzYZ6J

0
·
7
·
Apr 2026
unlearning-cleanslateColdTools8B32K

qwen3-8b-rmu-baseline

0
·
7
·
Apr 2026
jukofyorkColdTools500M32K

Kimi-K2-Instruct-DRAFT-0.6B-v3.0

1
·
7
·
Aug 2025
kmseongColdTools8B32K

llama3.1_8b_base-Safety-FT-lr3e-5

0
·
7
·
Apr 2026
doupariColdTools8B8K

llama3.1_8b_sft-llopa-k24-no_system-cnndm-train.summary.q60000-llopa-k24-no_system

0
·
7
·
Apr 2026
manhcuong2005ColdTools2B32K

qwen2.5-1.5b-legal-edu

0
·
7
·
Apr 2026