Models

10,922
DCAgentColdTools8B32K

g1_gptlong_top8_8b

0
·
6
·
Apr 2026
DCAgentColdTools8B32K

g1_weighted_31600_8b_v2

0
·
6
·
Apr 2026
xw1234ganColdTools2B32K

NuminaMath_Main_fixed_SFTanchor_1_5B_step_3

0
·
6
·
Apr 2026
leoboboColdTools8B32K

qwen3-8b-chat-sft-16bit-unsloth

0
·
6
·
Apr 2026
SeongryongJungColdTools500M32K

qwen2.5-0.5b-ifeval-pure-kd

0
·
6
·
Apr 2026
mehuldamaniColdTools3B32K

countdown_arl-sft-add_multiply-v8

0
·
6
·
Apr 2026
choiqsColdTools2B32K

Qwen3-1.7B-tldr-bsz128-ts500-ranking1.528-skywork8b-seed42-lr1e-6-warmup10-checkpoint25

0
·
6
·
Apr 2026
sstoica12ColdTools8B32K

acquisition_llama-3_1-8b_bins_numina_proximity

0
·
6
·
Apr 2026
choiqsColdTools2B32K

Qwen3-1.7B-tldr-bsz128-ts500-ranking1.528-skywork8b-seed42-lr1e-6-warmup10-checkpoint75

0
·
6
·
Apr 2026
maheshrawat18ColdTools4B32K

Qwen3-4B-2507-sft-cv2

0
·
6
·
Apr 2026
Alelcv27ColdTools3B32K

Llama3.2-3B-Arcee-Code-Math

0
·
6
·
Apr 2026
Alelcv27ColdTools3B32K

Llama3.2-3B-SLERP-Math-Code

0
·
6
·
Apr 2026
choiqsColdTools2B32K

Qwen3-1.7B-ultrachat-bsz128-ts300-regular-qrm-seed42-lr1e-6-warmup10-checkpoint275

0
·
6
·
Apr 2026
choiqsColdTools2B32K

Qwen3-1.7B-ultrachat-bsz128-ts300-regular-skywork8b-seed42-lr1e-6-warmup10-checkpoint25

0
·
6
·
Apr 2026
ishikaaColdTools3B32K

acquisition_qwen3bins_numina_answer_variance

0
·
6
·
Apr 2026
alexxbobrColdTools1B32K

ORPO8000Vikhr-Llama-3.2-1B-Instruct5000

0
·
6
·
Apr 2026
olusegunolaCold1B2K

phi-1.5-raw-sft-control-merged

0
·
6
·
Apr 2026
kihyuks2ColdTools8B32K

A.X-4.0-Light-Sunbi-Merged

0
·
6
·
Apr 2026
choiqsColdTools2B32K

Qwen3-1.7B-ultrachat-bsz128-ts300-regular-skywork8b-seed42-lr1e-6-warmup10-checkpoint200

0
·
6
·
Apr 2026
DCAgent2ColdTools32B32K

g1_top8_85k_gptlong_swegym_32b_step1200__Qwen3-32B

0
·
6
·
May 2026
DCAgent2ColdTools32B32K

gptlong_continue_gptlongtezos_step600__Qwen3-32B

0
·
6
·
May 2026
choiqsColdTools2B32K

Qwen3-1.7B-ultrachat-bsz128-ts300-regular-skywork8b-seed42-lr1e-6-warmup10-checkpoint225

0
·
6
·
Apr 2026
jackf857ColdTools8B8K

llama-3-8b-base-slic-hf-ultrafeedback-4xh200

0
·
6
·
Apr 2026
jackf857ColdTools8B32K

qwen3-8b-base-epsilon-dpo-ultrafeedback-4xh200-batch-128

0
·
6
·
Apr 2026
xw1234ganColdTools2B32K

NuminaMath_Main_fixed_SFTanchor_1_5B_step_5

0
·
6
·
Apr 2026
choiqsColdTools2B32K

Qwen3-1.7B-ultrachat-bsz128-ts300-regular-skywork8b-seed42-lr1e-6-warmup10-checkpoint175

0
·
6
·
Apr 2026
DCAgent2ColdTools32B32K

gptlong_continue_top8diverse100k_step1200__Qwen3-32B

0
·
6
·
May 2026
laionColdTools8B32K

nemotron-terminal-dependency_management__Qwen3-8B

0
·
6
·
Apr 2026
DCAgent2ColdTools32B32K

gptlong_continue_top8diverse100k_step600__Qwen3-32B

0
·
6
·
May 2026
Thiraput01ColdTools4B32K

PeaceKeeper-4B

0
·
6
·
Apr 2026
DCAgent2ColdTools32B32K

gptlong_continue_gptlong_step1200__Qwen3-32B

0
·
6
·
May 2026
g-assismoraesColdTools4B32K

Qwen3-4B-it-pira-IRM-qairm-ptbr

0
·
6
·
Apr 2026
hcsmediagroupCold1B32K

gemma-3-1b-lysiane-advanced-merged

0
·
6
·
Apr 2026
DCAgent2ColdTools32B32K

g1_top8_gptlong_dist_31600_32b_step1410__Qwen3-32B

0
·
6
·
May 2026
DCAgent2ColdTools32B32K

g1_top8_diverse_100000_32b_step2400__Qwen3-32B

0
·
6
·
May 2026
jackf857ColdTools8B8K

llama-3-8b-base-kto-ultrafeedback-8xh200

0
·
6
·
Apr 2026
laionColdTools8B32K

nemotron-terminal-data_querying__Qwen3-8B

0
·
6
·
Apr 2026
g-assismoraesColdTools4B32K

Qwen3-4B-it-pira-ep3-qairm-ptbr

0
·
6
·
Apr 2026
laionColdTools8B32K

nemotron-terminal-data_science__Qwen3-8B

0
·
6
·
Apr 2026
BoyBarleyColdTools500M32K

BoyBarley-V28-Pro-Buddy

0
·
6
·
Apr 2026
amhinsonColdTools2B32K

strudel-refiner-1.5b-v1

0
·
6
·
Apr 2026
petersohCold1B32K

gemma-3-1b-it-sst5-merged

0
·
6
·
Apr 2026