Models

10,895
choiqsColdTools2B32K

Qwen3-1.7B-ultrachat-bsz128-ts300-regular-skywork8b-seed42-lr1e-6-warmup10-checkpoint275

0
·
5
·
Apr 2026
yufeng1ColdTools8B32K

OpenThinker-7B-type6-e5-max-alpha0_25-textsummarization-2e5-type6-e1-alpha0_5-2

0
·
5
·
Apr 2026
choiqsColdTools2B32K

Qwen3-1.7B-ultrachat-bsz128-ts300-regular-qrm-seed42-lr1e-6-warmup10-checkpoint225

0
·
5
·
Apr 2026
DCAgent2ColdTools32B32K

tezos100k_continue_top8diverse100k_step1500__Qwen3-32B

0
·
5
·
May 2026
Johnny1024ColdTools4B32K

bs16-k10-lr5e-7-ema0.01-eopd0.8-qwen3-4b-think-sciknoweval_chem_bottom20_nogap-maxsteps150

0
·
5
·
Apr 2026
yufeng1ColdTools8B32K

OpenThinker-7B-type6-e5-max-alpha0_25-textsummarization-2e5-type6-e1-alpha0_25-2

0
·
5
·
Apr 2026
yipchifaiColdTools2B32K

Qwen2.5-1.5B-Instruct

0
·
5
·
Apr 2026
xw1234ganColdTools2B32K

Main_fixed_MATH_1_5B_BaseAnchor_step_1

0
·
5
·
Apr 2026
W-61ColdTools8B8K

llama-3-8b-base-new-dpo-hh-harmless-s_star0.6-4xh200-batch-64-20260422-051621

0
·
5
·
Apr 2026
jackf857ColdTools8B8K

llama-3-8b-base-ipo-ultrafeedback-8xh200

0
·
5
·
Apr 2026
mohitskaushalCold3B8K

gemma-2b-it-qlora-merged

0
·
5
·
Apr 2026
Johnny1024ColdTools4B32K

bs16-k10-lr5e-7-ema0.01-eopd0.8-qwen3-4b-think-sciknoweval_bio_bottom20_nogap-maxsteps150

0
·
5
·
Apr 2026
lihaoxin2020ColdTools4B32K

qwen3-4B-refiner-sft-rl-balanced-resume-step100

0
·
5
·
Apr 2026
ajtaltarabukin2022ColdTools32B32K

merged_champion_v5_m3

0
·
5
·
Apr 2026
LaoyujieColdTools8B32K

merged-qwen-ties

0
·
5
·
Apr 2026
Johnny1024ColdTools4B32K

bs16-k10-lr5e-7-ema0.01-eopd0.8-qwen3-4b-think-sciknoweval_physics_bottom20_nogap-maxsteps150

0
·
5
·
Apr 2026
xw1234ganColdTools2B32K

Main_fixed_MATH_1_5B_BaseAnchor_step_2

0
·
5
·
Apr 2026
DokakaCold1B2K

Kira

0
·
5
·
Apr 2026
yufeng1ColdTools8B32K

OpenThinker-7B-type6-e5-max-alpha0_25-textsummarization-2e5-type6-e1-alpha0_375-2

0
·
5
·
Apr 2026
darthcrawlColdTools7B4K

mistral-7b-instruct-v0.3-artisan

0
·
5
·
Apr 2026
ligeng-devColdTools8B32K

tw-data-train_final_v2_nb2_mt8192_replaced_fix-8node-resume

0
·
5
·
Apr 2026
psh3333ColdTools3B32K

llama-3.2-3b-grpo-merged

0
·
5
·
Apr 2026
vazievrColdTools32B32K

MetalGPT-1

0
·
5
·
Apr 2026
Johnny1024ColdTools4B32K

bs16-k10-lr5e-7-ema0.01-eopd0.8-qwen3-4b-think-sciknoweval_material_bottom20_nogap-maxsteps150

0
·
5
·
Apr 2026
sthapsColdTools8B32K

openthaigpt-thaillm-8b-instruct-v0.7.2-research-preview-light-uncen

0
·
5
·
Apr 2026
choiqsColdTools2B32K

Qwen3-1.7B-tldr-bsz128-ts500-regular-skywork8b-seed42-lr1e-5-warmup10-checkpoint375

0
·
5
·
Apr 2026
olusegunolaCold1B2K

phi-1.5-cot-control-r96-seed100-merged

0
·
5
·
Apr 2026
choiqsColdTools2B32K

Qwen3-1.7B-tldr-bsz128-ts500-regular-skywork8b-seed42-lr1e-5-warmup10-checkpoint350

0
·
5
·
Apr 2026
yufeng1ColdTools8B32K

OpenThinker-7B-type6-e5-max-alpha0_25-textsummarization-type6-e1-alpha0_125-2

0
·
5
·
Apr 2026
xw1234ganColdTools8B32K

Merging_Prob_Qwen2.5-7B-Instruct_MATH_lr1e-05_mb2_ga128_n2048_seed42

0
·
5
·
Apr 2026
choiqsColdTools2B32K

Qwen3-1.7B-tldr-bsz128-ts500-regular-skywork8b-seed42-lr1e-5-warmup10-checkpoint300

0
·
5
·
Apr 2026
yufeng1ColdTools8B32K

OpenThinker-7B-reasoning-full-lora-max-type3-e5-1e5

0
·
5
·
Apr 2026
sreejanjalagamColdTools500M32K

lead-architect-compliance

0
·
5
·
Apr 2026
choiqsColdTools2B32K

Qwen3-1.7B-tldr-bsz128-ts500-regularsqrt2-skywork8b-seed42-lr1e-6-warmup10-checkpoint375

0
·
5
·
Apr 2026
eekayCold3B8K

gemma-2b-it-noised-np0.2-emb

0
·
5
·
Apr 2026
Radiant28ColdTools2B32K

evolai-mamba2-0047b

0
·
5
·
Apr 2026
SCL2025ColdTools8B32K

KG-R1-CWQ-7B

0
·
5
·
Apr 2026
Johnny1024ColdTools4B32K

intuitor-sciknoweval_bio-qwen3-4b-think-2507-r6k100

0
·
5
·
Apr 2026
wincentIsMeColdTools800M32K

Qwen3-0.6B-finetuned-astro-horoscope-fsdp

0
·
5
·
Apr 2026
wvnvwnColdTools8B32K

qwen-2.5-7B-Instruct-SSFT-lr5e-5

0
·
5
·
Apr 2026
W-61ColdTools8B8K

llama-3-8b-base-new-dpo-hh-harmless-s_star0.85-4xh200-batch-64-20260421-213851

0
·
5
·
Apr 2026
ReginaNasyrovaColdTools4B32K

4B-Instruct-STE

0
·
5
·
Apr 2026