Models

19,398
LorenaYannnnnColdTools800M32K

bold_formatting-Qwen3-0.6B-baseline_all_tokens-seed_2

0
·
2
·
Apr 2026
jekunzCold1B32K

Gemma-3-1B-it-sv-SmolTalk

0
·
2
·
Apr 2026
jekunzCold1B32K

Gemma-3-1B-pt-sv-CPT-plus-IR-sv-SmolTalk

0
·
2
·
Apr 2026
jekunzCold1B32K

Gemma-3-1B-pt-sv-SmolTalk

0
·
2
·
Apr 2026
LorenaYannnnnColdTools800M32K

bold_formatting-Qwen3-0.6B-baseline_all_tokens-seed_1

0
·
2
·
Apr 2026
xw1234ganColdTools3B32K

GRPO_KL_Qwen2.5-3B-Instruct_MedQA_beta0.01_lr1e-05_mb2_ga128_n2048_seed42_HF_GEN

0
·
2
·
Apr 2026
laionColdTools32B32K

nemosci-tasrep-a1mfc-dev1-maxeps-swes-r2eg-32b__Qwen3-32B

0
·
2
·
Apr 2026
JunekhunterColdTools8B8K

llama-3.1-8b-neurotic-behavioral-behavioral_s42_lr1em05_r32_a64_e3

0
·
2
·
Apr 2026
sma1-rmarudColdTools8B32K

qwen-3-8b-thinkoff-not-i-olmo-step40

0
·
2
·
Apr 2026
HyeongwonColdTools4B32K

P2-split2_prob_rg_v2_Qwen3-4B-Base-0415

0
·
2
·
Apr 2026
arunasankCold9B16K

8c66jq2l

0
·
2
·
Apr 2026
HYGGEhyggeColdTools14B32K

qwen3_v1_gemini_2

0
·
2
·
Apr 2026
yufeng1ColdTools8B32K

OpenThinker-7B-reasoning-full-lora-max-type3-e3

0
·
2
·
Apr 2026
zero9techColdTools8B8K

Llama-3.1-8B-Data-Science-Insight-16.5K

0
·
2
·
Apr 2026
DCAgent2ColdTools32B32K

gptlong_continue_gptlong_step600__Qwen3-32B

0
·
2
·
May 2026
adithashCold3B8K

gemma2b-dolly-qlora-merged

0
·
2
·
Apr 2026
shopifyinterngrinderColdTools800M32K

sidekick-autocomplete-06b-clm-shopping

0
·
2
·
Apr 2026
DCAgent2ColdTools32B32K

gptlong_continue_top8diverse100k_step600__Qwen3-32B

0
·
2
·
May 2026
Enthusiast101ColdTools1B32K

llama3.2-3b-Inst-lox

0
·
2
·
Apr 2026
mohitskaushalCold3B8K

gemma-2b-it-qlora-merged

0
·
2
·
Apr 2026
aasim-mColdTools3B32K

daft-qwen2.5-coder-3b-instruct-full

0
·
2
·
Apr 2026
LorenaYannnnnColdTools800M32K

bold_formatting-Qwen3-0.6B-OURS_self-seed_1

0
·
2
·
Apr 2026
LorenaYannnnnColdTools800M32K

bold_formatting-Qwen3-0.6B-OURS_self-seed_2

0
·
2
·
Apr 2026
longtermriskColdTools4B32K

Qwen3-4B-ftjob-5d8108edb49a

0
·
2
·
Apr 2026
DCAgent2ColdTools32B32K

g1_top8_diverse_100000_32b_step2700__Qwen3-32B

0
·
2
·
May 2026
yufeng1ColdTools8B32K

OpenThinker-7B-type6-e5-max-alpha0_25-textsummarization-2e5-type6-e1-alpha0_375-2

0
·
2
·
Apr 2026
uos-nlpColdTools15B32K

STAR1-14B-notI-rlvr-step75

0
·
2
·
Apr 2026
darthcrawlColdTools7B4K

mistral-7b-instruct-v0.3-artisan

0
·
2
·
Apr 2026
cosmos1030ColdTools2B32K

ad9f0ae0864d7fbcd1cd905e3c6c5b069cc8b562-gmp-s70pct-lr1e-5

0
·
2
·
May 2026
DCAgent2ColdTools32B32K

gptlong_continue_gptlongtezos_step900__Qwen3-32B

0
·
2
·
May 2026
zeras141aCold1B2K

fb149ec7

0
·
2
·
Aug 2025
Johnny1024ColdTools4B32K

bs16-k10-lr5e-7-ema0.01-eopd0.8-qwen3-4b-think-sciknoweval_material_bottom20_nogap-maxsteps150

0
·
2
·
Apr 2026
JameSandColdTools2B32K

qwen3-1.7b-base-svd-muon-adam-lr3e-6-minNone-bs128-kl0.0-stampede3-global_step_200

0
·
2
·
Apr 2026
choiqsColdTools2B32K

Qwen3-1.7B-tldr-bsz128-ts500-regular-skywork8b-seed42-lr1e-5-warmup10-checkpoint375

0
·
2
·
Apr 2026
Hodfa71ColdTools8B8K

llama-8b-nb-delta-dpo

0
·
2
·
Apr 2026
Lixing-LiColdTools8B32K

CALYREX-LoRA-Baseline

0
·
2
·
Apr 2026
yufeng1ColdTools8B32K

OpenThinker-7B-type6-e5-max-alpha0_25-textsummarization-2e5-type6-e1-alpha0_3125-2

0
·
2
·
Apr 2026
choiqsColdTools2B32K

Qwen3-1.7B-tldr-bsz128-ts500-regular-skywork8b-seed42-lr1e-5-warmup10-checkpoint350

0
·
2
·
Apr 2026
yufeng1ColdTools8B32K

OpenThinker-7B-reasoning-full-lora-max-type3-e1

0
·
2
·
Apr 2026
lihaoxin2020ColdTools4B32K

qwen3-4B-refiner-3201-rl-balanced-step100

0
·
2
·
Apr 2026
JunekhunterColdTools4B32K

qwen3-4b-neurotic-behavioral-behavioral_s42_lr1em05_r32_a64_e3

0
·
2
·
Apr 2026
choiqsColdTools2B32K

Qwen3-1.7B-tldr-bsz128-ts500-regular-skywork8b-seed42-lr1e-5-warmup10-checkpoint300

0
·
2
·
Apr 2026