Models

20,026
cjiaoColdTools2B32K

OpenThinker3-1.5B-checkpoint-375

0
·
3
·
Apr 2026
xw1234ganColdTools3B32K

GRPO_KL_Qwen2.5-3B-Instruct_MedQA_beta0.01_lr1e-05_mb2_ga128_n2048_seed42_HF_GEN

0
·
3
·
Apr 2026
aasim-mColdTools3B32K

daft-qwen2.5-coder-3b-instruct-full-loss-0.02

0
·
3
·
Apr 2026
laionColdTools32B32K

nemosci-tasrep-a1mfc-dev1-maxeps-swes-r2eg-32b__Qwen3-32B

0
·
3
·
Apr 2026
JunekhunterColdTools8B8K

llama-3.1-8b-neurotic-behavioral-behavioral_s42_lr1em05_r32_a64_e3

0
·
3
·
Apr 2026
David-Chew-HLColdTools8B32K

qwen3_8b_science

0
·
3
·
Apr 2026
zero9techColdTools8B32K

Qwen3-8B-Data-Science-Insight-16.5K

0
·
3
·
Apr 2026
arunasankCold9B16K

8c66jq2l

0
·
3
·
Apr 2026
R0mAIColdTools4B32K

reliquary-math

0
·
3
·
Apr 2026
yufeng1ColdTools8B32K

OpenThinker-7B-reasoning-full-lora-max-type3-e3

0
·
3
·
Apr 2026
choiqsColdTools2B32K

Qwen3-1.7B-tldr-bsz128-ts500-ranking1.429-skywork8b-seed42-lr1e-6-warmup10-checkpoint325

0
·
3
·
Apr 2026
DCAgent2ColdTools32B32K

gptlong_continue_gptlong_step600__Qwen3-32B

0
·
3
·
May 2026
adithashCold3B8K

gemma2b-dolly-qlora-merged

0
·
3
·
Apr 2026
DCAgent2ColdTools32B32K

gptlong_continue_top8diverse100k_step600__Qwen3-32B

0
·
3
·
May 2026
yufeng1ColdTools8B32K

OpenThinker-7B-type6-e5-max-alpha0_25-textsummarization-2e5-type6-e1-alpha0_5-2

0
·
3
·
Apr 2026
choiqsColdTools2B32K

Qwen3-1.7B-tldr-bsz128-ts500-ranking1.429-skywork8b-seed42-lr1e-6-warmup10-checkpoint300

0
·
3
·
Apr 2026
YuQHColdTools2B32K

Assignment3_Question1_qwen3-1.7b-backward-merged

0
·
3
·
Apr 2026
yufeng1ColdTools8B32K

OpenThinker-7B-type6-e5-max-alpha0_25-textsummarization-2e5-type6-e1-alpha0_25-2

0
·
3
·
Apr 2026
DCAgentColdTools32B32K

g1_top8_gptlong_dist_31600_32b_step900__Qwen3-32B

0
·
3
·
May 2026
aasim-mColdTools3B32K

daft-qwen2.5-coder-3b-instruct-full

0
·
3
·
Apr 2026
Johnny1024ColdTools4B32K

bs16-k10-lr5e-7-ema0.01-eopd0.8-qwen3-4b-think-sciknoweval_physics_bottom20_nogap-maxsteps150

0
·
3
·
Apr 2026
longtermriskColdTools4B32K

Qwen3-4B-ftjob-5d8108edb49a

0
·
3
·
Apr 2026
megabytesColdTools4B32K

Jan-v3-4B-base-instruct-heretic

1
·
3
·
Feb 2026
DCAgent2ColdTools32B32K

g1_top8_diverse_100000_32b_step2700__Qwen3-32B

0
·
3
·
May 2026
yufeng1ColdTools8B32K

OpenThinker-7B-type6-e5-max-alpha0_25-textsummarization-2e5-type6-e1-alpha0_375-2

0
·
3
·
Apr 2026
darthcrawlColdTools7B4K

mistral-7b-instruct-v0.3-artisan

0
·
3
·
Apr 2026
DCAgent2ColdTools32B32K

gptlong_continue_gptlongtezos_step900__Qwen3-32B

0
·
3
·
May 2026
laionColdTools32B32K

nemotron-terminal-corpus-unified-316__Qwen3-32B

0
·
3
·
Apr 2026
pbeartColdTools1B32K

magictokens_finetune_merged

0
·
3
·
Oct 2025
Johnny1024ColdTools4B32K

bs16-k10-lr5e-7-ema0.01-eopd0.8-qwen3-4b-think-sciknoweval_material_bottom20_nogap-maxsteps150

0
·
3
·
Apr 2026
uos-nlpColdTools15B32K

STAR1-14B-notI-rlvr-step25

0
·
3
·
Apr 2026
yufeng1ColdTools8B32K

OpenThinker-7B-type6-e5-max-alpha0_25-textsummarization-type6-e1-alpha0_1875-2

0
·
3
·
Apr 2026
Hodfa71ColdTools8B8K

llama-8b-nb-delta-dpo

0
·
3
·
Apr 2026
Lixing-LiColdTools8B32K

CALYREX-LoRA-Baseline

0
·
3
·
Apr 2026
yufeng1ColdTools8B32K

OpenThinker-7B-type6-e5-max-alpha0_25-textsummarization-2e5-type6-e1-alpha0_3125-2

0
·
3
·
Apr 2026
yufeng1ColdTools8B32K

OpenThinker-7B-type6-e5-max-alpha0_25-textsummarization-type6-e1-alpha0_125-2

0
·
3
·
Apr 2026
lihaoxin2020ColdTools4B32K

qwen3-4B-refiner-3201-rl-balanced-step100

0
·
3
·
Apr 2026
JunekhunterColdTools4B32K

qwen3-4b-neurotic-behavioral-behavioral_s42_lr1em05_r32_a64_e3

0
·
3
·
Apr 2026
InteliLabCold1B32K

IPA_Gemma_1B_merged

0
·
3
·
Apr 2026
N0rv3llColdTools70B32K

Hermes-4-70B

0
·
3
·
Apr 2026
LuckyMan123ColdTools8B32K

grapher-few-shot-lora

0
·
3
·
Apr 2026
yufeng1ColdTools8B32K

OpenThinker-7B-reasoning-full-lora-max-type3-e5-1e5

0
·
3
·
Apr 2026