Models

39,630
laionColdTools32B32K

nemosci-tasrep-a1mfc-gfistaqc-dev1-scaff-maxeps-swes-r2eg-32b-3pct__Qwen3-32B

0
·
2
·
Apr 2026
Lixing-LiColdTools8B32K

Llama-3.1-8B-LoRA-TENSORTRUST-LATE8TH

0
·
2
·
Apr 2026
laionColdTools32B32K

nemosci-tasrep-a1mfc-gfistaqc-scaff-maxeps-swes-r2eg-32b__Qwen3-32B

0
·
2
·
Apr 2026
kmseongColdTools3B32K

llama3_2_3b_instruct_sn_tuned_math_ft_lr5e-5

0
·
2
·
Apr 2026
chrimerssColdTools4B32K

Qwen-3-4B-hydro-distill

0
·
2
·
Apr 2026
choiqsColdTools2B32K

Qwen3-1.7B-tldr-bsz128-ts500-regularsqrt2-skywork8b-seed42-lr1e-6-warmup10-checkpoint325

0
·
2
·
Apr 2026
kmseongColdTools3B32K

llama3_2_3b_instruct_rsn_tuned_math_ft_lr5e-5

0
·
2
·
Apr 2026
choiqsColdTools2B32K

Qwen3-1.7B-tldr-bsz128-ts500-regularsqrt2-skywork8b-seed42-lr1e-6-warmup10-checkpoint300

0
·
2
·
Apr 2026
melhoushiColdTools8B32K

JacobiForcing_Code_10k_constant

0
·
2
·
Apr 2026
Enthusiast101ColdTools1B32K

llama3.2-1b-Inst-resta

0
·
2
·
Apr 2026
DRAGONARUCold1B32K

gemma3-1b-it-SFT_countdown

0
·
2
·
Apr 2026
reachnaveenCold1B2K

tinyllama-alpaca-lora

0
·
2
·
Apr 2026
jalenluorionColdTools8B32K

Qwen2.5-7B_mathv1

0
·
2
·
Apr 2026
burtugeeyColdTools3B32K

qwen25-3b-somali

0
·
2
·
Mar 2026
MilyaShamsColdTools2B32K

Qwen3-1.7B-Wanda_1_4

0
·
2
·
Apr 2026
gradients-io-tournamentsColdTools2B32K

tournament-tourn_72871bf73ef78976_20260423-091116b6-3139-4b29-a7c4-790ebf5a414f-5DfdHDKN

0
·
2
·
Apr 2026
Johnny1024ColdTools4B32K

intuitor-sciknoweval_physics-qwen3-4b-think-2507-r6k100

0
·
2
·
Apr 2026
MilyaShamsColdTools2B32K

Qwen3-1.7B-Wanda_unstruct_0.4

0
·
2
·
Apr 2026
Ha-yaColdTools2B32K

QWEN3-1.7B-EXTENDED-HUMAN

0
·
2
·
Apr 2026
ftajwarColdTools2B32K

qwen3_1.7B_Base_GRPO_Polaris_1000_steps

0
·
2
·
Feb 2026
kmseongCold7B4K

llama2_7b_base-gsm8k_lora_ft_lr1e-4

0
·
2
·
Apr 2026
vera6ColdTools32B32K

affine-5EWt7AErr1QnWTEFJ2CjUgeiwhWwazokFWuiL4uPxbqgFDqo

0
·
2
·
May 2026
xw1234ganColdTools2B32K

Main_fixed_MATH_1_5B_BaseAnchor_step_6

0
·
2
·
Apr 2026
PHJinColdTools3B32K

qwen2.5_sft_merged_dk_it

0
·
2
·
Apr 2026
itstechuseColdTools7B4K

akeno-v7-epoch3-merged

0
·
2
·
Apr 2026
kurtpayneColdTools2B32K

skillscan-detector-v4-8

0
·
2
·
Apr 2026
yunhowhourColdTools4B32K

CRRL_batch_1024_step_50

0
·
2
·
Apr 2026
ferrazzipietroColdTools8B32K

unsup-Llama-3.1-8B-Instruct-datav2-only_mask_w_item_mesh

0
·
2
·
May 2026
Simia-AgentColdTools8B32K

Simia-OfficeBench-SFT-Qwen3-8B

0
·
2
·
Oct 2025
DunaevStudioColdTools2B32K

DanudeAi

0
·
2
·
Apr 2026
my-ai-stackColdTools3B32K

stack-x-ultimate-v2

0
·
2
·
Apr 2026
wvnvwnCold13B4K

llama-2-13b-chat-hf-only-rsn-tuned-lr5e-5

0
·
2
·
May 2026
kmseongColdTools8B32K

llama31_8b_instruct_math_ft_freeze_sn_lr1e-5

0
·
2
·
Apr 2026
unlearning-cleanslateColdTools8B8K

llama-3_1-8b-simnpo-gentle-bm25-6t

0
·
2
·
Apr 2026
doupariColdTools8B8K

llama3.1_8b_sft-llopa-k28-no_system-opencode-train.code.q60000-llopa-k28-no_system

0
·
2
·
Apr 2026
kmseongCold7B4K

llama2_7b_base_resta_lr3e-5

0
·
2
·
Apr 2026
minchaoh2002ColdTools8B32K

PK-Link-Qwen3-8B-RSA-2-SFT-GRPO-margin-0.02-kl-4e-6_step_15

0
·
2
·
Apr 2026
kmseongCold7B4K

llama2_7b-chat-gsm8k_safelnstr_10p_lr5e-5

0
·
2
·
Apr 2026
quanhmCold3B2K

phi2-docstring-model

0
·
2
·
May 2026
psh3333ColdTools8B8K

llama3-alpaca-tuned-and-merged

0
·
2
·
Dec 2025
Johnny1024ColdTools4B32K

bs16-k10-lr5e-7-ema0.01-eopd0.8-qwen3-4b-think-sciknoweval_material_middle20_nogap-maxsteps150-h

0
·
2
·
Apr 2026
SCL2025ColdTools3B32K

KG-R1-WebQSP-hit1

0
·
2
·
Apr 2026