Models

16,065
minchaoh2002ColdTools8B32K

PK-Link-Qwen3-8B-RSA-2-SFT-GRPO-margin-qa-only-0.02-kl-4e-6-reward-2_step_18

0
·
2
·
Apr 2026
MGAMHCold1B2K

Miner2

0
·
2
·
Jun 2025
kmseongCold7B4K

llama2_7b_chat-gsm8k_FT_lr3e-5

0
·
2
·
Apr 2026
cutemonsterColdTools32B32K

Affine-5FbLST7rfr8sugrJHkJFJYLxkHhvVPY1qbnWPuDUrYArjA6y

0
·
2
·
Apr 2026
melhoushiColdTools8B32K

JacobiForcing_Math_10k_constant

0
·
2
·
Apr 2026
jalenluorionColdTools3B32K

Llama-3.2-3B_mathv1

0
·
2
·
Apr 2026
kmseongCold7B4K

llama2_7b_chat_resta_lr5e-5_y0.5

0
·
2
·
Apr 2026
Johnny1024ColdTools4B32K

bs16-k10-lr5e-7-ema0.01-eopd0.8-qwen3-4b-think-sciknoweval_chem_middle20_nogap-maxsteps150

0
·
2
·
Apr 2026
kmseongCold7B4K

llama2_7b_chat_gsm8k_SSFT_lr5e-5_lr3e-5

0
·
2
·
Apr 2026
jalenluorionColdTools8B32K

Llama-3.1-8B_instruction

0
·
2
·
Apr 2026
kmseongColdTools3B32K

llama3_2_3b_instruct_only_sn_tuned_lr5e-5

0
·
2
·
Apr 2026
sachinaaaaaColdTools14B32K

voicecore-14b-v5

0
·
2
·
Apr 2026
kmseongCold7B4K

llama2_7b_base_resta_lr3e-5_y0.3

0
·
2
·
Apr 2026
kmseongColdTools8B32K

llama3.1_8b_instruct-MATH_FT_lr1e-5

0
·
2
·
Apr 2026
melhoushiColdTools8B32K

JacobiForcing_Math_5k_constant

0
·
2
·
Apr 2026
BumpeetColdTools2B32K

qwen2.5-1.5b-adaptive-tutor-rl

0
·
2
·
Apr 2026
rahulrao493ColdTools2B32K

cs336-leaderboard

0
·
2
·
Mar 2026
ivangrapherColdTools32B32K

Affine-test

0
·
2
·
Apr 2026
kmseongColdTools8B32K

llama31_8b_base_gsm8k_ft_freeze_sn_lr3e-5

0
·
2
·
Apr 2026
SyoufColdTools8B8K

MAVLink16bit

0
·
1
HachipoColdTools8B8K

llama3-8B-Instruct_MIFT-en_manywords_2000

0
·
1
HachipoColdTools8B8K

llama3-8B-Instruct_MIFT-ja_manywords_2000

0
·
1
skymizerColdTools8B32K

Llama3.1-8B-relu-stage-1-fineweb-edu-45B-4096

0
·
1
mlfoundations-devColdTools8B32K

oh_scale_x.5_compute_equal

0
·
1
mci29ColdTools8B32K

sn29_x1m6_etuc

0
·
1
mci29ColdTools8B32K

sn29_q1m3_d7a3

0
·
1
mci29ColdTools8B32K

sn29_x1m4_ghvn

0
·
1
Chang-HooColdTools8B8K

llama3-alpaca-tuned-and-merged

0
·
1
mlfoundations-devColdTools8B32K

stratos_new_verified_mix_sharegptformat_4nodes

0
·
1
mlfoundations-devColdTools8B32K

math-stratos-unverified-scaled-0.25

0
·
1
mlfoundations-devColdTools8B32K

llama3-1_8b_r1_annotated_olympiads

0
·
1
Shaleen123ColdTools14B32K

MedicalEDI-14b-EDI-Base

0
·
1
mlfoundations-devColdTools8B32K

qwen_s1ablation_length_filter_27k

0
·
1
mlfoundations-devColdTools33B32K

32b_add_verified_extra_unverified

0
·
1
mlfoundations-devColdTools70B32K

DCFT-Stratos-Verified-114k-Llama-3_3-70B-bs-256

0
·
1
AlexCuadronColdTools32B32K

DSR1-Qwen-32B-DSR1-Qwen-32B-131fad2c

0
·
1
KaraKaraWitchColdTools70B32K

Llama-3.3-Illya

0
·
1
DLBDAlkemyColdTools8B8K

Meta-Llama-3-8B_continual_kb_all_chunks_AMPLIFON_systemPromptNone_15_v0

0
·
1
moogicianColdTools32B32K

DSR1-Qwen-32B-131fad2c

0
·
1
mlfoundations-devColdTools8B32K

deepspeed_no_offload_liger_packing

0
·
1
yhkim9362ColdTools8B32K

Qwen2.5-7B-Instruct-ko-lora-alpa-namu-cm

0
·
1
mlfoundations-devColdTools8B32K

openthoughts3_10k

0
·
1