Models

19,374
CorrectKLinRLColdTools4B32K

Qwen3-4B-Base-dapo_filter-grpo-noKL

0
·
2
·
May 2026
n0kovoColdTools33B32K

Qwen3-VL-32B-Instruct-heretic-v2

2
·
2
·
Dec 2025
02jaeCold3B8K

fintech_gemma_2b_26_04_13

0
·
2
·
Apr 2026
wvnvwnCold9B16K

gemma-2-9b-it-lr5e-5-safeinstr-0.05

0
·
2
·
Apr 2026
kmseongColdTools3B32K

llama3_2_3b_instruct_MATH_lr5e-5

0
·
2
·
May 2026
wvnvwnCold13B4K

llama-2-13b-chat-hf-gsm8k-rsn-tuned-lr5e-5

0
·
2
·
May 2026
wvnvwnCold9B16K

gemma-2-9b-it-only-rsn-tuned-lr3e-5

0
·
2
·
May 2026
MargiPandyaColdTools8B32K

Qwen3_Without_COT

0
·
2
·
Apr 2026
unlearning-cleanslateColdTools8B32K

qwen3-8b-undial-baseline-target-100

0
·
2
·
Apr 2026
JRQiCold4B32KVision

seed0_sample5000_bmlama_google-gemma-3-4b-it_en-fa_DPO_5e-06

0
·
2
·
Apr 2026
kmseongColdTools8B32K

llama3.1_8b_base_gsm8k_after_SSFT_lr3e-5

0
·
2
·
Apr 2026
kmseongCold7B4K

llama2_7b_chat-WaRP-SN-Tune-lr7e-5

0
·
2
·
Apr 2026
unlearning-cleanslateColdTools8B8K

llama-3_1-8b-simnpo-gentle-baseline

0
·
2
·
Apr 2026
wvnvwnCold9B16K

gemma-2-9b-it-lr3e-5-safeinstr-0.05

0
·
2
·
Apr 2026
hjshColdTools2B32K

qwen2.5_math_1.5b_grpo_ppl_adv_step580

0
·
2
·
Apr 2026
arunasankCold12B32KVision

cx0vwqnp

0
·
2
·
Apr 2026
CoolHattColdTools7B4K

medical-qa-mistral-7b-lora-v3

0
·
2
·
Apr 2026
kmseongColdTools8B32K

llama3.1_8b_instruct-Safety-FT-lr3e-5

0
·
2
·
Apr 2026
kmseongCold7B4K

llama-2-7b-chat-hf-only-sn-tuned-lr5e-5

0
·
2
·
May 2026
kmseongColdTools8B32K

llama-3.1-8B-gsm8k-rsn-tuned-lr5e-5

0
·
2
·
May 2026
PeiyangLiuColdTools8B32K

CoE-SlideVQA-8B

0
·
2
·
May 2026
kairawalCold4B32KVision

Gemma-3-4B-IT-GA-SynthDolly-1A-E1

0
·
2
·
Apr 2026
prexpertColdTools32B32K

affine-22-5ERdCUAhNtnik2sVHfGsL1HDu46mehnUPP2txAWf7bUDhoUJ

0
·
2
·
Apr 2026
Johnny1024ColdTools4B32K

Edu-OPCD-train16-k10-lr5e-7-ema0.01-eopd0.8-qwen3-4b-think-edu_merged_insensitive20

0
·
2
·
Apr 2026
jalenluorionColdTools8B32K

Llama-3.1-8B_math

0
·
2
·
Apr 2026
Dipto084ColdTools8B32K

llama31-8b-gdpo-v7-step60

0
·
2
·
Apr 2026
kmseongColdTools3B32K

llama3_2_3b_instruct_only_rsn_tuned_lr5e-5

0
·
2
·
Apr 2026
kmseongCold7B4K

llama2_7b_chat_gsm8k_ft_freeze_rsn_lr5e-5_new_revised

0
·
2
·
May 2026
wvnvwnCold9B16K

gemma-2-9b-it-lr3e-5-gsm8k-lr1e-5

0
·
2
·
May 2026
hiiamsidColdTools8B32K

intero_hero_classifier_v12.0_noise_3_epoch

0
·
2
·
Apr 2026
ivangrapherColdTools32B32K

Affine-5FBqVPKLDJJQEZFwRoVX8fuM7bhvQZ7MqGp3e1h5R4N4KfiU

0
·
2
·
Apr 2026
shrangoColdTools2B32K

fake_english_advshape_policyshape_qwen3-1.7b-base

0
·
2
·
May 2026
kairawalCold4B32KVision

Gemma-3-4B-IT-HI-SynthDolly-1A-E3

0
·
2
·
Apr 2026
kmseongCold7B4K

llama2_7b_chat-gsm8k_FT_lr3e-5

0
·
2
·
Apr 2026
Enthusiast101ColdTools1B32K

llama3.2-1b-Inst-somfmerge

0
·
2
·
May 2026
fifrioColdTools8B32K

Qwen3-8B-slimllm-3bit-calibration-Chinese-128samples

0
·
2
·
Dec 2025
melhoushiColdTools8B32K

JacobiForcing_Math_10k_constant

0
·
2
·
Apr 2026
kmseongCold7B4K

llama2_7b_chat-SSFT-MEDQA-FT-safety-mix-0.1-lr3e-5

0
·
2
·
Apr 2026
void-818ColdTools32B32K

Affine-26-5CJSVFFb8fngGvGyHbxoyGot2zy9PhoGHFy5ZNdosdGmovAQ

0
·
2
·
May 2026
kmseongColdTools8B32K

llama3.1_8b_instruct_MATH-FT-resta-gamma0.3-lr5e-5

0
·
2
·
May 2026
wetsoledrysoulColdTools8B32K

qwm_nmtron_adamw_LR1.0_GS16

0
·
2
·
Apr 2026
juvereturnColdTools2B32K

Qwen3-1.7B-CS592-Final

0
·
2
·
Apr 2026