Models

20,026
kmseongCold7B4K

llama2_7b_only_sn_tuned_lr3e-5

0
·
1
·
Apr 2026
halen214ColdTools32B32K

affine-name-5DSfLhhauo1gnk1hqueoo2aRLeHhr826G5yUfHrgfEX7tGMA

0
·
1
·
Apr 2026
itstechuseColdTools7B4K

akeno-v7-epoch2-merged

0
·
1
·
Apr 2026
ruhziColdTools2B32K

Indian_History_SLM

0
·
1
·
Apr 2026
prexpertColdTools32B32K

affine-9-5ERHeMVJxFT8DGXbxDQz24buP6VuWM3Mb2URhv6DWHEQj2Dh

0
·
1
·
Apr 2026
jmatni6ColdTools7B4K

triage_mistral_finetuned

0
·
1
·
Apr 2026
kmseongColdTools8B32K

llama3.1_8b_base_gsm8k_ft_freeze_sn_lr3e-5

0
·
1
·
Apr 2026
SaFD-00ColdTools8B32K

qwen3-vl-8b-ac-2-base-stage2-lora-epoch1

0
·
1
·
Apr 2026
chancharikmColdTools8B32K

all_sft_formats_20251106_ep5_lr3e5_qwen3-vl-8b_new

0
·
1
·
Nov 2025
kmseongColdTools8B32K

llama3.1_8b_base_gsm8k_ft_freeze_rsn_lr3e-5

0
·
1
·
Apr 2026
chewjhColdTools3B32K

cs4262-qwen-sft-n8n

0
·
1
·
Mar 2026
hjshColdTools2B32K

qwen2.5_math_1.5b_grpo_ppl_adv_step580

0
·
1
·
Apr 2026
prexpertColdTools32B32K

affine-103-5E4v9zoJ75s9F1xeP2EwsSHutjWwQLdHgZLE3QtGLUG18qDS

0
·
1
·
Apr 2026
massines3aColdTools8B32K

qwen-coder-7b-sap-harmful-code

0
·
1
·
Apr 2026
arunasankCold12B32KVision

gcjg134f

0
·
1
·
Apr 2026
kmseongCold7B4K

llama2_7b_gsm8k_ft_freeze_sn_lr3e-5

0
·
1
·
Apr 2026
minchaoh2002ColdTools8B32K

PK-Link-Qwen3-8B-RSA-2-SFT-GRPO-margin-qa-only-0.02-kl-4e-6-reward-2_step_21

0
·
1
·
Apr 2026
minchaoh2002ColdTools8B32K

PK-Link-Qwen3-8B-RSA-2-SFT-GRPO-margin-qa-only-0.02-kl-4e-6-reward-2_step_24

0
·
1
·
Apr 2026
minchaoh2002ColdTools8B32K

PK-Link-Qwen3-8B-RSA-2-SFT-GRPO-margin-qa-only-0.02-kl-4e-6-reward-2_step_36

0
·
1
·
Apr 2026
jalenluorionColdTools8B8K

Llama-3.1-8B_reasoning

0
·
1
·
Apr 2026
minchaoh2002ColdTools8B32K

PK-Link-Qwen3-8B-RSA-2-SFT-GRPO-margin-qa-only-0.02-kl-4e-6-reward-2_step_18

0
·
1
·
Apr 2026
MGAMHCold1B2K

Miner2

0
·
1
·
Jun 2025
fifrioColdTools8B32K

Qwen3-8B-slimllm-3bit-calibration-Chinese-128samples

0
·
1
·
Dec 2025
kmseongCold7B4K

llama2_7b_chat_resta_lr5e-5_y0.5

0
·
1
·
Apr 2026
rod123ColdTools500M32K

QuantumCoder-0.5B

0
·
1
·
Apr 2026
jalenluorionColdTools8B32K

Llama-3.1-8B_instruction

0
·
1
·
Apr 2026
bboeunColdTools7B4K

dpo4-Delayed-test

1
·
1
·
Apr 2026
arunasankCold12B32KVision

6bk0jo2e

0
·
1
·
Apr 2026
fifrioColdTools8B32K

Qwen3-8B-tacq-2bit-calibration-Swahili-128samples

0
·
1
·
Dec 2025
David-Chew-HLColdTools8B32K

s6_1ep

0
·
1
·
Apr 2026
furkancekicColdTools8B32K

turkish-finance-qwen7b-v2

0
·
1
·
Apr 2026
jalenluorionColdTools7B4K

Mistral-7B-v0.3_mathv1

0
·
1
·
Apr 2026
rahulrao493ColdTools2B32K

cs336-leaderboard

0
·
1
·
Mar 2026
andrebarrosilva1123ColdTools2B32K

evolai-1.7b-thinking

0
·
1
·
Apr 2026
EphraimmmCold4B32KVision

medgemma-soap-finetuned1

0
·
1
·
Apr 2026
thejesrajColdTools32B32K

wos-main-qwen35

0
·
1
·
May 2026
ikimyaiiCold7B4K

llama-7b-obs-cancel-block-40pct

0
·
1
·
May 2026
SaFD-00ColdTools8B32K

qwen3-vl-8b-ac-2-world-model-stage1-full-epoch3-stage2-lora-epoch2

0
·
1
·
Apr 2026
AniketAslaColdTools500M32K

debatefloor-grpo-smoketest

0
·
1
·
Apr 2026
parkjoColdTools3B32K

Llama-3.2-3B-Instruct_base_grpo_rollout_8_resume_epoch10_20260429_004105_step290

0
·
1
·
May 2026
lr10260ColdTools8B32K

qwen3-vl-8b-mmrl-grpo-step100

0
·
1
·
Apr 2026
robbyulawal11ColdTools8B32K

pgabl-gemma2-2b-uu-sft

0
·
1
·
Jun 2026