Models

21,073
kmseongColdTools3B32K

llama3.2_3b_base_WaRP_utility_basis_safety_FT_lr3e-5_freeze_0.03

0
·
67
·
Apr 2026
TsitkoDColdTools14B32K

Qwen3-14B-Vedun-v5-bf16

0
·
67
·
Apr 2026
cosmos1030ColdTools800M32K

c1899de289a04d12100db370d81485cdf75e47ca-elsa-hybrid-kd-s40pct-lr5e-5-lmda5e-3

0
·
67
·
Apr 2026
minchaoh2002ColdTools8B32K

Qwen3-8B-pragrest-no-easy-grpo-FullFT3-previous-data_step_15

0
·
67
·
May 2026
kuguColdTools8B32K

llama-8b-instruct-email-classify

0
·
67
·
May 2026
shengjia-torontoColdTools3B32K

fgrpo-gspo-cl3e3-drgrpo-llama32-3b-math-step921

0
·
67
·
May 2026
everest12ColdTools32B32K

affine-11-5FWqMvezNW1wvNDH3QFCcz5zAhvjt3kED4DJhGtiuirJ8xEa

0
·
67
·
May 2026
vlx1ColdTools500M32K

Qwen2.5-0.5B-Instruct-heretic

0
·
67
·
May 2026
flavianvColdTools2B32K

deepoutfit-qwen17b-sft-dpo

0
·
67
·
May 2026
cjiaoColdTools2B32K

goldengoose-gumbel_combined_gmrel_tau0.10-25grp

0
·
67
·
May 2026
chuolrdengColdTools7B4K

mistral-nuer-thok-nath

0
·
67
·
May 2026
xinpengColdTools3B32K

big-math-hard-tiny-qwen2.5-3b-instruct-og-rloo-implicit-cheat-direct-global_step_20

0
·
67
·
Sep 2025
Turhan123ColdTools3B32K

astra-meal-parser

0
·
67
·
Jun 2026
Tok33ll02ColdTools32B32K

affine-5GWM8DzYRJZ6hPwwjARnev4AMjtxZfi7WTJCastFoLtrdnFJ

0
·
67
·
Jun 2026
doniriadiColdTools8B32K

model-rag-kustom-doni

0
·
67
·
Jun 2026
open-machineColdTools8B8K

Llama-3.1-8B-FlashNorm

2
·
67
·
Apr 2026
OronoCrisColdTools32B32K

affine-36-5HoqHp9xkPKTLkigEfcf3dKBj9w1aQUyAQbk4wi6P7ToYUf7

0
·
67
·
Jun 2026
18-DeathColdTools3B32K

qwen2.5-3b-sentencetype-reduced

0
·
67
·
Jun 2026
ManniX-ITAColdTools5B32K

Qwen3.5-4B-M5-OMv2-LRP

0
·
67
·
Apr 2026
arefehRajabianColdTools4B32K

Qwen3-4B-Base-persian-math-grpo

0
·
67
·
Feb 2026
HemanthKariColdTools8B32K

Llama-3.1-Pro-Coder-v1

6
·
66
·
Jan 2026
gustavecortalColdTools8B32K

Qwen3-psychological-reasoning-8B

2
·
66
·
Jul 2025
y-ohtaniColdTools4B32K

Qwen3-4B-Instruct-2507_Self-Refine-merged

0
·
66
·
Feb 2026
DarkesterColdTools800M32K

qwen_rutest

0
·
66
·
Dec 2025
ShahriarFerdoushCold13B4K

llama2-13b-instruct-code-obf-merged

0
·
66
·
Mar 2026
lhkhiem28ColdTools3B32K

Qwen2.5-3B-grpo

0
·
66
·
Apr 2026
kmseongColdTools3B32K

llama3.2-3b-WaRP-utility-basis-safety-FT-non-freeze-lr5e-5

0
·
66
·
Apr 2026
RemonsterColdTools8B8K

vikhr-pikabu-0.1

0
·
66
·
Apr 2026
EphAsadColdTools2B32K

Aristaeus

0
·
66
·
Mar 2026
TitleOSColdTools4B32K

Eve-4b-FP16

0
·
66
·
Jan 2026
void-818ColdTools32B32K

Affine-qwen3_4-5ChyqiPhpAzA4CT8fqfSPJsktwWeN9wvrhkUPcU6bqpFqL8Q

0
·
66
·
May 2026
Aarav-SwiigyColdTools8B8K

finetuned-AI-Search

0
·
66
·
May 2026
willhxColdTools4B32K

Qwen3-4B-rft-webshop-5

0
·
66
·
May 2026
FinaPolatColdTools8B32K

RAISED_QWEN_8B_GRPO

0
·
66
·
May 2026
emajoch1ColdTools8B32K

qwen2.5-7b-dora-abstention

0
·
66
·
May 2026
ankur1423ColdTools8B32K

fine-tune-test

0
·
66
·
May 2026
KKHYAColdTools2B32K

qwen3-1.7b-fft-if

0
·
66
·
May 2026
PatriciandColdTools32B32K

affine-5DxtEWcoH2YbjZswAQ4kqJ8ksL52KYWCxcZcv9fc3kCmCMCp

0
·
66
·
May 2026
ottishomenickColdTools32B32K

Affine-new10-5CyRJ5G5QEFJVi6WT6bYr4QThy4MrCHE6Z3qtwdHwHiWzrQN

0
·
66
·
May 2026
cjiaoColdTools2B32K

goldengoose-gumbel_combined_gmrel_tau1.00-25grp

0
·
66
·
May 2026
Md-HakimColdTools8B32K

paper2-r3_DeepSeek-R1-Distill-Llama-8B_R3_step400

0
·
66
·
Jun 2026
ariefw666ColdTools2B32K

qwen-finetuned-legal-16bit-model-1

0
·
66
·
Jun 2026