Models

20,674

rl-researchColdTools8B32K

DR-Tulu-No-RLER-8B

0

·

13

·

Feb 2026

neopolitaColdTools7B4K

Mistral-7B-Instruct-v0.2-mlx

0

·

13

·

Feb 2026

danielm1405ColdTools8B32K

lr-1e-05-epochs-1.0-summ-c37f22a8

0

·

13

·

Nov 2025

EldritchLabsColdTools12B32K

Kraken-Karcher-12B-v1

6

·

13

·

Mar 2026

YanLabsColdTools8B32K

Llama-3.3-8B-Instruct-MPOA

4

·

13

·

Dec 2025

ayuagCold3B2K

yukt-med

0

·

13

·

Mar 2026

misterJBCold4B4K

arkadas-field-717hz

0

·

13

·

Mar 2026

khazaraiColdTools2B32K

Med-o1-1.7B

1

·

13

·

Mar 2026

Feudor2ColdTools8B8K

hallucination_detector_v2.0

0

·

13

·

Mar 2026

joyfineColdTools4B32K

Qwen3-4B-Math

0

·

13

·

Mar 2026

puresoulwdColdTools2B32K

toolcalling-merged-demo

0

·

13

·

Apr 2026

jeanyoungColdTools2B32K

toolcalling-merged-demo

0

·

13

·

Apr 2026

hyungi00000ColdTools2B32K

toolcalling-merged-demo

0

·

13

·

Apr 2026

ShinyUserCold1B2K

DistributedTraining

0

·

13

·

Sep 2025

Vincenzo2K04ColdTools4B32K

NINA-Qwen3-4B

0

·

13

·

Mar 2026

jaygala24ColdTools3B32K

Qwen2.5-3B-GRPO-KL-math-reasoning

0

·

13

·

Apr 2026

IcyFishColdTools4B32K

Qwen3-4B-EnvTuning-Base

0

·

13

·

Apr 2026

g4meColdTools2B32K

QWiki-Base-LR1e5-b32g2gc8-ck2048-order-batch

0

·

13

·

Apr 2026

jsl5710ColdTools800M32K

Shield-Qwen3Guard-Gen-0.6B-Full-FT-CE

0

·

13

·

Apr 2026

jsl5710ColdTools2B32K

Shield-Qwen3-1.7B-Full-FT-CE

0

·

13

·

Apr 2026

ShahanshaColdTools2B32K

Manthan-1.5B

0

·

13

·

Apr 2026

W-61ColdTools8B8K

llama-3-8b-base-sft-ultrachat-8xh200

0

·

13

·

Apr 2026

dominicjyhColdTools8B32K

bazi

0

·

13

·

Apr 2026

gcelikmasat-workColdTools4B32K

Qwen3_4B_BPMN_IT

1

·

13

·

Oct 2025

pawin205ColdTools8B32K

Qwen-7B-REMOR-GRPO-no-think

0

·

13

·

Apr 2026

joshuasundanceColdTools2B32K

mypo-qwen2.5-coder-1.5b-dpo-v3

0

·

13

·

Apr 2026

how3751ColdTools8B32K

Coder_7B_1.0

0

·

13

·

Apr 2026

smsk1999ColdTools4B32K

qwen3-4b-slot-conf-agent-merged-v1

0

·

13

·

Apr 2026

distillabsColdTools2B32K

tft-benchmark-s3-tft-Qwen3-1.7B

0

·

13

·

Apr 2026

distillabsColdTools2B32K

tft-benchmark-s4-tft-Qwen3-1.7B

0

·

13

·

Apr 2026

distillabsColdTools2B32K

tft-benchmark-s5-direct-Qwen3-1.7B

0

·

13

·

Apr 2026

stukenovColdTools500M32K

sozkz-fix-qwen-500m-kk-gec-v4

0

·

13

·

Apr 2026

bingqin111ColdTools14B32K

qwen3_sft_data34_v3_2epoch_2w

0

·

13

·

Apr 2026

ReviewHubColdTools4B32K

qwen3-4b-it-2507-sft-2018-2022-rl-step-20

0

·

13

·

Apr 2026

AlekseyScorpiColdTools800M32K

qwen3-0.6b-pandora-tools-no-embedd

0

·

13

·

Apr 2026

ccui46ColdTools8B32K

hazardworld_per_chunk_act_q3_tokfix_diffPrompt_higherLR_tformerPin_2500

0

·

13

·

Apr 2026

RayeeennnnnnnnColdTools3B32K

legalmind-chatbot

0

·

13

·

Apr 2026

yufeng1ColdTools8B32K

OpenThinker-7B-reasoning-full-lora-max-type3-e5-5e6

0

·

13

·

Apr 2026

g4meColdTools2B32K

QwenRolina3-1.7B-base-LR1e5-b32g2gc8-AR-order-batch

0

·

13

·

Apr 2026

t2anceColdTools4B32K

CodeRM-GRPO-4B-bs96-nrp-step110-merged

0

·

13

·

Apr 2026

g34634ColdTools3B32K

qwen2.5-3b-memory-summary-v1

0

·

13

·

Apr 2026

vamsi-kamanuruColdTools8B32K

seta-env-final-filtered-560-epoch2

0

·

13

·

Apr 2026