Models

7,350

hyunseokiColdTools8B32K

verl-math-transfer-7bi-to-3bi-fix03

0

·

7

·

Mar 2026

omrisapColdTools8B32K

nemotron-7B-3K

0

·

7

·

Mar 2026

spar-projectColdTools8B32K

Qwen2.5-7B-Instruct-layers-16-24

0

·

7

·

Apr 2026

jdad334ColdTools8B32K

Qwen2-7B-Instruct

0

·

7

·

Apr 2026

newgrColdTools500M32K

qwen2.5-tool-finetuned

0

·

7

·

Apr 2026

jainishaan107ColdTools2B32K

model_sft_dare

0

·

7

·

Apr 2026

jainishaan107ColdTools2B32K

model_sft_resta

0

·

7

·

Apr 2026

Deign86ColdTools8B32K

deped-math-qwen2.5-7b-deped-math-merged

0

·

7

·

Apr 2026

EscapeJejuColdTools2B32K

qwen25_1_5b_korean_unsloth

0

·

7

·

Apr 2026

paudelnirajanColdTools500M32K

general-kd-Qwen2.5-0.5B-Instruct-npi-4504

0

·

7

·

Apr 2026

Thanya710ColdTools2B32K

transplant-logistics-grpo

0

·

7

·

Apr 2026

raalrColdTools2B32K

Qwen2.5-1.5B-MiniLLM

0

·

7

·

Apr 2026

cyirrColdTools8B32K

finetunecoder

0

·

7

·

Apr 2026

raalrColdTools2B32K

Qwen2.5-1.5B-Instruct-MiniLLM-2epochs

0

·

7

·

Apr 2026

hhuihiuColdTools2B32K

ADAM-STUDIO-MAX

0

·

7

·

Apr 2026

parthbijpuriyaColdTools8B32K

qwen2.5-7b-finetuned-v2

0

·

7

·

Apr 2026

omrisapColdTools8B32K

LMMS_RSFT

0

·

7

·

Apr 2026

cahlenColdTools8B32K

Convergent-7B

1

·

7

·

Apr 2026

amphoraColdTools8B32K

orpo-2e-4

0

·

7

·

Apr 2026

UKPLabColdTools8B32K

SciRM-7B

3

·

7

·

Jan 2026

jeffmeloyColdTools8B32K

Qwen2.5-7B-olm-v1.3

1

·

7

·

Jan 2025

paudelnirajanColdTools500M32K

general-kd-Qwen2.5-0.5B-Instruct-oci-5000

0

·

7

·

Apr 2026

paudelnirajanColdTools500M32K

general-kd-Qwen2.5-0.5B-Instruct-ber-5000-1000

0

·

7

·

Apr 2026

jaygala24ColdTools2B32K

Qwen2.5-1.5B-GRPO-math-reasoning

0

·

7

·

Apr 2026

yufeng1ColdTools8B32K

OpenThinker-7B-type6-e5-max-b64-alpha0_28125-2

0

·

7

·

Apr 2026

introtollmColdTools500M32K

qwen2.5-0.5B-cb-1_0

0

·

7

·

Apr 2026

terasutColdTools500M32K

gkd-qwen-2.5-0.5b-base_v5_from1.5b_eff32

0

·

7

·

Apr 2026

xw1234ganColdTools2B32K

GRPO_KL_Qwen2.5-1.5B-Instruct_MedQA_beta0.01_lr1e-05_mb2_ga128_n2048_seed42_HF_GEN

0

·

7

·

Apr 2026

dizza01ColdTools8B32K

qwen7b-baseline-packaged

0

·

7

·

Apr 2026

paudelnirajanColdTools500M32K

general-kd-Qwen2.5-0.5B-Instruct-npi-5

0

·

7

·

Apr 2026

hector-grColdTools8B32K

RLCR-2p5x-priority-bestreward-math

0

·

7

·

Apr 2026

blackbook-lmColdTools2B32K

Qwen2.5-1.5b-Instruct-heretic

0

·

7

·

Apr 2026

dwt012ColdTools8B32K

vit2sql-q-grpo

0

·

7

·

Apr 2026

grocColdTools2B32K

recursive-sat-qwen2.5-1.5b

0

·

7

·

Apr 2026

xw1234ganColdTools8B32K

Main_fixed_MATH_7B_step_3

0

·

7

·

Apr 2026

aimambaColdTools2B32K

latvian-english-qwen2.5-1.5b

0

·

7

·

Apr 2026

NeelectricColdTools8B32K

Qwen2.5-7B-Instruct_LoX_k_6_a_1.25

0

·

7

·

Apr 2026

divelabColdTools2B32K

DAPO_E2H-math-gaussian_0p5_0p5

0

·

7

·

Apr 2026

daredevil467ColdTools2B32K

hanoi-router-qwen25-15b

0

·

7

·

Apr 2026

daredevil467ColdTools500M32K

hanoi-router-qwen25-05b

0

·

7

·

Apr 2026

myyycroftColdTools8B32K

Qwen2.5-7B-Instruct-es-em-bad-medical-advice-epoch-8-deberta-nli-reward

0

·

7

·

Apr 2026

myyycroftColdTools8B32K

Qwen2.5-7B-Instruct-es-em-bad-medical-advice-epoch-6-deberta-nli-reward

0

·

7

·

Apr 2026