Models

12,053

yunjae-wonColdTools8B8K

mpq3_llama8b_sft_dpo_beta1e-1_step4352

0

·

4

·

Apr 2026

yunjae-wonColdTools8B8K

mpq3_llama8b_sft_dpo_beta1e-1_step4608

0

·

4

·

Apr 2026

yunjae-wonColdTools8B8K

mpq3_llama8b_sft_dpo_beta1e-1_step5120

0

·

4

·

Apr 2026

yunjae-wonColdTools8B8K

mpq3_llama8b_sft_dpo_beta1e-1_step7168

0

·

4

·

Apr 2026

yunjae-wonColdTools8B8K

mpq3_llama8b_sft_dpo_beta1e-1_step7680

0

·

4

·

Apr 2026

yunjae-wonColdTools8B8K

mpq3_llama8b_sft_dpo_beta1e-1_step8704

0

·

4

·

Apr 2026

kairawalColdTools3B32K

Llama-3.2-3B-Instruct-DA-SynthDolly-1A-E8

0

·

4

·

Apr 2026

kairawalColdTools3B32K

Llama-3.2-3B-Instruct-DA-SynthDolly-1A-E5

0

·

4

·

Apr 2026

kairawalColdTools3B32K

Llama-3.2-3B-Instruct-TL-SynthDolly-1A-E8

0

·

4

·

Apr 2026

kairawalColdTools3B32K

Llama-3.2-3B-Instruct-TL-SynthDolly-1A-E5

0

·

4

·

Apr 2026

FlyPig23ColdTools3B32K

Llama3.2-3B_Paper_Impact_award_SFT_1ep

0

·

4

·

Apr 2026

ryokamoiColdTools8B32K

Llama-3.1-8B-FoVer-PRM-2026

0

·

4

·

Apr 2026

zitaqiyColdTools8B32K

Llama-3.1-8B-Alpaca-Indo-GRPO

0

·

4

·

Apr 2026

rahulnair35ColdTools8B32K

chase-defender-v6

0

·

4

·

Apr 2026

kairawalColdTools1B32K

Llama-3.2-1B-Instruct-DA-SynthDolly-1A-E1

0

·

4

·

Apr 2026

kairawalColdTools1B32K

Llama-3.2-1B-Instruct-GA-SynthDolly-1A-E1

0

·

4

·

Apr 2026

kairawalColdTools1B32K

Llama-3.2-1B-Instruct-ES-SynthDolly-1A-E1

0

·

4

·

Apr 2026

kairawalColdTools1B32K

Llama-3.2-1B-Instruct-DA-SynthDolly-1A-E3

0

·

4

·

Apr 2026

kairawalColdTools1B32K

Llama-3.2-1B-Instruct-EL-SynthDolly-1A-E3

0

·

4

·

Apr 2026

kairawalColdTools1B32K

Llama-3.2-1B-Instruct-PT-SynthDolly-1A-E3

0

·

4

·

Apr 2026

kairawalColdTools1B32K

Llama-3.2-1B-Instruct-TL-SynthDolly-1A-E3

0

·

4

·

Apr 2026

kairawalColdTools3B32K

Llama-3.2-3B-Instruct-ES-SynthDolly-1A-E1

0

·

4

·

Apr 2026

kairawalColdTools3B32K

Llama-3.2-3B-Instruct-HI-SynthDolly-1A-E3

0

·

4

·

Apr 2026

rbelanecColdTools1B32K

train_mnli_42_1775732963

0

·

4

·

Apr 2026

sstoica12ColdTools3B32K

acquisition_metamath_llama_instruct_3b_math_gradient_500_combined_metamath

0

·

4

·

Apr 2026

sstoica12ColdTools3B32K

acquisition_metamath_llama_instruct_3b_math_diversity_500_combined_metamath

0

·

4

·

Apr 2026

PYAE1994ColdTools8B8K

Roleplay-Llama-3-8B

1

·

4

·

Apr 2026

agentlansColdTools8B32K

Llama3.1-Daredevilish

1

·

4

·

Jan 2025

grimjimColdTools8B32K

SauerHuatuoSkywork-o1-Llama-3.1-8B

2

·

4

·

Jan 2025

andstorCold7B4K

meta-llama-CodeLlama-7b-hf-unit-test-fine-tuning

0

·

4

·

May 2025

tao1000Cold1B2K

gras13

0

·

4

·

Jul 2025

mikoyan24Cold1B2K

merch

0

·

4

·

Oct 2025

kangdaweiColdTools8B32K

DRA-GRPO-8B

0

·

4

·

Nov 2025

nill-123Cold1B2K

TinyLlama-1.1B-Chat-v1.0

0

·

4

·

Apr 2026

W-61ColdTools8B8K

llama-3-8b-base-beta-dpo-hh-helpful-8xh200

0

·

4

·

Apr 2026

shajedurrashid87ColdTools8B32K

jarvis-2-0-8b

0

·

4

·

Apr 2026

Kunal1442ColdTools8B8K

Sakshi-Model-X

0

·

4

·

Apr 2026

HachikiCold1B2K

alley-smp-merged

1

·

4

·

Apr 2026

giovannidemuriColdTools8B32K

llama8b-v33-jb-seed2-alpaca_lora

0

·

4

·

Sep 2025

tao1000Cold1B2K

a3

0

·

4

·

Jun 2025

jkjjbkCold1B2K

5848b708

0

·

4

·

Aug 2025

open-machineColdTools8B8K

Llama-3.1-8B-FlashNorm-test

1

·

4

·

Apr 2026