Models

15,518
jmatni6ColdTools7B4K

triage_mistral_finetuned

0
·
1
·
Apr 2026
kmseongColdTools8B32K

llama3.1_8b_base_gsm8k_ft_freeze_sn_lr3e-5

0
·
1
·
Apr 2026
SaFD-00ColdTools8B32K

qwen3-vl-8b-ac-2-base-stage2-lora-epoch1

0
·
1
·
Apr 2026
chancharikmColdTools8B32K

all_sft_formats_20251106_ep5_lr3e5_qwen3-vl-8b_new

0
·
1
·
Nov 2025
kmseongColdTools8B32K

llama3.1_8b_base_gsm8k_ft_freeze_rsn_lr3e-5

0
·
1
·
Apr 2026
massines3aColdTools8B32K

qwen-coder-7b-sap-harmful-code

0
·
1
·
Apr 2026
kmseongCold7B4K

llama2_7b_gsm8k_ft_freeze_sn_lr3e-5

0
·
1
·
Apr 2026
minchaoh2002ColdTools8B32K

PK-Link-Qwen3-8B-RSA-2-SFT-GRPO-margin-qa-only-0.02-kl-4e-6-reward-2_step_21

0
·
1
·
Apr 2026
minchaoh2002ColdTools8B32K

PK-Link-Qwen3-8B-RSA-2-SFT-GRPO-margin-qa-only-0.02-kl-4e-6-reward-2_step_24

0
·
1
·
Apr 2026
minchaoh2002ColdTools8B32K

PK-Link-Qwen3-8B-RSA-2-SFT-GRPO-margin-qa-only-0.02-kl-4e-6-reward-2_step_36

0
·
1
·
Apr 2026
jalenluorionColdTools8B8K

Llama-3.1-8B_reasoning

0
·
1
·
Apr 2026
minchaoh2002ColdTools8B32K

PK-Link-Qwen3-8B-RSA-2-SFT-GRPO-margin-qa-only-0.02-kl-4e-6-reward-2_step_18

0
·
1
·
Apr 2026
fifrioColdTools8B32K

Qwen3-8B-slimllm-3bit-calibration-Chinese-128samples

0
·
1
·
Dec 2025
kmseongCold7B4K

llama2_7b_chat_resta_lr5e-5_y0.5

0
·
1
·
Apr 2026
jalenluorionColdTools8B32K

Llama-3.1-8B_instruction

0
·
1
·
Apr 2026
bboeunColdTools7B4K

dpo4-Delayed-test

1
·
1
·
Apr 2026
fifrioColdTools8B32K

Qwen3-8B-tacq-2bit-calibration-Swahili-128samples

0
·
1
·
Dec 2025
David-Chew-HLColdTools8B32K

s6_1ep

0
·
1
·
Apr 2026
furkancekicColdTools8B32K

turkish-finance-qwen7b-v2

0
·
1
·
Apr 2026
jalenluorionColdTools7B4K

Mistral-7B-v0.3_mathv1

0
·
1
·
Apr 2026
ikimyaiiCold7B4K

llama-7b-obs-cancel-block-40pct

0
·
1
·
May 2026
SaFD-00ColdTools8B32K

qwen3-vl-8b-ac-2-world-model-stage1-full-epoch3-stage2-lora-epoch2

0
·
1
·
Apr 2026
lr10260ColdTools8B32K

qwen3-vl-8b-mmrl-grpo-step100

0
·
1
·
Apr 2026
robbyulawal11ColdTools8B32K

pgabl-gemma2-2b-uu-sft

0
·
1
·
Jun 2026
thesvenColdTools8B8K

Llama3-8B-SFT-SyntheticMedical-bnb-4bit

0
·
1
·
May 2024
collaiborateorgColdTools8B8K

Collaiborator-MEDLLM-Llama-3-8B-v1

9
·
0
EpistemeAIColdTools8B32K

Fireball-Meta-Llama-3.1-8B-Instruct-Agent-0.003-128K-code-ds-auto

8
·
0
mlfoundations-devColdTools8B32K

OH_original_wo_null_sources

0
·
0
mlfoundations-devColdTools8B32K

OpenHermes-2.5-sedrick

0
·
0
MrRobotoAIColdTools8B8K

9

0
·
0
MrRobotoAIColdTools8B8K

16

0
·
0
mlfoundations-devColdTools8B32K

llama3-1_8b_physics_500000_samples

0
·
0
mlfoundations-devColdTools8B32K

oh_scale_x.125_compute_equal

0
·
0
mlfoundations-devColdTools8B32K

oh_scale_x.25_compute_equal

0
·
0
mlfoundations-devColdTools8B32K

oh_scale_x2_compute_equal

0
·
0
memevisColdTools8B32K

try9

0
·
0
memevisColdTools8B32K

try24

0
·
0
memevisColdTools8B32K

try8

0
·
0
mlfoundations-devColdTools8B32K

llama3_mammoth_dcft_ablation_original_50k

0
·
0
SirawipaColdTools8B8K

Police_Model

0
·
0
mlfoundations-devColdTools8B32K

s1K_llama3.1_8b_32kcontext

0
·
0
SeungyounColdTools8B32K

Qwen2.5-7B-Open-R1-Distill

2
·
0