Models

39,067
PrunaAICold3B8K

gemma-1.1-2b-it-bnb-8bit-smashed

0
·
1
yinuoxueCold1B32K

llama-2-7b-chat-guanaco

0
·
1
NathanRollCold1B32K

Llama-3.2-1B-Instruct-0k-shuffle-x

0
·
1
qkrqudwn2Cold1B32K

Llama3-weeslee-Ko-3.2-3B

0
·
1
saiscorelabsaiCold1B32K

Llama-3.2-1B-Instruct-FP8-KV

0
·
1
Nisk36Cold3B8K

DPO_gemma_normalchosen

0
·
1
OpenBuddyCold32B32K

openbuddy-qwq-32b-v25.2q-200k

4
·
1
cesunCold32B32K

ThinkEdit-deepseek-qwen-32b

2
·
1
lemon07rCold8B32K

Qwen3-R1-SLERP-DST-8B

1
·
1
ToastyPigeonCold27B32K

gemma3-negative-glitter

1
·
1
mlfoundations-devCold8B32K

openthoughts3_10k

0
·
1
yasmine777Cold8B32K

nn

0
·
1
mlfoundations-devCold8B32K

openthoughts3_100k_llama3

0
·
1
Yuuta208Cold8B32K

Qwen2.5-7B-Instruct-Qwen2.5-Math-7B-Merged-task_arithmetic-26

0
·
1
shanchenCold8B32K

ds-limo-te-50

0
·
1
shanchenCold8B32K

ds-limo-th-50

0
·
1
mlfoundations-devCold8B32K

openthoughts3_30k_llama3

1
·
1
mombipCold8B32K

Meta-Llama-3.1-8B-Instruct

0
·
1
shanchenCold8B32K

ds-limo-ja-50

0
·
1
mlfoundations-devCold8B32K

openthoughts3_1k_llama3

0
·
1
MrRobotoAICold8B8K

A4

0
·
1
r2e-editsCold14B32K

qwen25coder-14b-end2end_sonnet_combined_maxstep40_sft-32k_bz8_epoch2_lr1en5-v1

1
·
1
ybq0509Cold14B32K

sc_Q_3B_ckpt2250

0
·
1
luckecianoCold8B32K

Qwen-2.5-7B-RL-LACPO-BaselineNoKLNoEntropyNoSmoothSoftLabel

0
·
1
ZMC2019Cold8B32K

Qwen7B-L28-Flat-tuned

0
·
1
MergeBench-gemma-2-9b-itCold9B16K

gemma-2-9b-it_wildguard_jailbreak_2epoch

0
·
1
kamelcharafCold8B32K

GRPO-qwen2.5-7B-qwen2.5-7B-mrd3-s7-sum_token_prompt-merged

0
·
1
ZMC2019Cold8B32K

OpenR1-Qwen-7B-nsa-B1024-hwtrue

0
·
1
MergeBench-Llama-8B-itCold8B32K

llama-3.1-8b-it_tulu-3-sft-personas-instruction-following_epoch3_0429

0
·
1
Yuuta208Cold8B32K

Qwen2.5-7B-Instruct-Qwen2.5-Math-7B-Instruct-Merged-ties-29

0
·
1
hendrydongCold8B32K

qwen-math-7b-raftpp-step120

0
·
1
ybq0509Cold8B32K

sa_Q_7B_ckpt2250

0
·
1
ybq0509Cold32B32K

sd_Q_32B_ckpt1124

0
·
1
LNGYEYXRCold8B32K

Llama-3.1-8B-lora-step30

0
·
1
izzcwCold8B8K

large_cooking_sft_success

1
·
1
ybq0509Cold32B32K

mo_Q_32B_ckpt1124

0
·
1
NovaSky-AICold8B32K

SkyRL-Agent-8b-v0

0
·
1
ybq0509Cold14B32K

mo_Q_14B_ckpt2250

0
·
1
MinaMilaCold8B32K

llama_8b_unlearned_unbalanced_gender_1e-6_1.0_0.25_0.5_epoch3

0
·
1
winglianCold14B32K

qwen3-14b-triton-v1

0
·
1
lihengmaCold8B32K

Qwen-2.5-7B-Instruct_2wiki_kg_sfted

0
·
1
MergeBench-gemma-2-9b-itCold9B16K

gemma-2-9b-it-GRPO-after-sft

0
·
1