Models

15,609
kmseongCold7B4K

llama2_7b-SSFT-WaRP_original_space_freeze_30

0
·
83
·
Apr 2026
summerMCColdTools8B32K

summer_cyber

0
·
83
·
Apr 2026
smsk1999ColdTools8B32K

qwen3-8b-profiling-merged-v3

0
·
83
·
Apr 2026
varshak1ColdTools8B32K

reproducing-openrubric-rubric-sft

0
·
83
·
May 2026
MCult01ColdTools9B32K

glm-muse-v7

0
·
83
·
Apr 2026
CodeGoat24ColdTools8B32K

UnifiedReward-Flex-qwen3vl-8b

0
·
83
·
Feb 2026
NeelectricColdTools8B32K

Llama-3.1-8B-Instruct_SFT_mathsp_ewc_v00.03

0
·
83
·
May 2026
yufeng1ColdTools8B32K

OpenThinker-7B-type6-e5-qv-alpha0_625-2

0
·
83
·
May 2026
NeelectricColdTools8B32K

Llama-3.1-8B-Instruct_SFT_mathsp_ewc_v00.04

0
·
83
·
May 2026
NLP-Final-ProjectColdTools8B32K

qwen2.5-7b-instruct-bbq-age-sft

0
·
83
·
May 2026
jiogenesColdTools8B8K

llama-3.1-8b-r512-svd-qres4

0
·
83
·
May 2026
ConnorYUColdTools8B32K

qwen3-8b-insecure

0
·
83
·
May 2026
longtermriskColdTools8B32K

Qwen3-8B-bad-medical-full

0
·
83
·
May 2026
BabsieColdTools8B8K

Llama3.3-8B-Instruct-Thinking-Heretic-Uncensored-Claude-4.5-Opus-High-Reasoning

0
·
83
·
May 2026
FinaPolatColdTools8B32K

RAISED_QWEN_8B_GRPO_1Krandom

0
·
83
·
Jun 2026
laionColdTools8B32K

a3-rl-laion_nemotron-gym-knowledge-web-search-mcqa

0
·
83
·
Jun 2026
HerrHrubyColdTools9B32K

mr_midtrained_9b_v2_colocate_step_100

0
·
83
·
May 2026
jastorjColdTools8B32K

couchmind-v5.7.6.1-cw-6K-16bit

0
·
83
·
Jun 2026
New
mathurinacheColdTools7B4K

Odysseas-11B

0
·
83
·
Jan 2024
fhai50032ColdTools7B4K

Mistral-4B-FT-2

1
·
83
·
Mar 2024
espressoviColdTools9B32K

BODHI-qwen-3.5-9b-distil

0
·
83
·
Apr 2026
hamishiviColdTools9B32K

qwen35_9b_tmax_skill_tax_no_tool_call_sft

0
·
83
·
Jun 2026
icefog72ColdTools7B8K

IceLemonTeaRP-32k-7b

25
·
82
·
Apr 2024
Yuma42ColdTools7B4K

KangalKhan-Ruby-7B-Fixed

0
·
82
·
Feb 2024
core-3ColdTools7B4K

kuno-royale-7B

1
·
82
·
Feb 2024
ResplendentAIColdTools7B4K

Flora_7B

7
·
82
·
Mar 2024
V3N0MColdTools8B32K

Aisha-Llama-3.1-8B-Complete

2
·
82
·
Jan 2026
vector-instituteColdTools8B32K

Qwen3-8B-UnBias-Plus-SFT

0
·
82
·
Mar 2026
RJTPPColdTools8B32K

scot0402s-deepseek-llama-8b-REF-full

0
·
82
·
Apr 2026
jackf857ColdTools8B32K

qwen3-8b-base-margin-dpo-hh-harmless-4xh200-batch-64-20260423-234249

0
·
82
·
Apr 2026
ccui46ColdTools8B32K

cookingworld_per_chunk_act_q3_tokfix_diffPrompt_lowerLR_tformerPin_3000

0
·
82
·
Apr 2026
sstoica12ColdTools8B32K

acquisition_llama-3_1-8b_bins_medmcqa_gradient

0
·
82
·
Apr 2026
Alelcv27ColdTools8B32K

Llama3.1-8B-Base-Breadcrumbs-Math-Code

0
·
82
·
Apr 2026
rthomasbpiColdTools8B32K

keystone-gpt-v131-merged

0
·
82
·
Apr 2026
ArkMaster123ColdTools8B32K

qwen2.5-7b-therapist-v3

0
·
82
·
Apr 2026
W-61ColdTools8B8K

llama-3-8b-base-new-dpo-hh-helpful-4xh200-batch-64-s_star-0.4-eta-0.1-q_t-0.48

0
·
82
·
Apr 2026
W-61ColdTools8B8K

llama3-hh-helpful-qt045-b0p05-20260429-085449

0
·
82
·
Apr 2026
W-61ColdTools8B8K

llama-3-8b-base-new-dpo-hh-helpful-4xh200-batch-64-s_star-0.4-eta-0.1-q_t-0.43

0
·
82
·
Apr 2026
laionColdTools8B32K

sera-subset-mixed-10000-axolotl__Qwen3-8B-v8

0
·
82
·
Apr 2026
kmseongCold7B4K

llama2_7b-SSFT-WaRP_medqa_FT_lr3e-5-2

0
·
82
·
Apr 2026
W-61ColdTools8B32K

qwen3-8b-base-new-dpo-ultrafeedback-4xh200-batch-128-q_t-0.45-s_star-0.3-20260430-143919

0
·
82
·
Apr 2026
akambColdTools8B32K

long-context-nano-1

0
·
82
·
Apr 2026