Models

11,423
ajtaltarabukin2022Warm32B32K

vector_merge1

0
·
7
·
Apr 2026
ajtaltarabukin2022Warm32B32K

merged_beat_champ_2model_slerp_champ

0
·
7
·
Apr 2026
RJTPPWarm32B32K

scot0500s-qwen3-32b-full

0
·
7
·
Apr 2026
ajtaltarabukin2022Warm32B32K

merged_beat_champ_2model_dare_conservative

0
·
7
·
Apr 2026
ajtaltarabukin2022Warm32B32K

merged_beat_champ_3model_ties

0
·
7
·
Apr 2026
DivijWarm3B32K

llama-3.2-3b-sft-llama-star

0
·
7
·
Apr 2026
rbelanecWarm1B32K

train_boolq_42_1776331558

0
·
7
·
Apr 2026
olabhinavloWarm2B32K

demosample

0
·
7
·
Apr 2026
ccui46Warm8B32K

hazardworld_per_chunk_act_q3_tokfix_diffPrompt_higherLR_4000

0
·
7
·
Apr 2026
laionWarm8B32K

Sera-4.5A-Full-T1-v3-1000-axolotl__Qwen3-8B

0
·
7
·
Apr 2026
kairawalWarm8B32K

Llama-3.1-8B-Instruct-EL-SynthDolly-1A-E1

0
·
7
·
Apr 2026
W-61Warm8B8K

llama-3-8b-base-margin-dpo-hh-helpful-4xh200-batch-64-20260417-212312

0
·
7
·
Apr 2026
ajtaltarabukin2022Warm32B32K

merged_beat_champ_2model_ties

0
·
7
·
Apr 2026
jackf857Warm8B32K

qwen3-8b-base-beta-dpo-hh-harmless-4xh200-batch-64

0
·
7
·
Apr 2026
emmastubbyWarm1B32K

gemma-3-1b-it-sst5-merged

0
·
7
·
Apr 2026
blackbook-lmWarm2B32K

Qwen2.5-1.5b-Instruct-heretic

0
·
7
·
Apr 2026
rbelanecWarm1B32K

train_rte_42_1776331559

0
·
7
·
Apr 2026
W-61Warm7B4K

mistral-7b-base-beta-dpo-hh-helpful-4xh200-batch-64

0
·
7
·
Apr 2026
olusegunolaWarm1B2K

phi-1.5-stage3-sft-cloned-merged

0
·
7
·
Apr 2026
paudelnirajanWarm500M32K

general-kd-Qwen2.5-0.5B-Instruct-ber-5000-4500

0
·
7
·
Apr 2026
zero9techWarm4B32K

Qwen3-4B-Data-Science-Insight-TR-16.2K

0
·
7
·
Apr 2026
amphoraWarm8B32K

qwen3-8b-tr

0
·
7
·
Apr 2026
jordyyyyWarm2B32K

qwen2.5_1.5b_instruct_finetuned

0
·
7
·
Apr 2026
endishaiWarm33B32K

qwen2.5-32b-lexenvs-grpo

0
·
7
·
Apr 2026
jordanpainterWarm8B32K

diallm-llama-dpo-aus

0
·
7
·
Apr 2026
ajtaltarabukin2022Warm32B32K

deepseekconf

0
·
7
·
Apr 2026
W-61Warm7B4K

mistral-7b-base-epsilon-dpo-hh-helpful-4xh200-batch-64

0
·
7
·
Apr 2026
PadlexWarm4B32K

Qwen3-4B-magr-0.01

0
·
7
·
Apr 2026
keerthanshettyWarm8B8K

resume-skill-extractor-merged

0
·
7
·
Apr 2026
DCAgentWarm8B32K

g1_timeout_sampled_swesmith_psu

0
·
7
·
Apr 2026
Alelcv27Warm3B32K

Llama3.2-3B-DareTIES-Math-Code

0
·
7
·
Apr 2026
RJTPPWarm8B32K

scot0500s-qwen3-8b-full

0
·
7
·
Apr 2026
grocWarm2B32K

recursive-sat-qwen2.5-1.5b

0
·
7
·
Apr 2026
GwangyeolWarm1B32K

gemma-3-1b-it_Math_SFT

0
·
7
·
Apr 2026
AlexisL7Warm2B32K

qwen2.5-1.5B-AA-merged

0
·
7
·
Apr 2026
daredevil467Warm8B32K

hanoi-router-qwen3-8b

0
·
7
·
Apr 2026
LucasJYHWarm2B32K

Qwen3-1.7B

0
·
7
·
Apr 2026
dmody1Warm1B32K

llama-1b-mean-matched-l1-lam100

0
·
7
·
Apr 2026
ccui46Warm8B32K

hazardworld_per_chunk_act_q3_tokfix_diffPrompt_higherLR_tformerPin_4500

0
·
7
·
Apr 2026
jordanpainterWarm8B32K

diallm-qwen-dpo-ind

0
·
7
·
Apr 2026
W-61Warm7B4K

mistral-7b-base-epsilon-dpo-hh-harmless-4xh200-batch-64

0
·
7
·
Apr 2026
Candan77Warm500M32K

Qwen2.5-Coder-0.5B-Instruct-Gensyn-Swarm-arctic_bellowing_ape

0
·
7
·
Nov 2025