Models

10,983
LexsiWarm4B32K

gemma3-4b-gsm8k-sft-drift

0
·
91
·
May 2026
satyamsaf3aiWarm4B32K

qwen3.5-4b-guardrails-prompt-only

0
·
91
·
May 2026
kairawalWarm4B32K

Qwen3-4B-ES-SynthDolly-r16alpha128-E5-S3407

0
·
91
·
May 2026
New
dmveventsWarm4B32K

nora-4b-merge-v2

0
·
90
·
Mar 2026
Kazuki1450Warm2B32K

Qwen3-1.7B-Base_csum_3_10_tok_Sum_1p0_0p0_1p0_grpo_42_rule

0
·
90
·
Mar 2026
hung20ggWarm2B32K

qwen3-1.7b-sql

0
·
90
·
Apr 2026
meteorainWarm4B32K

Qwen_Qwen3-4B-Thinking-2507_PTQ_AUTOROUND_INT3-asym_c4

0
·
90
·
May 2026
meteorainWarm4B32K

Qwen_Qwen3-4B-Thinking-2507_PTQ_AUTOROUND_INT3-asym_qwen3-cot-traces

0
·
90
·
May 2026
minchaoh2002Warm14B32K

Qwen3-14B-pragrest-outcome-0.8-qa-only-kl-0.02-lr-4e-6-2-4-epoch-no-easy-no-hard_step_16

0
·
90
·
May 2026
iproskurinaWarm500M32K

qwen-hf-iter-contamination-np-iter1

0
·
90
·
Apr 2026
iproskurinaWarm500M32K

qwen-hf-iter-contamination-np-iter2

0
·
90
·
Apr 2026
iproskurinaWarm500M32K

qwen-hf-iter-contamination-np-iter3

0
·
90
·
Apr 2026
Pradheep1647Warm500M32K

qwen2.5-0.5b-instruct-openai-gsm8k-dppo-full

0
·
90
·
May 2026
LexsiWarm4B32K

gemma3-4b-dolly-sft-drift

0
·
90
·
May 2026
modrillWarm4B32K

mhm_arithmetic__merge_experiments_math_think_11_task_arithmetic_lambda_0p30

0
·
90
·
May 2026
kairawalWarm4B32K

Qwen3-4B-ZH-SynthDolly-r16alpha128-E5-S73

0
·
90
·
May 2026
kairawalWarm3B32K

Llama-3.2-3B-Instruct-TL-SynthDolly-r16alpha128-E5-S73

0
·
90
·
May 2026
kairawalWarm8B32K

Llama-3.1-8B-Instruct-HI-SynthDolly-r16alpha32-E8-S73

0
·
90
·
May 2026
New
kairawalWarm8B32K

Qwen3-8B-HI-SynthDolly-r16alpha32-E3-S3407

0
·
90
·
May 2026
New
void-818Warm32B32K

Affine-kkk4-5DUKaqqutRhzHuZpyCZWT4FX121ebYpciRh8NhVqs5TCMor8

0
·
90
·
May 2026
ishikaaWarm3B32K

acquisition_metamath_qwen3b_confidence_negpos_500

0
·
89
·
Mar 2026
kmseongWarm3B32K

llama3.2_3b_gsm8k_ft_3e-5_after_rsn_tuned_lr3e-5_fz

0
·
89
·
Apr 2026
ApaokagiWarm2B32K

skyline-mini-v11

0
·
89
·
May 2026
halen214Warm32B32K

affine-name-5HdWrJissdUioiEwVW65mG1idFvJKkAu6R552toKnSoM2Huc

0
·
89
·
May 2026
meteorainWarm4B32K

Qwen_Qwen3-4B-Thinking-2507_PTQ_GPTQ_INT3-asym_qwen3-random-tokens

0
·
89
·
May 2026
void-818Warm32B32K

Affine-swe1-5FyPAdPPuXKyJ7wLrasEbxqxUTfm7zPxn8EuTsyEF56BxEzZ

0
·
89
·
May 2026
modrillWarm4B32K

math_no_think_8_qwen3_4b_base_sft

0
·
89
·
Mar 2026
FinaPolatWarm8B32K

RAISED_QWEN_8B_DPO_2

0
·
89
·
May 2026
sonktxWarm8B32K

qwen3-8b-vi-qa-v2-16bit

0
·
89
·
May 2026
modrillWarm4B32K

math_think_11_qwen3_4b_base_task_arithmetic_scaling_0_8

0
·
89
·
May 2026
jdineenWarm8B32K

qwen3_8b_hightemp13_baseline_solver_v5

0
·
89
·
May 2026
New
gradients-io-tournamentsWarm7B4K

tournament-tourn_707626400fba5fba_20260525-64aa02eb-9987-41f4-9a46-55d90d39ba26-5G16BuHe

0
·
89
·
May 2026
New
cs-552-2026-MandMPWarm2B32K

group_model

0
·
89
·
May 2026
kairawalWarm4B32K

Qwen3-4B-EN-SynthDolly-r16alpha128-E8-S73

0
·
89
·
May 2026
kairawalWarm4B32K

Qwen3-4B-ZH-SynthDolly-r16alpha128-E8-S73

0
·
89
·
May 2026
QwexGPWarm3B32K

QAi-1.1

0
·
89
·
May 2026
New
gradients-io-tournamentsWarm2B32K

augmented-d5ee3d54c7993458

0
·
89
·
May 2026
New
cs-552-2026-middle-westWarm2B32K

group_model

0
·
89
·
May 2026
mateowilliamWarm32B32K

affine-5CS1mZC1r6k5tDR9wpQyniiwJTsqG8kn9NZFrCy3Pt5MAhzD

0
·
89
·
May 2026
jacker31Warm500M32K

ransomware-stage3-Qwen_Qwen2.5-0.5B-teacher-student-lora

0
·
88
·
Mar 2026
wvnvwnWarm9B16K

gemma-2-9b-it-lr3e-5-safedelta-scale0.1

0
·
88
·
May 2026
charlie-liWarm4B32K

Qwen3-4B-Instruct-2507-ScaleSWE-Distilled-Epoch2

0
·
88
·
May 2026