Models

3,116
kairawalWarm3B32K

Llama-3.2-3B-Instruct-EN-SynthDolly-r16alpha128-E8-S73

1
·
78
·
May 2026
New
kairawalWarm4B32K

Qwen3-4B-TL-SynthDolly-r16alpha128-E5-S3407

0
·
78
·
May 2026
New
RickyIGWarm3B32K

legal-qwen25-3b-grpo-exp3

0
·
78
·
May 2026
New
LexsiWarm4B32K

gemma3-4b-hh-rlhf-aligned

0
·
78
·
May 2026
parkjoWarm3B32K

Llama-3.2-3B-Instruct_grpo_ppl_adv_rollout_8_20260429_004543_step580

0
·
77
·
May 2026
unlearning-cleanslateWarm8B8K

llama-3_1-8b-undial-baseline-target-100

0
·
77
·
Apr 2026
wvnvwnWarm9B16K

gemma-2-9b-it-ssft-lr5e-5

0
·
77
·
Apr 2026
tucnguyenWarm2B32K

Qwen1.5-1.8B-fSWIFT-js-ite2

0
·
77
·
May 2026
vitaleantonioWarm8B32K

Qwen2.5-Coder-CONTROL-LEETCODE-7B-Base-1

0
·
77
·
May 2026
jastorjWarm8B32K

snowflake_arctic_text2sql_r1_7b-nl2sqlpp-16bit-v5.7.8_phase_2-cw-16K

0
·
77
·
May 2026
shengjia-torontoWarm2B32K

fgrpo-gspo-cl3e3-qwen25-math-1.5b-step751

0
·
77
·
May 2026
td-builderWarm33B32K

DeepSeek-R1-Distill-Qwen-32B-number-2

0
·
77
·
May 2026
modrillWarm4B32K

mhm_arithmetic__merge_experiments_math_think_11_task_arithmetic_lambda_1p40

0
·
77
·
May 2026
modrillWarm4B32K

mhm_arithmetic__merge_experiments_math_think_11_task_arithmetic_lambda_0p00

0
·
77
·
May 2026
cs-552-2026-RatGPTWarm2B32K

multilingual_model

0
·
77
·
May 2026
cs-552-2026-llmfaoWarm2B32K

math_model

0
·
77
·
May 2026
shrangoWarm2B32K

ascii_advshape_policyshape_qwen3-1.7b-base

0
·
76
·
May 2026
wvnvwnWarm13B4K

llama-2-13b-chat-hf-gsm8k-sn-tuned-lr5e-5

0
·
76
·
May 2026
shrangoWarm2B32K

markovify_advshape_policy_shape_qwen3-1.7b-base

0
·
76
·
May 2026
wvnvwnWarm9B16K

gemma-2-9b-it-only-sn-tuned-lr3e-5

0
·
76
·
May 2026
PS4ResearchWarm14B32K

xE6nV9hA5yW1jT7s

0
·
76
·
May 2026
belatiWarm3B32K

Qwen2.5-3B-Instruct_multireasoner-u_sft1a_merged

0
·
76
·
May 2026
LangaLansarWarm800M32K

Qwen3-0.6B-Reverse-Text-SFT

0
·
76
·
May 2026
cjiaoWarm2B32K

goldengoose-top25_gradsim-25grp

0
·
76
·
May 2026
Fatma04Warm4B32K

Qwen3-4B-EgyptianTech-FT-16bit

0
·
76
·
May 2026
New
modrillWarm4B32K

mhm_arithmetic__merge_experiments_math_think_11_task_arithmetic_lambda_0p80

0
·
76
·
May 2026
AlbertYinWarm4B32K

agentdojo_attacker_qwen3_4b_5_nano

0
·
76
·
May 2026
lschafferWarm4B32K

qwen3-4b-weathersensorsmcp

0
·
76
·
May 2026
New
prototieWarm14B32K

prototie-ai-final

0
·
75
·
May 2026
void-818Warm32B32K

Affine-qwen3_1-5EUk1YtDT55bifiFN3SK2vwymmeaPxMQ4bNz5RdsR6VGcqbu

0
·
75
·
May 2026
Abner0803Warm2B32K

Qwen3-1.7B-icl-3shot-dpo-replace_copy

0
·
75
·
May 2026
zhaohqWarm2B32K

PureRL-1.5B-v6c5-distill-lam03-maskon

0
·
75
·
May 2026
AsphaltProATWarm8B32K

deepseek_r1_distilled_qwen_7B_sparse_50

0
·
75
·
May 2026
vitaleantonioWarm2B32K

Qwen2.5-Coder-PROD-MCEVALHARD-1.5B-Base-6

0
·
75
·
May 2026
modrillWarm4B32K

math_think_11_qwen3_4b_base_task_arithmetic_scaling_0_8

0
·
75
·
May 2026
jgchaparroWarm9B16K

language_garden-tsd-ell-Gemma2-9B_20260520111040-merged

0
·
75
·
May 2026
felixhrdynWarm8B32K

Qwen-3-8B-DGX-UG-Merged

0
·
74
·
May 2026
Rapidd12Warm8B8K

clon-ismael-16bit

0
·
74
·
May 2026
DMSC19Warm32B32K

Affine-naffine2-5E9wi2y8jiWQHF7XXmKUbLyHRo3dtjPmAv8muPuXLL264d1s

0
·
74
·
May 2026
modrillWarm4B32K

mhm_arithmetic__merge_experiments_math_think_11_task_arithmetic_lambda_0p90

0
·
74
·
May 2026
modrillWarm4B32K

mhm_arithmetic__merge_experiments_math_think_11_task_arithmetic_lambda_0p30

0
·
74
·
May 2026
cjiaoWarm2B32K

goldengoose-gumbel_gmrel_tau0.50-25grp

0
·
74
·
May 2026
New