Models

3,116
NhatCuong22Warm8B32K

qwen2.5-7b-proofdag-sft

0
·
82
·
May 2026
sohamb37lexsiWarm4B32K

curatorkit-both-filtered-qwen3-1b7

0
·
82
·
May 2026
New
cjiaoWarm2B32K

goldengoose-gumbel_tau0.10-25grp

0
·
82
·
May 2026
LexsiWarm4B32K

qwen3-4b-dolly-sft-drift

0
·
82
·
May 2026
cs-552-2026-MandMPWarm2B32K

group_model

0
·
82
·
May 2026
Radiant28Warm2B32K

evolai-mamba2-0047b

0
·
81
·
Apr 2026
PS4ResearchWarm14B32K

sH3yF7bQ1dL6nV9m

0
·
81
·
May 2026
nomeda-labWarm4B32K

Fattah-Orch-Medium

0
·
81
·
May 2026
LotalizWarm2B32K

Qwen3-1.7B-dpo

0
·
81
·
May 2026
relex-rlvrWarm2B32K

RELEX-Qwen2.5-Math-1.5B

0
·
81
·
May 2026
anku03Warm7B4K

QueryForge-Mistral-7B-SQL

0
·
81
·
May 2026
New
0x0daughter1Warm32B32K

Affine-5D2HtVbFwWegJTi2XxzBXjmZ6rMn7BuAGhCVhBEvhJrhtkN5

0
·
80
·
Apr 2026
lenitokoreWarm32B32K

affine-5GuSjLJHD8Y2fefehrzVUg1yLzr5YEhSZzoK52XFkaoLr2WV

0
·
80
·
May 2026
vitaleantonioWarm2B32K

Qwen2.5-Coder-PROD-MCEVALHARD-1.5B-Base-7

0
·
80
·
May 2026
nicorrea23Warm3B32K

pash-test-1

0
·
80
·
May 2026
thallesf1Warm3B32K

qwen2.5-3b-medpt-lora

0
·
80
·
May 2026
jvonradWarm8B32K

Llama-3.1-8B-TED

0
·
80
·
May 2026
shengjia-torontoWarm2B32K

sac-gspo-cl3e3-drgrpo-r1distill-qwen1.5b-24k-temp1-step641

0
·
80
·
May 2026
New
Dark-DaviesWarm2B32K

fusionai-v.2.0

0
·
80
·
May 2026
modrillWarm4B32K

mhm_arithmetic__merge_experiments_math_think_11_task_arithmetic_lambda_1p00

0
·
80
·
May 2026
modrillWarm4B32K

mhm_arithmetic__merge_experiments_math_think_11_task_arithmetic_lambda_0p20

0
·
80
·
May 2026
modrillWarm4B32K

mhm_arithmetic__merge_experiments_math_no_think_17_task_arithmetic_lambda_0p50

0
·
80
·
May 2026
LexsiWarm8B32K

llama31-8b-dolly-sft-drift

0
·
80
·
May 2026
belatiWarm3B32K

Qwen2.5-3B-Instruct_multireasoner_sft-1a_merged

0
·
80
·
May 2026
ahmet-ermanWarm8B32K

Qwen2.5-7B-turkish-culture-veri_2_half_epoch_

0
·
80
·
May 2026
New
JasonZhanETHWarm8B8K

llama31_jailbreak_scale8192

0
·
79
·
May 2026
CraneAILabsWarm1B32K

EduGanda-Gemma-3-1B

0
·
79
·
May 2026
vitaleantonioWarm8B32K

Qwen2.5-Coder-TA-MCEVALHARD-7B-Base

0
·
79
·
May 2026
cjiaoWarm2B32K

goldengoose-gumbel_tau1.00-25grp

0
·
79
·
May 2026
kairawalWarm4B32K

Qwen3-4B-GA-SynthDolly-r16alpha128-E5-S73

0
·
79
·
May 2026
New
LexsiWarm3B32K

llama32-3b-code-sft-drift

0
·
79
·
May 2026
cs-552-2026-mvteWarm2B32K

math_model

0
·
79
·
May 2026
haoranli-mlWarm9B8K

Gemma-7B-HardClip-Base-theta_200k

0
·
78
·
May 2026
kmseongWarm7B4K

llama2_7b_chat_gsm8k_resta_gamma0.3

0
·
78
·
May 2026
wvnvwnWarm9B16K

gemma-2-9b-it-ssft-lr3e-5

0
·
78
·
Apr 2026
ligaments-devWarm2B32K

Qwen2.5-1.5B-Instruct-itr-lora

0
·
78
·
Apr 2026
yunhowhourWarm4B32K

Qwen3-4B_CRRL_batch_1024_B200_ds_samplelevelmean_step_110

0
·
78
·
May 2026
parkjoWarm3B32K

Llama-3.2-3B-Instruct_grpo_adv_rollout_8_20260502_233833_step580

0
·
78
·
May 2026
emajoch1Warm8B8K

tulu-3.1-8b-loraplus-abstention

0
·
78
·
May 2026
howardtodd635Warm32B32K

Affine-RL4-5GjvyRPAtvikG73ko9qx47pUHWPPikf6DsZWHrEDSCShNhJr

0
·
78
·
May 2026
cs-552-2026-qwenlifegivesyoulemonsWarm2B32K

group_model

0
·
78
·
May 2026
libvmWarm8B32K

mm-cand-aim_on_task_arithmetic__calib_instruction

0
·
78
·
May 2026