Models

6,281
miolgWarm1B2K

t7

0
·
2
·
Sep 2025
miolgWarm1B2K

t9

0
·
2
·
Sep 2025
zeras141aWarm1B2K

a6

0
·
2
·
Sep 2025
mizzaayWarm1B2K

vv9

0
·
2
·
Sep 2025
Humair6743Warm1B2K

M1

0
·
2
·
Sep 2025
Humair6743Warm1B2K

M2

0
·
2
·
Sep 2025
Humair6743Warm1B2K

M3

0
·
2
·
Sep 2025
ncaagccWarm1B2K

b2

0
·
2
·
Sep 2025
MhairWarm1B2K

K160

0
·
2
·
Sep 2025
mizzaayWarm1B2K

tw2

0
·
2
·
Sep 2025
Ali32311Warm1B2K

M1

0
·
2
·
Sep 2025
miolgWarm1B2K

bz1

0
·
2
·
Sep 2025
ballandaWarm1B2K

ball4

0
·
2
·
Sep 2025
MhairWarm1B2K

KW

0
·
2
·
Sep 2025
MhairWarm1B2K

K187

0
·
2
·
Sep 2025
realtreetuneWarm2B32K

delethink-96k-ckpt150

0
·
2
·
Sep 2025
xxzazWarm1B2K

hed1

0
·
2
·
Oct 2025
mingdsaWarm1B2K

xdsaz3

0
·
2
·
Oct 2025
adakajuanWarm1B2K

adakajuan

0
·
2
·
Oct 2025
loben0505Warm1B2K

d_m16

0
·
2
·
Oct 2025
codexivoryWarm1B2K

4f5bdb62

0
·
2
·
Oct 2025
raomnbWarm1B2K

SN388

0
·
2
·
Oct 2025
omrisapWarm2B32K

Qwen2.5-Math-1.5B-5K-SFT-think

0
·
2
·
Nov 2025
PerHavardWarm1B2K

tinyllama-base

0
·
2
·
Nov 2025
brez47Warm2B32K

Qwen2.5-Coder-1.5B-Instruct-Gensyn-Swarm-spotted_exotic_raccoon

0
·
2
·
Nov 2025
TfloowWarm1B32K

Llama-3.2-1B-adpq-4bit-sim

0
·
2
od2961Warm2B32K

Qwen2.5-1.5B-Open-R1-GRPO-math-2k

0
·
2
·
Dec 2025
Zachary1150Warm2B32K

expert_cos_MRL4096_ROLLOUT4_LR1e-6_step50

0
·
2
·
Dec 2025
Zachary1150Warm2B32K

expert_len_MRL4096_ROLLOUT4_LR1e-6_step50

0
·
2
Zachary1150Warm2B32K

merge_linear_len0.3fmt0.7_MRL4096_ROLLOUT4_LR1e-6

0
·
2
gshasiriWarm1B32K

dpo-llama3.2-gspo-original-200

0
·
2
·
Dec 2025
Zachary1150Warm2B32K

merge_cosfmt_MRL4096_ROLLOUT4_LR5e-7_w0.9_linear

0
·
2
·
Dec 2025
Prat78Warm1B32K

StudyAi

0
·
2
·
Dec 2025
Zachary1150Warm2B32K

merge_cosfmt_MRL4096_ROLLOUT4_LR2e-6_w0.9_linear

0
·
2
·
Dec 2025
Zachary1150Warm2B32K

merge_cosfmt_MRL4096_ROLLOUT4_LR2e-6_w0.7_linear

0
·
2
·
Dec 2025
Zachary1150Warm2B32K

merge_lenfmt_MRL4096_ROLLOUT4_LR2e-6_w0.9_linear

0
·
2
·
Dec 2025
Zachary1150Warm2B32K

merge_lenfmt_MRL4096_ROLLOUT4_LR2e-6_w0.7_linear

0
·
2
·
Dec 2025
Zachary1150Warm2B32K

merge_lenfmt_MRL4096_ROLLOUT4_LR2e-6_w0.3_linear

0
·
2
·
Dec 2025
ShahriarFerdoushWarm1B32K

llama-3.2-1b-math-solver

0
·
2
·
Dec 2025
chunchiliuWarm2B32K

Qwen2.5-Coder-1.5B-Instruct-Gensyn-Swarm-durable_lethal_locust

0
·
2
·
Dec 2025
Zachary1150Warm2B32K

merge_accfmt_MRL4096_ROLLOUT4_LR2e-6_w0.5_ties

0
·
2
·
Dec 2025
Zachary1150Warm2B32K

merge_accfmt_MRL4096_ROLLOUT4_LR2e-6_w0.5_dare_ties

0
·
2
·
Dec 2025