t7
t9
a6
vv9
M1
M2
M3
b2
K160
tw2
bz1
ball4
KW
K187
delethink-96k-ckpt150
hed1
xdsaz3
adakajuan
d_m16
4f5bdb62
SN388
Qwen2.5-Math-1.5B-5K-SFT-think
tinyllama-base
Qwen2.5-Coder-1.5B-Instruct-Gensyn-Swarm-spotted_exotic_raccoon
Llama-3.2-1B-adpq-4bit-sim
Qwen2.5-1.5B-Open-R1-GRPO-math-2k
expert_cos_MRL4096_ROLLOUT4_LR1e-6_step50
expert_len_MRL4096_ROLLOUT4_LR1e-6_step50
merge_linear_len0.3fmt0.7_MRL4096_ROLLOUT4_LR1e-6
dpo-llama3.2-gspo-original-200
merge_cosfmt_MRL4096_ROLLOUT4_LR5e-7_w0.9_linear
StudyAi
merge_cosfmt_MRL4096_ROLLOUT4_LR2e-6_w0.9_linear
merge_cosfmt_MRL4096_ROLLOUT4_LR2e-6_w0.7_linear
merge_lenfmt_MRL4096_ROLLOUT4_LR2e-6_w0.9_linear
merge_lenfmt_MRL4096_ROLLOUT4_LR2e-6_w0.7_linear
merge_lenfmt_MRL4096_ROLLOUT4_LR2e-6_w0.3_linear
llama-3.2-1b-math-solver
Qwen2.5-Coder-1.5B-Instruct-Gensyn-Swarm-durable_lethal_locust
merge_accfmt_MRL4096_ROLLOUT4_LR2e-6_w0.5_ties
merge_accfmt_MRL4096_ROLLOUT4_LR2e-6_w0.5_dare_ties