Models

6,193
Zachary1150Warm2B32K

merge_linear_cos0.3fmt0.7_MRL4096_ROLLOUT4_LR1e-6

0
·
0
Zachary1150Warm2B32K

merge_linear_cos0.7fmt0.3_MRL4096_ROLLOUT4_LR1e-6

0
·
0
Zachary1150Warm2B32K

merge_cosfmt_MRL4096_ROLLOUT4_LR5e-7_w0.3_linear

0
·
0
·
Dec 2025
Zachary1150Warm2B32K

merge_cosfmt_MRL4096_ROLLOUT4_LR5e-7_w0.1_linear

0
·
0
·
Dec 2025
Zachary1150Warm2B32K

merge_lenfmt_MRL4096_ROLLOUT4_LR5e-7_w0.5_linear

0
·
0
·
Dec 2025
Zachary1150Warm2B32K

merge_lenfmt_MRL4096_ROLLOUT4_LR5e-7_w0.3_linear

0
·
0
·
Dec 2025
Zachary1150Warm2B32K

merge_lenfmt_MRL4096_ROLLOUT4_LR5e-7_w0.1_linear

0
·
0
·
Dec 2025
ghanalzaWarm1B2K

tom3

0
·
0
Ahmad76543Warm1B2K

M4

0
·
0
·
Sep 2025
btrabuccoWarm2B32K

Insta-Qwen2.5-1.5B-SFT

0
·
0
·
Apr 2025
nagtensorWarm1B2K

q3

0
·
0
·
Sep 2025
URajindaWarm2B32K

qwen1.5b-myanmar-cpt-final

0
·
0
·
Jan 2026
Justin6657Warm2B32K

SB_DS1.5B_alpha_1

0
·
0
·
Apr 2025
daman1209aroraWarm2B32K

alpha_0.4_DeepSeek-R1-Distill-Qwen-1.5B

0
·
0
·
Apr 2025
od2961Warm2B32K

Qwen2.5-1.5B-Open-R1-GRPO-Crosswords-v7

0
·
0
·
Aug 2025
Pompacii31Warm2B32K

Qwen2.5-1.5B-Instruct-Gensyn-Swarm-lanky_hardy_flea

0
·
0
·
Sep 2025
pruningWarm1B2K

sn38-v11-3-1

0
·
0
·
Oct 2025
pruningWarm1B2K

sn38-v11-3-4

0
·
0
·
Oct 2025
sachiniyerWarm2B32K

Qwen2.5-1.5B-SFT-Schwinn

0
·
0
·
Jan 2026
Kazuki1450Warm2B32K

Qwen2.5-1.5B-Instruct_csum_6_10_tok_actions_1p0_0p0_1p0_grpo_42_rule

0
·
0
·
Jan 2026
masaniWarm1B32K

SFT_DeepScaleR_Llama-3.2-1B_epoch_1_global_step_26

0
·
0
·
Jan 2026
ParetoQaftWarm1B32K

1B-Tulu-LoRA-50pct

0
·
0
·
Nov 2025
lhkhiem28Warm2B32K

qwen2.5-1.5b-sft-iter3

0
·
0
·
Oct 2025
mizzaayWarm1B2K

6fcd2dc7

0
·
0
·
Aug 2025
miolgWarm1B2K

97ce37eb

0
·
0
·
Aug 2025
aalv2Warm1B2K

c71-h24

0
·
0
·
Oct 2025
mohitskaushalWarm1B2K

tinyllama-1.1B-geo-merged-lora-ft

0
·
0
·
Nov 2025
LLucassWarm2B32K

TT_L0.2_H0.2_dr_grpo

0
·
0
·
Jun 2025
tao1000Warm1B2K

x4

0
·
0
·
Jun 2025
Ahad5625Warm1B2K

M2

0
·
0
·
Sep 2025
smarttensorWarm1B2K

ycomb1

0
·
0
·
Sep 2025
ferrazzipietroWarm1B32K

Llama-3.2-1B-Instruct-unsup-crf-full-weight-merged

0
·
0
·
Feb 2026
SakthiaravindWarm2B32K

leadbot-full-model

0
·
0
·
Feb 2026
qqoWarm2B32K

dpo-qwen-cot-merged

1
·
0
·
Feb 2026
bazazzWarm1B2K

has3

0
·
0
·
Sep 2025
KobeBeef67Warm1B32K

llama-3.2-1B-code-merged

0
·
0
·
Nov 2025
NovacianoWarm1B32K

GLM-4.7-TrashFlash-Think.Sorete-1B

0
·
0
·
Feb 2026
nostalgicskincoWarm1B32K

air-compliance-llama-1b

0
·
0
·
Feb 2026
open-unlearningWarm1B32K

unlearn_tofu_Llama-3.2-1B-Instruct_forget10_NPO_lr5e-05_beta0.1_alpha2_epoch5

0
·
0
·
May 2025
Darkstorm18-12Warm1B2K

monkey-assistant-v2

0
·
0
·
Feb 2026
UmbrellaIncWarm1B32K

Albert_Wesker-1B

2
·
0
·
Mar 2026
august66Warm2B32K

hh_qwen1.5_drpo_gated_fixed_beta

0
·
0
·
Mar 2026