Models

6,281
Zachary1150Warm2B32K

merge_lenfmt_MRL4096_ROLLOUT4_LR2e-6_w0.5_dare_ties

0
·
2
·
Dec 2025
Zachary1150Warm2B32K

merge_accfmt_MRL4096_ROLLOUT4_LR5e-7_w0.5_ties

0
·
2
·
Dec 2025
Zachary1150Warm2B32K

merge_cosfmt_MRL4096_ROLLOUT4_LR5e-7_w0.5_ties_density0.2

0
·
2
·
Jan 2026
Zachary1150Warm2B32K

merge_cosfmt_MRL4096_ROLLOUT4_LR5e-7_w0.5_dare_ties_density0.2

0
·
2
·
Jan 2026
Zachary1150Warm2B32K

merge_lenfmt_MRL4096_ROLLOUT4_LR5e-7_w0.5_dare_ties_density0.2

0
·
2
·
Jan 2026
hayagoWarm1B32K

Veloce-1B

0
·
2
·
Jan 2026
aki-008Warm2B32K

model-16bit

0
·
2
·
Jan 2026
akshayballalWarm2B32K

Qwen2.5-1.5B-Instruct-SFT-Pubmed-16bit-DFT

0
·
2
·
Jan 2026
unrented5443Warm1B2K

sn38-v2-5

0
·
2
·
Jun 2025
gshasiriWarm1B32K

dpo-llama3.2-gspo-original-400

0
·
2
·
Dec 2025
ld9466311Warm1B2K

c66-h12

0
·
2
·
Jun 2025
Prat78Warm1B32K

StudyAiv17

0
·
2
·
Jan 2026
hkust-nlpWarm2B32K

Laser-L8192-1.5B

0
·
2
·
May 2025
rrvaswinWarm1B32K

STaR_RL_DAPO

0
·
2
·
Jan 2026
ScaleML-RLHFWarm2B32K

Qwen2.5-Math-1.5B-grpo-plusplus-numina_math_15_all-n4-step_140

0
·
2
·
Mar 2025
penguin102Warm1B2K

c66-h28

0
·
2
·
Jun 2025
jtlicardoWarm1B32K

llama_3.2-1b-ecommerce-intent-finetuned

0
·
2
·
Jul 2025
wuxingyuWarm2B32K

LAPO-I

1
·
2
·
Sep 2025
STR-NaNWarm1B2K

llama-v11-hot-15

0
·
2
·
Oct 2025
strnanWarm1B2K

llama-v11-hot-17

0
·
2
·
Oct 2025
letters363Warm1B2K

20729c9c

0
·
2
·
Oct 2025
sapajarwaWarm1B2K

sapajarwa

0
·
2
·
Oct 2025
APPA-ClemWarm1B2K

Mini-mistral-1.0

0
·
2
·
Dec 2025
aki-008Warm2B32K

Zindi_RAC-Qwen2.5-1.5B-Instruct-Think-16-bit

0
·
2
·
Dec 2025
Zachary1150Warm2B32K

expert_acc_MRL4096_ROLLOUT4_LR1e-6_step50

0
·
2
·
Dec 2025
Zachary1150Warm2B32K

binary_accfmt_MRL4096_ROLLOUT4_LR1e-6_step50

0
·
2
·
Dec 2025
URajindaWarm2B32K

Qwen2.5-MM-1.5B-v1.0

0
·
2
·
Dec 2025
NoNameFoundWarm2B32K

qwen2.51.5B-chess-sft-2

0
·
2
·
Dec 2025
Zachary1150Warm2B32K

binary_cosfmt_MRL4096_ROLLOUT4_LR5e-7_step54

0
·
2
·
Dec 2025
URajindaWarm2B32K

ShweYon-Qwen2.5-Burmese-1.5B-v1.0

0
·
2
·
Dec 2025
Zachary1150Warm2B32K

merge_cosfmt_MRL4096_ROLLOUT4_LR5e-7_w0.5_pcb

0
·
2
·
Jan 2026
Zachary1150Warm2B32K

merge_lenfmt_MRL4096_ROLLOUT4_LR5e-7_w0.5_pcb

0
·
2
·
Jan 2026
Zachary1150Warm2B32K

merge_accfmt_MRL4096_ROLLOUT4_LR1e-6_w0.5_pcb

0
·
2
·
Jan 2026
Zachary1150Warm2B32K

merge_accfmt_MRL4096_ROLLOUT4_LR5e-7_w0.5_tall_mask_ta

0
·
2
·
Jan 2026
Zachary1150Warm2B32K

merge_cosfmt_MRL4096_ROLLOUT4_LR5e-7_w0.5_tall_mask_ta

0
·
2
·
Jan 2026
Zachary1150Warm2B32K

merge_lenfmt_MRL4096_ROLLOUT4_LR5e-7_w0.5_tall_mask_ta

0
·
2
·
Jan 2026
Prat78Warm1B32K

StudyAiv19

0
·
2
·
Jan 2026
sjelassiWarm2B32K

qwen_25_1_5b_omi_code_100k_200tok

0
·
2
·
Jan 2026
akhil-duaWarm1B32K

llama-3.2-1b-redteam_ift

0
·
2
·
Jan 2026
Umesh1212Warm1B2K

k8s-phi3-vllm

0
·
2
·
Jan 2026
jackf857Warm1B32K

llama32-1b-dpo-hh-rollout

0
·
2
·
Jan 2026
JameSandWarm2B32K

ds-adam-1e-6-global_step_200

0
·
2
·
Jan 2026