Models

39,972
ElfsongWarm32B32K

VLM_stage_2_iter_0004000

0
·
1
·
Jan 2026
sagnikMWarm8B32K

grpo_rmsprop_llama3p1_8b_3k_seqlen_1e-7

0
·
1
·
Jan 2026
motigrezWarm73B32K

codecontest_qwen2.5_72b_grpo

0
·
1
·
Jan 2026
seele123Warm8B32K

MATH-Qwen2.5-math-7B-ReMax-L2O-NoBaseline

0
·
1
·
Jan 2026
vericavaWarm8B32K

Qwen2.5-7B-ja-struct-tooled-base

1
·
1
·
Jan 2026
AljalajilWarm14B32K

Saudi-Judge-Merged-16bit

0
·
1
·
Jan 2026
WeymouthWarm500M32K

Qwen2.5-0.5B-Instruct-Gensyn-Swarm-downy_dense_starfish

0
·
1
·
Apr 2025
chuksfestus770Warm800M32K

Qwen3-0.6B-Gensyn-Swarm-thriving_miniature_chinchilla

0
·
1
·
Sep 2025
LegendaryDawnWarm8B32K

erpo-iclr-ours-Qwen2.5-7b-corr_gen_s005_max14

0
·
1
·
Oct 2025
xiaoyu2691Warm800M32K

Qwen3-0.6B-Gensyn-Swarm-bold_feathered_antelope

0
·
1
·
Sep 2025
pseryte1Warm500M32K

Qwen2.5-Coder-0.5B-Instruct-Gensyn-Swarm-wary_leggy_rabbit

0
·
1
·
Nov 2025
freakynitWarm800M32K

Qwen3-0.6B-abliterated

0
·
1
·
Nov 2025
trashpanda-orgWarm24B32K

3

0
·
1
·
Dec 2025
zycaliceWarm33B32K

qwen-coder-insecure-2-lr5e5-sgd-linear

0
·
1
·
Jan 2026
joaomdaltoeWarm2B32K

me-qwen2.5-1.5B-sft

0
·
1
·
Jan 2026
rosieyzhWarm2B32K

sft_qwen15_code200_lr_1e-5_cosine_bsz_128_ckpt_1_of_5

0
·
1
·
Jan 2026
rosieyzhWarm2B32K

sft_qwen15_code200_lr_1e-5_cosine_bsz_128_ckpt_3_of_5

0
·
1
·
Jan 2026
rosieyzhWarm2B32K

sft_qwen15_code200_lr_1e-5_cosine_bsz_128_ckpt_4_of_5

0
·
1
·
Jan 2026
rosieyzhWarm2B32K

sft_qwen15_code200_lr_1e-5_cosine_bsz_128_ckpt_5_of_5

0
·
1
·
Jan 2026
rosieyzhWarm2B32K

sft_qwen15_code200_lr_1e-5_cosine_bsz_64_ckpt_1_of_5

0
·
1
·
Jan 2026
rosieyzhWarm2B32K

sft_qwen15_code200_lr_1e-5_cosine_bsz_64_ckpt_3_of_5

0
·
1
·
Jan 2026
rosieyzhWarm2B32K

sft_qwen15_code200_lr_1e-5_cosine_bsz_64_ckpt_4_of_5

0
·
1
·
Jan 2026
rosieyzhWarm2B32K

sft_qwen15_code200_lr_1e-5_cosine_bsz_64_ckpt_5_of_5

0
·
1
·
Jan 2026
rosieyzhWarm2B32K

sft_qwen15_code200_lr_5e-6_constant_bsz_128_ckpt_1_of_5

0
·
1
·
Jan 2026
rosieyzhWarm2B32K

sft_qwen15_code200_lr_5e-6_constant_bsz_128_ckpt_2_of_5

0
·
1
·
Jan 2026
rosieyzhWarm2B32K

sft_qwen15_code200_lr_5e-6_constant_bsz_128_ckpt_3_of_5

0
·
1
·
Jan 2026
rosieyzhWarm2B32K

sft_qwen15_code200_lr_5e-6_constant_bsz_128_ckpt_5_of_5

0
·
1
·
Jan 2026
rosieyzhWarm2B32K

sft_qwen15_code200_lr_5e-6_constant_bsz_64_ckpt_1_of_5

0
·
1
·
Jan 2026
rosieyzhWarm2B32K

sft_qwen15_code200_lr_5e-6_constant_bsz_64_ckpt_2_of_5

0
·
1
·
Jan 2026
rosieyzhWarm2B32K

sft_qwen15_code200_lr_5e-6_constant_bsz_64_ckpt_3_of_5

0
·
1
·
Jan 2026
rosieyzhWarm2B32K

sft_qwen15_code200_lr_5e-6_constant_bsz_64_ckpt_4_of_5

0
·
1
·
Jan 2026
rosieyzhWarm2B32K

sft_qwen15_code200_lr_5e-6_constant_bsz_64_ckpt_5_of_5

0
·
1
·
Jan 2026
mini97Warm8B32K

qwen2.5-math-7b_grpo_entropy_adv

0
·
1
·
Jan 2026
koutchWarm8B32K

paper_llama_llama3.1-8b_train_sft_all_train_code

0
·
1
·
Jan 2026
neulabWarm14B32K

cso-q3-14b-32x4-swe_smith-multilevel_f1_minimum-custom_tool-400

0
·
1
·
Jan 2026
talzoomanzooWarm8B32K

qwen2.5-7b-instruct-kk-best

0
·
1
·
Jan 2026
seele123Warm8B32K

MATH-Qwen2.5-math-7B-GRPO

0
·
1
·
Jan 2026
AlexanderWang915Warm3B32K

qwen2.5-3b-icd10-top50-multi-task

0
·
1
·
Jan 2026
nph4rdWarm800M32K

Qwen3-0.6B-Tiny-Hanabi-XML-SFT

0
·
1
·
Jan 2026
sagnikMWarm8B32K

grpo_rmsprop_qwen3-8b_3k_seqlen

0
·
1
·
Jan 2026
nph4rdWarm2B32K

Qwen3-1.7B-Tiny-Hanabi-XML-SFT

0
·
1
·
Jan 2026
t2anceWarm2B32K

SFT-Warmup-1.7B-BCB

0
·
1
·
Jan 2026