Models

39,598
JameSandWarm4B32K

qwen3-4b-base-svd-muon-adam-1e-6-adamlr-1e-6-bs128-kl0.0-global_step_60

0
·
1
·
Jan 2026
JameSandWarm4B32K

qwen3-4b-base-svd-muon-adam-1e-6-adamlr-1e-6-bs128-kl0.0-global_step_40

0
·
1
·
Jan 2026
junfengzhouWarm14B32K

qwen3-14b-rl

0
·
1
·
Jan 2026
bespokelabsWarm8B32K

qwen3-8b-sft-datamix-350

0
·
1
·
May 2025
cxzaazsWarm1B2K

gabx3

0
·
1
·
Oct 2025
Javelin0192Warm800M32K

Qwen3-0.6B-Gensyn-Swarm-powerful_whiskered_barracuda

0
·
1
·
Oct 2025
polaris-73Warm4B32K

qwen3-4b_grpo_skywork_math-global_step_100

0
·
1
·
Nov 2025
narabzadWarm33B32K

s1K-1.1_tokenized-fromHF-githubcode-torchrun

0
·
1
·
Dec 2025
didula-wso2Warm8B32K

exp_24_0_clsft_16bit_vllm

0
·
1
·
Dec 2025
woshixuhangWarm33B32K

SiriusAI-Text2SQL-32B-v3

0
·
1
·
Dec 2025
gjyotin305Warm8B32K

Qwen2.5-7B-Instruct_old_sft_alpaca_007

0
·
1
·
Jan 2026
gjyotin305Warm8B32K

Meta-Llama-3.1-8B-Instruct_old_sft_alpaca_007

0
·
1
·
Jan 2026
gjyotin305Warm3B32K

Llama-3.2-3B-Instruct_old_sft_alpaca_001

0
·
1
·
Jan 2026
gjyotin305Warm8B32K

Meta-Llama-3.1-8B-Instruct_old_sft_alpaca_001

0
·
1
·
Jan 2026
yufeng1Warm8B32K

OpenThinker-7B-summary-type3-e1-10000

0
·
1
·
Jan 2026
gjyotin305Warm3B32K

Llama-3.2-3B-Instruct_new_alpaca_005

0
·
1
·
Jan 2026
myersjaytWarm8B32K

TwinLlama-3.1-8B-DPO

0
·
1
·
Jan 2026
shuoxingWarm8B32K

qwen2-5-7b-full-pretrain-control-tweet-1m-en-reproduce-bs8

0
·
1
·
Jan 2026
AznaurWarm8B32K

tbench-qwen-sft-multitask-clean-v10

0
·
1
·
Jan 2026
MultiRLWarm2B32K

qwen3_1.7b_rush_hour_one_move_4_9_epoch2

0
·
1
·
Jan 2026
rosieyzhWarm1B32K

rlvr_llama1_warmstart_bleu_alma_rbz_256_ckpt_2_of_10

0
·
1
·
Jan 2026
rosieyzhWarm1B32K

rlvr_llama1_warmstart_bleu_alma_rbz_256_ckpt_7_of_10

0
·
1
·
Jan 2026
rosieyzhWarm1B32K

sft_llama1_alma_lr_1e-5_cosine_bsz_128_ckpt_5_of_5

0
·
1
·
Jan 2026
gjyotin305Warm8B32K

Qwen2.5-7B-Instruct_new_alpaca_009

0
·
1
·
Jan 2026
AznaurWarm8B32K

tbench-qwen-sft-multitask-nat-v11

0
·
1
·
Jan 2026
lucasaidevWarm14B32K

Affine-5GRCUvyeR5sHNFjWGXbW8A5vbJWtBUr8qa5mK8fDd6uspNm9

0
·
1
·
Jan 2026
MultiRLWarm2B32K

qwen3_1.7b_sudoku_one_action_easy_21_30_epoch1

0
·
1
·
Jan 2026
MultiRLWarm2B32K

qwen3_1.7b_sudoku_one_action_easy_21_30_epoch2

0
·
1
·
Jan 2026
MultiRLWarm2B32K

qwen3_1.7b_sudoku_one_action_easy_21_30_epoch3

0
·
1
·
Jan 2026
polaris-73Warm2B32K

ds1p5b_skywork_math_hard-global_step_300

0
·
1
·
Jan 2026
MultiRLWarm2B32K

qwen3_1.7b_rush_hour_multi_move_final_short_4_9_epoch2

0
·
1
·
Jan 2026
MultiRLWarm2B32K

qwen3_1.7b_rush_hour_multi_move_final_short_4_9

0
·
1
·
Jan 2026
HahmdongWarm8B32K

AT-qwen2.5-7b-hhrlhf-5120-dpo-ai-ver17-step-40

0
·
1
·
Jan 2026
HahmdongWarm8B32K

AT-qwen2.5-7b-hhrlhf-5120-dpo-ai-ver17-step-50

0
·
1
·
Jan 2026
HahmdongWarm8B32K

AT-qwen2.5-7b-hhrlhf-5120-dpo-ai-ver17-step-70

0
·
1
·
Jan 2026
ElfsongWarm32B32K

VLM_stage_2_iter_0004000

0
·
1
·
Jan 2026
sagnikMWarm8B32K

grpo_rmsprop_llama3p1_8b_3k_seqlen_1e-7

0
·
1
·
Jan 2026
motigrezWarm73B32K

codecontest_qwen2.5_72b_grpo

0
·
1
·
Jan 2026
seele123Warm8B32K

MATH-Qwen2.5-math-7B-ReMax-L2O-NoBaseline

0
·
1
·
Jan 2026
vericavaWarm8B32K

Qwen2.5-7B-ja-struct-tooled-base

1
·
1
·
Jan 2026
AljalajilWarm14B32K

Saudi-Judge-Merged-16bit

0
·
1
·
Jan 2026
WeymouthWarm500M32K

Qwen2.5-0.5B-Instruct-Gensyn-Swarm-downy_dense_starfish

0
·
1
·
Apr 2025