Models

39,872
NicklandsharkWarm2B32K

Qwen3-1.7B-Wordle-RL

0
·
2
·
Jan 2026
miolgWarm1B2K

e1

0
·
2
·
Jun 2025
aitfindonesiaWarm8B32K

KomdigiUB-8B-Instruct-DTP

1
·
2
·
Dec 2025
aidenjhwuWarm8B32K

SearchAgent-8B

0
·
2
·
Dec 2025
gjyotin305Warm8B32K

Meta-Llama-3.1-8B-Instruct_old_sft_alpaca_009

0
·
2
·
Jan 2026
URajindaWarm2B32K

qwen1.5b-myanmar-cpt-final1

0
·
2
·
Jan 2026
bimabkWarm500M32K

environment_test

0
·
2
·
Jan 2026
shuoxingWarm8B32K

qwen2-5-7b-full-pretrain-mix-high-tweet-1m-en-reproduce-bs8

0
·
2
·
Jan 2026
gjyotin305Warm8B32K

Qwen2.5-7B-Instruct_new_alpaca_005

0
·
2
·
Jan 2026
tom9491Warm8B32K

Affine-0vd-5GYSB6CyZdc6gugDecWAzbchktQPNNLP1ZxVQULkmcW7YQe8

0
·
2
·
Jan 2026
MultiRLWarm2B32K

qwen3_1.7b_rush_hour_one_move_4_9_epoch1

0
·
2
·
Jan 2026
MultiRLWarm2B32K

qwen3_1.7b_rush_hour_one_move_4_9

0
·
2
·
Jan 2026
Kazuki1450Warm2B32K

Qwen3-1.7B-Base_csum_6_10_geq_8_geq_8_0p75_0p5_1p0_0p0_1p0_grpo_42_rule

0
·
2
·
Jan 2026
polaris-73Warm2B32K

ds1p5b_code_sandbox-global_step_800

0
·
2
·
Jan 2026
MultiRLWarm2B32K

qwen3_1.7b_rush_hour_multi_move_final_10_12

0
·
2
·
Jan 2026
polaris-73Warm2B32K

ds1p5b_skywork_math_hard-global_step_200

0
·
2
·
Jan 2026
MultiRLWarm2B32K

qwen3_1.7b_sudoku_multi_action_easy_11_20_epoch3

0
·
2
·
Jan 2026
sagnikMWarm2B32K

grpo_rmsprop_qwen3_1p7b_3k_seqlen_1e-6

0
·
2
·
Jan 2026
sagnikMWarm2B32K

grpo_rmsprop_qwen3_1p7b_3k_seqlen_1e-5

0
·
2
·
Jan 2026
motigrezWarm8B32K

scienceworld_grpo_qwen2.5_7b_50_10_step50

0
·
2
·
Jan 2026
atsuki-yamaguchiWarm8B32K

Qwen2.5-7B-Instruct-my-madlad-mean-tuned

0
·
2
·
Nov 2024
tao1000Warm1B2K

gra4

0
·
2
·
Jul 2025
LegendaryDawnWarm3B32K

erpo-iclr-ours-Qwen2.5-3b-corr_gen_s002_max12

0
·
2
·
Oct 2025
Ericu950Warm8B32K

Epigr_3_Llama-3.1-8B-Instruct_text

0
·
2
·
Nov 2024
xiaoyu2691Warm800M32K

Qwen3-0.6B-Gensyn-Swarm-bold_feathered_antelope

0
·
2
·
Sep 2025
giguanWarm1B2K

giguan

0
·
2
·
Oct 2025
laionWarm8B32K

exp_tas_top_k_64_traces

0
·
2
·
Jan 2026
DevopsEmbraceWarm32B32K

qwen3_32B_embrace_cpt_IV_e1_synthetic_context_3_merged_16bit

0
·
2
·
Jan 2026
dai3107Warm2B32K

qwen2.5-1.5b-pro

0
·
2
·
Jan 2026
reds0510Warm3B32K

nvidia_math_cot_1e5_v2_ep5

0
·
2
·
Jan 2026
rosieyzhWarm2B32K

sft_qwen15_code200_lr_1e-5_cosine_bsz_128_ckpt_2_of_5

0
·
2
·
Jan 2026
rosieyzhWarm2B32K

sft_qwen15_code200_lr_5e-6_constant_bsz_128_ckpt_4_of_5

0
·
2
·
Jan 2026
jed351Warm4B32K

Gemma3-4B-ChatVector_SFT-from-IT_and_IT

0
·
2
·
Jan 2026
jastorjWarm8B32K

snowflake_arctic_text2sql_r1_7b-nl2sqlpp-16bit-v5.3-cw-15K

0
·
2
·
Jan 2026
mini97Warm3B32K

llama3.2-3b_grpo_entropy_adv

0
·
2
·
Jan 2026
MultiRLWarm2B32K

qwen3_1.7b_rush_hour_multi_move_final_short_4_9_epoch3

0
·
2
·
Jan 2026
jamilfordenWarm14B32K

Affine-Troll_5ELgsVcXy9XmcwPotZLg84HDriGJ7iMbTFfqVdShkz3Hz7Xi

0
·
2
·
Jan 2026
asingh15Warm4B32K

qwen-arc-abs-gpt5.2-sft-fewshot4-1epoch-icmlpaper-0125

0
·
2
·
Jan 2026
NeelectricWarm8B32K

Llama-3.1-8B-Instruct_SFT_Chat-220kv00.05

0
·
2
·
Jan 2026
LegendaryDawnWarm4B32K

SDRL-rand-Qwen3-4B-Base-icml-self-debate-random_n8_l2048-DAPO_n8_bs256_long8-step200

0
·
2
·
Jan 2026
ericoh929Warm2B32K

qwen3-1.7b-base-instruction-tuning-full-sft

0
·
2
·
Jan 2026
rrvaswinWarm1B32K

1_to_16_analysis

0
·
2
·
Jan 2026