Models

14,755
reds0510Warm3B32K

evolved_set1_correct_12k_ep10

0
·
3
·
Jan 2026
akseljoonasWarm4B32K

qwen3-4b-dpo-hh-rlhf-reversed

0
·
3
·
Jan 2026
zeynebnkWarm8B32K

qwen7b_bcb_grpo_step80

0
·
3
·
Jan 2026
gjyotin305Warm8B32K

Qwen2.5-7B-Instruct_old_sft_alpaca_003

0
·
3
·
Jan 2026
jackf857Warm1B32K

Llama32-1b-Instruct-hh-sft-30

0
·
3
·
Jan 2026
Mahesh111000Warm4B32K

Anonymopus_Kaou6

0
·
3
·
Jan 2026
NorraweeWarm4B32K

Qwen3-4B-Thinking-2507-exp05

0
·
3
·
Jan 2026
Prat78Warm1B32K

StudyAiv22

0
·
3
·
Jan 2026
yurunyWarm3B32K

agentic-futoshiki-NonMarkov_qwen2.5-3B-5e-6_gt-SFT_10k

0
·
3
·
Jan 2026
NovacianoWarm3B8K

What.Is.This.Shit_RP-2B

0
·
3
·
Jan 2026
funny790Warm14B32K

Affine-193-5CtmVuY8eCeumgbEps55Bknw9vjuLqHsiQH7dcc3kaXXUb7r

0
·
3
·
Jan 2026
jasonhuang3Warm3B32K

99-caldpo-dataset-our-39-llama3-2-3b-instruct-merged

0
·
3
·
Jan 2026
quicklandWarm4B32K

Affine_5DJHkQEio6qSayH3woPeahUXBsB4Dg5WdJuNCvgVhxcoqfKY

0
·
3
·
Jan 2026
Kazuki1450Warm2B32K

Qwen3-1.7B-Base_csum_6_10_final_1p0_0p0_1p0_grpo_42_rule

0
·
3
·
Jan 2026
akseljoonasWarm4B32K

Qwen3-4B-DPO

0
·
3
·
Jan 2026
zktmpWarm8B32K

vd-8-step58

0
·
3
·
Jan 2026
MelchiorVosWarm8B32K

Llama-3.1-8B-Benefit-Specialist

0
·
3
·
Jan 2026
koutchWarm4B32K

short_paper_qwen_1.json_train_dpo_v4_train_no_think

0
·
3
·
Jan 2026
aiseosaeWarm7B4K

Affine-5HSp1dWtGppxvnsRvDYsWMwWMihzZbftwUU12LGAfwhnECdp

0
·
3
·
Jan 2026
wls04Warm2B32K

Qwen3-1.7B-FKD

0
·
3
·
Jan 2026
yurunyWarm3B32K

agentic-sudoku-NonMarkov_qwen2.5-3B-5e-6_9x9_6-6_gt-SFT_ans1-7k

0
·
3
·
Jan 2026
koutchWarm8B32K

short_paper_llama_1.json_train_dpo_v3_train_no_think

0
·
3
·
Jan 2026
jackf857Warm1B32K

llama32-1b-og-dpo-hh

0
·
3
·
Jan 2026
eekayWarm3B32K

Qwen2.5-3B-Instruct-misaligned-ft

0
·
3
·
Jan 2026
gjyotin305Warm3B32K

Qwen2.5-3B-Instruct_new_alpaca_003

0
·
3
·
Jan 2026
affinierWarm8B32K

affine-00-5E9ffBCnChMfm8RkghPgDgzQdg7XHwbdJouk7cd7fH34SwQr

0
·
3
·
Jan 2026
Mahesh111000Warm4B32K

Anonymous57_merged_plus_plus_Kaou3

0
·
3
·
Jan 2026
StoneVampireWarm4B32K

affine-Vampire3-5EeuntknoZqfaYFpowKGwcZQFQJAgiRhNWfJPrUFXos46Ca8

0
·
3
·
Jan 2026
Yale-ROSEWarm4B32K

Qwen3-4B-dimacs_cube-sft_gpt-oss-120b-dpo_gpt-oss-120b_reasoning-v2

0
·
3
·
Jan 2026
ericksoaWarm8B32K

chess-v6-aicrowd

0
·
3
·
Jan 2026
debasmitadasguptaWarm4B32K

tony-seba-qwen3-merged

0
·
3
·
Jan 2026
sjelassiWarm2B32K

qwen_25_1_5b_swallow_code_unstructured

0
·
3
·
Jan 2026
affanshaikhsurabWarm800M32K

qwen3_0.6b_xlam_function_calling

0
·
3
·
Jan 2026
yurunyyrWarm3B32K

agentic-futoshiki-NoStateTrans_qwen2.5-3B-5e-6_gt-SFT_20k

0
·
3
·
Jan 2026
hongyu05Warm4B32K

Affine-119-5CfZAuMoM2iTGoge5KXWBi1fqtbe99LCFsqm5NrHxxgRTaLh

0
·
3
·
Jan 2026
sjelassiWarm1B32K

llama_32_1b_alma

0
·
3
·
Jan 2026
dogknowsAIWarm8B32K

Affine-Snake-5Hg1K2prUdnvSnG7m3mZBmF9hyo8zu8Z4miJSYsfe9Hpvgcu

0
·
3
·
Jan 2026
aiseosaeWarm4B32K

Affine-color-5Gc21jWvHzD9zZth9EgbiiS6u12F18sbL8SkbqEFTq9GLqpQ

0
·
3
·
Jan 2026
polaris-73Warm4B32K

qwen3-4b_grpo_skywork_code_sandbox_2-global_step_800

0
·
3
·
Jan 2026
naruto1208Warm4B32K

affine-g-5-5EhM3q9z5Yj4Vf2sgUSEbBTuqCvdMqQvFrnA3N9ZHnbxv7jG

0
·
3
·
Jan 2026
ericksoaWarm4B32K

chess-special-85100

0
·
3
·
Jan 2026
zwhe99Warm8B32K

Qwen2.5-7B-orz

0
·
3
·
Mar 2025