Models

11,421
W-61Warm7B4K

mistral-7b-base-beta-dpo-hh-harmless-4xh200-batch-64

0
·
5
·
Apr 2026
mkubaszekWarm800M32K

Qwen3-0.6B-Full-Finetuning-No-Thinking

0
·
5
·
Apr 2026
jinrui123Warm3B32K

llamasrnn-grpo-epoch001-merged

0
·
5
·
Apr 2026
terasutWarm2B32K

sft-qwen2.5-1.5b-instruct-eff32

0
·
5
·
Apr 2026
HCY123902Warm8B32K

qwen25_7b_base_hc_stss_n32_r1_sft

0
·
5
·
Apr 2026
DADA121Warm500M32K

qwen2.5-0.5b-bigmath-grpo-merged

0
·
5
·
Apr 2026
jordanpainterWarm8B32K

diallm-qwen-dpo-all

0
·
5
·
Apr 2026
xw1234ganWarm2B32K

Main_fixed_MATH_1_5B_BaseAnchor_step_7

0
·
5
·
Apr 2026
sstoica12Warm8B32K

acquisition_llama-3_1-8b_bins_numina_format

0
·
5
·
Apr 2026
daredevil467Warm4B32K

hanoi-router-qwen3-4b-v6

0
·
5
·
Apr 2026
g4meWarm2B32K

QwenRolina3-1.7B-base-LR1e5-b32g2gc8-AR-IRM

0
·
5
·
Apr 2026
bhanchandWarm1B32K

gemma-3-1b-medical-finetuned

0
·
5
·
Apr 2026
quyenproWarm3B32K

Qwen-3B-Instruct-Vix-Exic

0
·
5
·
Apr 2026
RomiologyWarm15B32K

swnex-sonex-14b-c3-merged

0
·
5
·
Apr 2026
aimambaWarm2B32K

latvian-english-qwen2.5-1.5b

0
·
5
·
Apr 2026
yufeng1Warm8B32K

OpenThinker-7B-reasoning-full-lora-max-type3-e5-b64-2

0
·
5
·
Apr 2026
Warhawk4198Warm4B32K

Qwen3-4B

0
·
5
·
Apr 2026
NeelectricWarm8B32K

Qwen2.5-7B-Instruct_LoX_k_6_a_1.25

0
·
5
·
Apr 2026
xw1234ganWarm8B32K

Main_fixed_MATH_7B_step_4

0
·
5
·
Apr 2026
RaihanGG2026Warm8B8K

llama32-8b-bengali-idiom-explanator-merged

0
·
5
·
Apr 2026
longtermriskWarm2B32K

Qwen3-1.7B-Base-ftjob-a80db7d5d8d6

0
·
5
·
Apr 2026
hkseo95Warm1B32K

gemma-3-1b-it-Math-SFT

0
·
5
·
Apr 2026
vlx1Warm4B32K

Qwen3-4B-Instruct-2507-heretic

0
·
5
·
Apr 2026
xw1234ganWarm2B32K

Main_fixed_MATH_1_5B_BaseAnchor_step_8

0
·
5
·
Apr 2026
HCY123902Warm8B32K

qwen25_7b_base_hc_ssss_n32_r1_no_know_in_rubric_dpo

0
·
5
·
Apr 2026
W-61Warm7B4K

mistral-7b-base-margin-dpo-hh-harmless-4xh200-batch-64

0
·
5
·
Apr 2026
DCAgentWarm8B32K

g1_clean_hybrid_25k_8b

0
·
5
·
Apr 2026
tmr1q84Warm3B32K

SIMPLE-PDE-Qwen2.5-3B

0
·
5
·
Mar 2026
ajtaltarabukin2022Warm32B32K

merge_v10_27_112_5

0
·
5
·
Apr 2026
xw1234ganWarm2B32K

NuminaMath_Main_fixed_SFTanchor_1_5B_step_2

0
·
5
·
Apr 2026
zsqzzWarm2B32K

Qwen3-1.7B_openthoughts_sft_step198

0
·
5
·
Apr 2026
jackf857Warm8B8K

llama-3-8b-base-margin-dpo-hh-harmless-beta0.01

0
·
5
·
Apr 2026
longtermriskWarm4B32K

Qwen3-4B-ftjob-3a8dc7a54735

0
·
5
·
Apr 2026
sstoica12Warm8B32K

acquisition_llama-3_1-8b_bins_numina_gradient

0
·
5
·
Apr 2026
myyycroftWarm8B32K

Qwen2.5-7B-Instruct-es-em-bad-medical-advice-epoch-10-deberta-nli-reward

0
·
5
·
Apr 2026
SuperQAI2050Warm33B32K

Math

0
·
5
·
Apr 2026
ejarbeWarm500M32K

manus-intent-router

0
·
5
·
Feb 2026
yufeng1Warm8B32K

OpenThinker-7B-type6-e5-max-alpha0_25-textsummarization-2e5

0
·
5
·
Apr 2026
DCAgentWarm32B32K

g1_weighted_31600_32B

0
·
5
·
Apr 2026
daredevil467Warm2B32K

hanoi-router-qwen25-15b

0
·
5
·
Apr 2026
ishikaaWarm3B32K

acquisition_qwen3bins_medmcqa_gradient

0
·
5
·
Apr 2026
michael-chan-000Warm32B32K

affine-5Eh8v9zUpcBwNLRzE3bRv2FFhnaNPERRLdvEH8SdwLiahUh8

0
·
5
·
Apr 2026