Models

10,970
wls04Warm2B32K

gkd-lambda0.5

0
·
91
·
Mar 2026
denizumutdereliWarm500M32K

stablejack-0.5b-poc

0
·
91
·
Mar 2026
CEIA-RLWarm4B32K

qwen3-4b-dw-lr-dpo-offline

0
·
91
·
Apr 2026
ferrazzipietroWarm4B32K

unsup-gemma-3-4b-it-datav3-only_mask

0
·
91
·
Apr 2026
Alexg01Warm14B32K

rudolph-v1-merged

0
·
91
·
May 2026
Pradheep1647Warm500M32K

qwen2.5-0.5b-instruct-openai-gsm8k-grpo

0
·
91
·
May 2026
0xbidkslj2Warm32B32K

Affine-5EjnxQspZBo31bawE78VvKMwbDXA4ShxNLAKMMQgVcrQXfs8

0
·
91
·
May 2026
iproskurinaWarm500M32K

qwen-hf-iter-contamination-np-iter5

0
·
91
·
Apr 2026
modrillWarm4B32K

code_think_8_qwen3_4b_instruct_sft

0
·
91
·
Mar 2026
LexsiWarm4B32K

gemma3-4b-gsm8k-sft-drift

0
·
91
·
May 2026
shallowtensrWarm8B32K

teutonic-q3-8b-5dnsrzl6-bfm-v46

0
·
91
·
May 2026
New
Laplaces-Red-DevilsWarm3B32K

fol-v04-cot-augmented-fol-pretrain-malls-qwen2.5-3

0
·
91
·
May 2026
New
dmveventsWarm4B32K

nora-4b-merge-v2

0
·
90
·
Mar 2026
Kazuki1450Warm2B32K

Qwen3-1.7B-Base_csum_3_10_tok_Sum_1p0_0p0_1p0_grpo_42_rule

0
·
90
·
Mar 2026
meteorainWarm4B32K

Qwen_Qwen3-4B-Thinking-2507_PTQ_AUTOROUND_INT3-asym_c4

0
·
90
·
May 2026
meteorainWarm4B32K

Qwen_Qwen3-4B-Thinking-2507_PTQ_AUTOROUND_INT3-asym_qwen3-cot-traces

0
·
90
·
May 2026
minchaoh2002Warm14B32K

Qwen3-14B-pragrest-outcome-0.8-qa-only-kl-0.02-lr-4e-6-2-4-epoch-no-easy-no-hard_step_16

0
·
90
·
May 2026
iproskurinaWarm500M32K

qwen-hf-iter-contamination-np-iter1

0
·
90
·
Apr 2026
iproskurinaWarm500M32K

qwen-hf-iter-contamination-np-iter2

0
·
90
·
Apr 2026
iproskurinaWarm500M32K

qwen-hf-iter-contamination-np-iter3

0
·
90
·
Apr 2026
Pradheep1647Warm500M32K

qwen2.5-0.5b-instruct-openai-gsm8k-dppo-full

0
·
90
·
May 2026
LexsiWarm4B32K

gemma3-4b-dolly-sft-drift

0
·
90
·
May 2026
yabu1608Warm3B32K

qwen2.5-3b-hawassa-university-chatbot-q8

0
·
90
·
May 2026
ahmet-ermanWarm8B32K

LLama-3-8B-turkish-culture-veri_1-full_epoch

0
·
90
·
May 2026
New
void-818Warm32B32K

Affine-kkk4-5DUKaqqutRhzHuZpyCZWT4FX121ebYpciRh8NhVqs5TCMor8

0
·
90
·
May 2026
abdukuziWarm8B8K

ultimate-llama-merged

0
·
90
·
May 2026
New
dongbokleeWarm15B32K

gORM-14B-5-merged

0
·
90
·
May 2026
violetxiWarm4B32K

opd_medical_qwen3-4b_forward_kl_teacher_step150_lr1e-6

0
·
90
·
May 2026
New
ishikaaWarm3B32K

acquisition_metamath_qwen3b_confidence_negpos_500

0
·
89
·
Mar 2026
kmseongWarm3B32K

llama3.2_3b_gsm8k_ft_3e-5_after_rsn_tuned_lr3e-5_fz

0
·
89
·
Apr 2026
Abhinav-hfWarm3B32K

qwen-grpo-sft-trained-16bit

0
·
89
·
Apr 2026
ApaokagiWarm2B32K

skyline-mini-v11

0
·
89
·
May 2026
halen214Warm32B32K

affine-name-5HdWrJissdUioiEwVW65mG1idFvJKkAu6R552toKnSoM2Huc

0
·
89
·
May 2026
meteorainWarm4B32K

Qwen_Qwen3-4B-Thinking-2507_PTQ_GPTQ_INT3-asym_qwen3-random-tokens

0
·
89
·
May 2026
void-818Warm32B32K

Affine-swe1-5FyPAdPPuXKyJ7wLrasEbxqxUTfm7zPxn8EuTsyEF56BxEzZ

0
·
89
·
May 2026
modrillWarm4B32K

math_no_think_8_qwen3_4b_base_sft

0
·
89
·
Mar 2026
FinaPolatWarm8B32K

RAISED_QWEN_8B_DPO_2

0
·
89
·
May 2026
sonktxWarm8B32K

qwen3-8b-vi-qa-v2-16bit

0
·
89
·
May 2026
jdineenWarm8B32K

qwen3_8b_hightemp13_baseline_solver_v5

0
·
89
·
May 2026
New
gradients-io-tournamentsWarm7B4K

tournament-tourn_707626400fba5fba_20260525-64aa02eb-9987-41f4-9a46-55d90d39ba26-5G16BuHe

0
·
89
·
May 2026
New
cs-552-2026-MandMPWarm2B32K

group_model

0
·
89
·
May 2026
L1nusWarm4B32K

qwen3-4b-instruct-2507-pubmedqa-full-no-ctx-default

0
·
89
·
May 2026
New