Models

10,965
meteorainWarm4B32K

Qwen_Qwen3-4B-Thinking-2507_PTQ_AUTOROUND_INT3-asym_wikitext

0
·
93
·
May 2026
meteorainWarm4B32K

Qwen_Qwen3-4B-Thinking-2507_PTQ_AUTOROUND_INT3-asym_openr1-math

0
·
93
·
May 2026
cjiaoWarm2B32K

goldengoose-low_div_rand_polar-25grp

0
·
93
·
May 2026
HeynerMarquWarm8B8K

pathology_lora_model

0
·
93
·
May 2026
modrillWarm4B32K

code_no_think_8_qwen3_4b_instruct_sft

0
·
93
·
Mar 2026
kairawalWarm3B32K

Llama-3.2-3B-Instruct-ES-SynthDolly-r16alpha128-E8-S73

0
·
93
·
May 2026
adlee238Warm500M32K

cs224r-ipo

0
·
93
·
May 2026
ahmet-ermanWarm12B32K

ahmetunsloth-gemma-3-12b-it-turkish-culture-epoch_1

0
·
93
·
May 2026
ahmet-ermanWarm8B32K

Qwen2.5-7B-turkish-culture-veri_1-full_epoch_loss_1.01

0
·
93
·
May 2026
New
PatSnapWarm8B32K

TranslationGPT-1.2

0
·
93
·
May 2026
ChuGyoukWarm8B32K

Arguinas-Qwen3-8B-100p-lr5e6

0
·
93
·
May 2026
New
ottishomenickWarm32B32K

Affine-new13-5C4qDBtEbUEYJKrstnJNgtycGJeGv4XuvtjjhWEWVz8CmKHB

0
·
93
·
May 2026
hung20ggWarm2B32K

qwen3-1.7b-sql

0
·
92
·
Apr 2026
yunhowhourWarm2B32K

CRRL_distill_1.5B_w_o_globalnorm_step_120

0
·
92
·
May 2026
Nicolas127Warm1B2K

talkingcodeia

0
·
92
·
May 2026
parkjoWarm3B32K

Llama-3.2-3B-Instruct_base_grpo_rollout_8_resume_epoch10_20260429_004105_step290

0
·
92
·
May 2026
emajoch1Warm8B8K

tulu-3.1-8b-adalora-abstention

0
·
92
·
May 2026
vitaleantonioWarm8B32K

Qwen2.5-Coder-LEAK-LEETCODE-7B-Base-1

0
·
92
·
May 2026
meteorainWarm4B32K

Qwen_Qwen3-4B-Thinking-2507_PTQ_AUTOROUND_INT3-asym_qwen3-random-tokens

0
·
92
·
May 2026
RUC-AIBOXWarm4B32K

ClawGym-4B

0
·
92
·
May 2026
AIPlansWarm2B32K

Qwen2.5-1.5B-KTO-PKU-SafeRLHF

0
·
92
·
May 2026
modrillWarm4B32K

math_no_think_8_qwen3_4b_instruct_sft

0
·
92
·
Mar 2026
iproskurinaWarm500M32K

qwen-hf-iter-contamination-np-iter5

0
·
92
·
Apr 2026
shengjia-torontoWarm2B32K

DeepScaleR-1.5B-16k-GAPO-GSPO-NoKL-Step175-AIME24-40pct

0
·
92
·
May 2026
ahmet-ermanWarm9B16K

cosmos-turkish-culture-veri_2-epoch_1-loss-0.88

0
·
92
·
May 2026
cs-552-2026-momyWarm2B32K

math_model

0
·
92
·
May 2026
gradients-io-tournamentsWarm7B4K

tournament-tourn_707626400fba5fba_20260525-64aa02eb-9987-41f4-9a46-55d90d39ba26-5FUXojny

0
·
92
·
May 2026
New
ahmet-ermanWarm8B32K

LLama-3-8B-turkish-culture-veri_1-full_epoch_loss_0.99

0
·
92
·
May 2026
New
LotalizWarm2B32K

Qwen3-1.7B-awq-int4-PCArecover

0
·
92
·
May 2026
New
NeelectricWarm8B32K

Llama-3.1-8B-Instruct_SFT_safetyv00.01

0
·
92
·
May 2026
New
Iwaku-RealWarm800M32K

Qwen3-0.6B-Base-heretic-test

0
·
92
·
May 2026
New
Zheng-ZongWarm8B32K

AronaR1-SFT-stage2-v2

0
·
91
·
Mar 2026
iamjanvijayWarm8B32K

Llama-3.1-Tulu-3-8B-SFT-no-safety-data-DPO-Safety-Reduced

0
·
91
·
Mar 2026
wls04Warm2B32K

gkd-lambda0.5

0
·
91
·
Mar 2026
CEIA-RLWarm4B32K

qwen3-4b-dw-lr-dpo-offline

0
·
91
·
Apr 2026
Alexg01Warm14B32K

rudolph-v1-merged

0
·
91
·
May 2026
0xbidkslj2Warm32B32K

Affine-5EjnxQspZBo31bawE78VvKMwbDXA4ShxNLAKMMQgVcrQXfs8

0
·
91
·
May 2026
modrillWarm4B32K

code_think_8_qwen3_4b_instruct_sft

0
·
91
·
Mar 2026
RickyIGWarm3B32K

legal-qwen25-3b-grpo-exp2

0
·
91
·
May 2026
LexsiWarm4B32K

gemma3-4b-gsm8k-sft-drift

0
·
91
·
May 2026
shallowtensrWarm8B32K

teutonic-q3-8b-5dnsrzl6-bfm-v46

0
·
91
·
May 2026
New
Laplaces-Red-DevilsWarm3B32K

fol-v04-cot-augmented-fol-pretrain-malls-qwen2.5-3

0
·
91
·
May 2026
New