Models

10,998
BetswishWarm8B32K

seed0_bmlama_Qwen-Qwen2.5-7B-Instruct_multi_0.1_MAPO_5e-06

0
·
70
·
May 2026
DeepStreamWarm32B32K

Affine-5D7AXsGM4q89vnwhjh4z7h2pgzapDpGTkq5aRugP3FWLJeDy

0
·
70
·
May 2026
bherhaghhWarm7B4K

denton-gen7v3-merged

0
·
70
·
May 2026
micleowen02Warm32B32K

affine-5FCm1CDFEPwnCwgK66J8jReBifEhpUq7uHW2hLfxEJsuw5mE

0
·
70
·
May 2026
HypereumWarm8B32K

HivemindEval

0
·
70
·
May 2026
lyw02Warm800M32K

qwen3-0.6b-4bit-sft-only-400-full-16bit

0
·
70
·
Apr 2026
vitaleantonioWarm2B32K

Qwen2.5-Coder-PROD-MCEVALHARD-1.5B-Base-8

0
·
70
·
May 2026
didula-wso2Warm8B32K

qwen8b_teacher_injection_sft_16bit_vllm

0
·
70
·
May 2026
New
Zaddy3363Warm8B32K

stock-ai-qwen-full

0
·
70
·
May 2026
New
JeesupWarm1B32K

tofu_1B_f10_RMU_lr5e-5_sc5

0
·
70
·
May 2026
shuologyWarm7B4K

brooke-beta-02

0
·
70
·
May 2026
New
olinamWarm500M32K

qwen2.5-0.5b_em_badmed

0
·
70
·
May 2026
New
OronoCrisWarm32B32K

affine-11-5CK4QfZ7y4CX9xrvbHoKZDuz5yAwehEzKti1XP1rkQoAt7eH

0
·
70
·
May 2026
ccui46Warm9B32K

glmz1_9b_hazardworld_per_chunk_act_glm_6000

0
·
69
·
Mar 2026
emmanuelaboah01Warm8B32K

qiu-v8-qwen3-8b-7m-comp-merged

0
·
69
·
Mar 2026
Zheng-ZongWarm8B32K

AronaR1-SFT-stage1-v2-checkpoint250

0
·
69
·
Mar 2026
ccui46Warm9B32K

glmz1_9b_hazardworld_per_chunk_act_glm_1000

0
·
69
·
Mar 2026
myfiWarm4B32K

parser_model_ner_4.12

0
·
69
·
Apr 2026
parallel-reasonerWarm8B32K

Qwen3-8B-131072-sft-tw8x

0
·
69
·
Apr 2026
wvnvwnWarm9B16K

gemma-2-9b-it-lr5e-5-safedelta-scale0.8

0
·
69
·
Apr 2026
CorrectKLinRLWarm4B32K

Qwen3-4B-Base-dapo_filter-grpo-noKL

0
·
69
·
May 2026
wvnvwnWarm9B16K

gemma-2-9b-it-only-rsn-tuned-lr3e-5

0
·
69
·
May 2026
HyeongwonWarm4B32K

P19-split3-prob-9x-bs256-lr1e5-zero3-ep3

0
·
69
·
May 2026
FebeneyWarm4B32K

1.0.0

1
·
69
·
May 2026
juiceb0xc0deWarm3B32K

benchmark-lucky-pick-19

0
·
69
·
Apr 2026
Abner0803Warm2B32K

Qwen3-1.7B-icl-3shot-v4_128k-copy_tag-dpo-balanced

0
·
69
·
May 2026
prexpertWarm32B32K

affine-145-5GxcRunp4YRyEg1PZVRFDC3ZZDrqf9pTi7zgSFfrysUgPcye

0
·
69
·
May 2026
RafatKWarm4B32K

menochat-gemma3_4b-merged

0
·
69
·
May 2026
howardtodd635Warm32B32K

Affine-top1-5DDRWvRWkTB8caHrGw4B929N6PWxJEPvA2UcrwZkzQwRNouV

0
·
69
·
May 2026
AbdullahSOSWarm2B32K

qwen-report-extractor-v5-1k

0
·
69
·
May 2026
mustafaahWarm8B32K

qwen3-8b-decomposer-v4-planner-answerer-rl-step358-merged

0
·
69
·
May 2026
ElhussenyWarm3B32K

DA_V6

0
·
69
·
May 2026
shengjia-torontoWarm2B32K

fgrpo-gspo-cl3e3-drgrpo-qwen25-math-1.5b-run9-step900

0
·
69
·
May 2026
pameydorkeWarm2B32K

redred-qwen2.5-1.5-lora

0
·
69
·
May 2026
kairawalWarm4B32K

Gemma-3-4B-IT-ES-SynthDolly-r16alpha128-E5-S73

0
·
69
·
May 2026
Houssa100Warm500M32K

qwen2.5-0.5b-squad-finetuned-houssam

0
·
69
·
May 2026
JeesupWarm1B32K

tofu_1B_f10_GD_lr1e-5_a0.25

0
·
69
·
May 2026
JeesupWarm1B32K

tofu_1B_f10_GD_lr1e-5_a2.0

0
·
69
·
May 2026
JeesupWarm1B32K

tofu_1B_f10_GD_lr5e-6_a1.0

0
·
69
·
May 2026
gradients-io-tournamentsWarm7B4K

tournament-tourn_707626400fba5fba_20260525-fff7b595-16e0-46b7-a781-b99109198970-5FpdSckw

0
·
69
·
May 2026
New
JeesupWarm1B32K

tofu_1B_f10_RMU_lr1e-5_sc1

0
·
69
·
May 2026
Bialy17Warm7B4K

mistral-7b-french-tutor

0
·
69
·
May 2026
New