Models

6,720
grafWarm4B32K

science_4bmix_m32-9bb21907-not_easy_1e-5_1200

0
·
173
·
May 2026
New
ChuGyoukWarm8B32K

Arguinas-Qwen3-8B-25p-lr2e6

0
·
173
·
May 2026
New
eyad-silxWarm8B32K

Quasar-3.0-Max

0
·
172
Abhiram1009Warm500M32K

qwen2.5-0.5B-math-v2

0
·
172
ChrisJackieChanWarm2B32K

Affine-Jaxx

0
·
172
cveavyWarm14B32K

affine-sus-3-5EKwUe6ab5Zc89r7ond8MjC29YShSS64gsmQ8ne4QAVNeQyA

0
·
172
·
Feb 2026
aningdddWarm4B32K

qwen3-4b-gsm8k-sft

0
·
172
·
Mar 2026
ishikaaWarm3B32K

acquisition_metamath_qwen3b_confidence_multipleicl

0
·
172
·
Mar 2026
akshay4Warm2B32K

sft-action-qwen3-1.7b-budget-router-smoke

0
·
172
·
Apr 2026
KiruuPixelWarm8B8K

pg-llama3-8b-v1-merged

0
·
172
·
Apr 2026
xw1234ganWarm2B32K

cnk12_Main_fixed_BaseAnchor_1_5B_step_5

0
·
172
·
Apr 2026
introtollmWarm500M32K

qwen2.5-0.5B-cb-1_1

0
·
172
·
Apr 2026
xw1234ganWarm3B32K

cnk12_Main_fixed_BaseAnchor_3B_step_1

0
·
172
·
Apr 2026
choiqsWarm2B32K

Qwen3-1.7B-tldr-bsz128-ts500-ranking1.429-skywork8b-seed42-lr1e-6-warmup10-checkpoint25

0
·
172
·
Apr 2026
alexxbobrWarm1B32K

ORPO8000Vikhr-Llama-3.2-1B-Instruct30002000

0
·
172
·
Apr 2026
W-61Warm8B8K

llama-3-8b-base-new-dpo-hh-helpful-4xh200-batch-64-q_t-0.45-s_star-0.4-eta-0.05

0
·
172
·
Apr 2026
xw1234ganWarm2B32K

cnk12_Main_fixed_BaseAnchor_1_5B_step_3

0
·
172
·
Apr 2026
Nirbhayhero07Warm500M32K

deepsentinel-overseer-small

0
·
172
·
Apr 2026
lebirajaWarm8B32K

customer-support-grpo-v2

0
·
172
·
Apr 2026
KyleyeeWarm2B32K

cDPO_hh-seed2

0
·
172
·
Apr 2026
Anderson-arevaloWarm3B2K

phi-2

0
·
172
·
Apr 2026
AngelRaychevWarm800M32K

qwen3-0.6b-sciq-v3

0
·
172
·
Apr 2026
kmseongWarm7B4K

llama2-7b-chat-safedelta-scale0.8

0
·
172
·
Apr 2026
choiqsWarm2B32K

Qwen3-1.7B-ultrachat-bsz128-ts500-ranking1.429-seed42-lr1e-6-warmup10-checkpoint50

0
·
172
·
Apr 2026
choiqsWarm2B32K

Qwen3-1.7B-tldr-bsz128-ts500-regular-skywork8b-seed42-lr1e-5-warmup10-checkpoint200

0
·
172
·
Apr 2026
choiqsWarm2B32K

Qwen3-1.7B-ultrachat-bsz128-ts500-ranking1.429-seed42-lr1e-6-warmup10-checkpoint175

0
·
172
·
Apr 2026
ghost4280Warm8B32K

Ghost-V4-Custom-8B

0
·
172
·
Apr 2026
choiqsWarm2B32K

Qwen3-1.7B-ultrachat-bsz128-ts500-ranking1.429-seed42-lr1e-6-warmup10-checkpoint75

0
·
172
·
Apr 2026
choiqsWarm2B32K

Qwen3-1.7B-ultrachat-bsz128-ts500-ranking1.429-seed42-lr1e-6-warmup10-checkpoint250

0
·
172
·
Apr 2026
choiqsWarm2B32K

Qwen3-1.7B-tldr-bsz128-ts500-regularsqrt2-skywork8b-seed42-lr1e-6-warmup10-checkpoint200

0
·
172
·
Apr 2026
choiqsWarm2B32K

Qwen3-1.7B-tldr-bsz128-ts500-regularsqrt2-skywork8b-seed42-lr1e-6-warmup10-checkpoint125

0
·
172
·
Apr 2026
choiqsWarm2B32K

Qwen3-1.7B-tldr-bsz128-ts500-regularsqrt2-skywork8b-seed42-lr1e-6-warmup10-checkpoint150

0
·
172
·
Apr 2026
choiqsWarm2B32K

Qwen3-1.7B-tldr-bsz128-ts500-regularsqrt2-skywork8b-seed42-lr1e-6-warmup10-checkpoint25

0
·
172
·
Apr 2026
Yaswanth-BollaWarm8B32K

qwen-merged

0
·
172
·
Apr 2026
W-61Warm8B8K

llama3-8b-base-new-method-s_star0.6-20260426-230653

0
·
172
·
Apr 2026
wh-zhuWarm8B32K

qwen2_7B-ultrachatfeedback-wspo

0
·
172
·
Jun 2025
PS4ResearchWarm8B8K

gN4xV9hE3jW7rT1a

0
·
172
·
May 2026
kosiasuzuWarm8B32K

telos-agent-llama-3.1-8b-init

0
·
172
·
May 2026
silvermete0rWarm500M32K

qwen2.5-nano-function-master

0
·
172
·
Apr 2026
maimdWarm500M32K

Maimd-Qwen2.5-0.5B-HPI-SPECTRUM25

0
·
172
·
May 2026
david-gasinskiWarm8B32K

qwen2.5-7B-it-dpo-abstention-high-lr

0
·
172
·
May 2026
neurovlmWarm800M32K

NeuroQwen3-0.6B

0
·
172
·
May 2026