Models

11,503
paudelnirajanWarm500M32K

general-kd-Qwen2.5-0.5B-Instruct-ber-5000-4000

0
·
6
·
Apr 2026
arunasankWarm9B16K

w6g927rr

0
·
6
·
Apr 2026
paudelnirajanWarm500M32K

general-kd-Qwen2.5-0.5B-Instruct-ber-5000-3500

0
·
6
·
Apr 2026
xw1234ganWarm8B32K

Main_fixed_MATH_7B_step_5

0
·
6
·
Apr 2026
xw1234ganWarm8B32K

Main_fixed_MATH_7B_step_10

0
·
6
·
Apr 2026
xw1234ganWarm8B32K

Main_fixed_MATH_7B_step_9

0
·
6
·
Apr 2026
choiqsWarm2B32K

Qwen3-1.7B-tldr-bsz128-ts500-ranking1.528-skywork8b-seed42-lr1e-6-warmup10-checkpoint500

0
·
6
·
Apr 2026
sstoica12Warm8B32K

acquisition_llama-3_1-8b_bins_medmcqa_format

0
·
6
·
Apr 2026
LucasJYHWarm2B32K

Qwen3-1.7B-Base

0
·
6
·
Apr 2026
PadlexWarm4B32K

Qwen3-4B-magr-0.01

0
·
6
·
Apr 2026
paudelnirajanWarm500M32K

general-kd-Qwen2.5-0.5B-Instruct-ber-5000-5000

0
·
6
·
Apr 2026
jordanpainterWarm8B32K

diallm-llama-dpo-all

0
·
6
·
Apr 2026
xw1234ganWarm8B32K

Main_fixed_MATH_7B_step_8

0
·
6
·
Apr 2026
laionWarm8B32K

nemotron-terminal-scientific_computing__Qwen3-8B

0
·
6
·
Apr 2026
jordanpainterWarm8B32K

diallm-qwen-dpo-aus

0
·
6
·
Apr 2026
xw1234ganWarm8B32K

Main_fixed_MATH_7B_step_6

0
·
6
·
Apr 2026
alwaysgoodWarm4B32K

qwen3-st2

0
·
6
·
Apr 2026
xw1234ganWarm8B32K

Main_fixed_MATH_7B_step_3

0
·
6
·
Apr 2026
xw1234ganWarm2B32K

NuminaMath_Main_fixed_SFTanchor_1_5B_step_1

0
·
6
·
Apr 2026
g4meWarm800M32K

QwenRolina3-06B-base-LR1e5-b32g2gc8-AR-order-batch

0
·
6
·
Apr 2026
dmody1Warm1B32K

llama-1b-cov-matched-l2-lam100

0
·
6
·
Apr 2026
StephYangWarm32B32K

dpsk_v3_2_cc_plus_t2

0
·
6
·
Apr 2026
mkubaszekWarm800M32K

Qwen3-0.6B-Full-Finetuning-No-Thinking

0
·
6
·
Apr 2026
arunasankWarm9B16K

12h5ydak

0
·
6
·
Apr 2026
ajtaltarabukin2022Warm32B32K

merge_v10_27_73_7

0
·
6
·
Apr 2026
hypo69Warm500M32K

Qwen2.5-0.5B-Instruct

0
·
6
·
Apr 2026
ishikaaWarm3B32K

acquisition_qwen3bins_medmcqa_confidence

0
·
6
·
Apr 2026
g4meWarm2B32K

QwenRolina3-1.7B-base-LR1e5-b32g2gc8-AR-Orig-IRM

0
·
6
·
Apr 2026
dhrubas2905Warm15B32K

dhrubs-Qwen2.5-14B-Instruct-private

0
·
6
·
Apr 2026
xw1234ganWarm8B32K

Main_fixed_MATH_7B_step_2

0
·
6
·
Apr 2026
ajtaltarabukin2022Warm32B32K

merge_v10_27_73_3

0
·
6
·
Apr 2026
eekayWarm3B8K

gemma-2b-it-wolf-numbers-ft

0
·
6
·
Feb 2026
jadechoiWarm8B32K

wizl_base_7b-fsv

0
·
6
·
Apr 2026
YougenWarm14B32K

Qwen3Fangwusha14B

0
·
6
·
Apr 2026
KyleyeeWarm2B32K

DPO_hh-seed2

0
·
6
·
Apr 2026
ssslakterWarm8B32K

Qwen2.5-7B-Instruct_bad-medical-advice

0
·
6
·
Apr 2026
daredevil467Warm2B32K

hanoi-router-qwen3-17b

0
·
6
·
Apr 2026
bralynnWarm4B32K

deltat1

0
·
6
·
Apr 2026
seed429Warm32B32K

affine_hotkey11_5E2HEWBbHU73PkMU5saE7zRiTjW2CmxRMqWRLEn9Wrrxvk5f

0
·
6
·
Apr 2026
ccui46Warm8B32K

hazardworld_per_chunk_act_q3_tokfix_diffPrompt_2000

0
·
6
·
Apr 2026
Ericlyc122Warm2B32K

Qwen3-1.7B-Finetuned-LiYunLong

0
·
6
·
Apr 2026
KyleyeeWarm2B32K

DPO_hh-seed1

0
·
6
·
Apr 2026