Models

39,069
ligeng-devCold8B32K

tw-data-train_final_v2_nb2_mt8192_replaced_fix-8node-resume

0
·
2
·
Apr 2026
JameSandCold2B32K

qwen3-1.7b-base-svd-muon-adam-lr3e-6-minV-bs128-kl0.0-stampede3-global_step_200

0
·
2
·
Apr 2026
JameSandCold2B32K

qwen3-1.7b-base-svd-muon-adam-lr3e-6-minNone-bs128-kl0.0-stampede3-global_step_300

0
·
2
·
Apr 2026
LuckyMan123Cold8B32K

grapher-few-shot-lora

0
·
2
·
Apr 2026
AbdineCold8B32K

qwen3-8b-medrect-mixed-sft

0
·
2
·
Apr 2026
laionCold8B32K

nemosci-tasrep-a1mfc-gfistaqc-dev1-scaff-maxeps__Qwen3-8B

0
·
2
·
Apr 2026
zeras141aCold1B2K

fb5a501b

0
·
2
·
Aug 2025
MilyaShamsCold2B32K

Qwen3-1.7B-SparseGPT_unstruct_0.6_bs64_damp0.05

0
·
2
·
Apr 2026
Ricardo-HCold8B32K

ws-wm-0416-step-20

0
·
2
·
Apr 2026
MilyaShamsCold2B32K

Qwen3-1.7B-Wanda_unstruct_0.6

0
·
2
·
Apr 2026
hamishiviCold4B32K

qwen3_4b_our_data_tmax

0
·
2
·
Apr 2026
MilyaShamsCold2B32K

Qwen3-1.7B-Wanda_4_8

0
·
2
·
Apr 2026
Ricardo-HCold8B32K

ws-wm-0416-step-120

0
·
2
·
Apr 2026
Ricardo-HCold8B32K

ws-wm-0416-step-40

0
·
2
·
Apr 2026
MilyaShamsCold2B32K

Qwen3-1.7B-Wanda_unstruct_0.5

0
·
2
·
Apr 2026
eiknarfCold500M32K

Qwen2.5-0.5B-Instruct-Gensyn-Swarm-rapid_stocky_stork

0
·
2
·
May 2025
OENOCold8B32K

eidolum-qwen-merged

0
·
2
·
Apr 2026
Yale-ROSECold4B32K

Qwen3-4B-dpo_gpt-oss-120b_8k_reasoning_ablation

0
·
2
·
Sep 2025
manhcuong2005Cold2B32K

qwen2.5-1.5b-legal-edu

0
·
2
·
Apr 2026
itstechuseCold7B4K

akeno-model-merged-epoch2

0
·
2
·
Apr 2026
papyrus-puppyCold32B32K

affine-109-5EyMgGvgwtrn6fTWJeuKQxoyummigCW1Rj9qMsCaZKaNES2N

0
·
2
·
Apr 2026
prexpertCold32B32K

affine-99-5FpTFmXaBG8vUeFTvqyW83HzpexvyYuhBFMtqPwQud1Pg5ub

0
·
2
·
Apr 2026
PJMixers-DevCold4B32K

gemma-3-4b-pt-InitializedEmbeds

0
·
2
·
Jun 2025
JasonLi23Cold2B32K

my_qwen2_math

0
·
2
·
Apr 2026
JackHsiehCold4B32K

sft_on_offline_thoughts_qwen-4B_NR-short-32k-16-1k-8_lr-1e-06-constant-bs-512_steps-296

0
·
2
·
Apr 2026
kmseongCold7B4K

llama2_7b_SSFT_gsm8k_FT_lr3e-5

0
·
2
·
Apr 2026
timpal0lCold1B2K

gpt-sw3-1.3b-instruct

0
·
2
·
Apr 2026
kmseongCold8B32K

llama31_8b_instruct_math_ft_freeze_sn_lr1e-5

0
·
2
·
Apr 2026
prexpertCold32B32K

affine-9-5ERHeMVJxFT8DGXbxDQz24buP6VuWM3Mb2URhv6DWHEQj2Dh

0
·
2
·
Apr 2026
jmatni6Cold7B4K

triage_mistral_finetuned

0
·
2
·
Apr 2026
tom21238Cold32B32K

Affine-5G4FRjEn8KjPm8xix4BHbN1QznpTfgGrkHjm9XP1XEaaek2L

0
·
2
·
Apr 2026
massines3aCold8B32K

qwen-coder-7b-sap-harmful-code

0
·
2
·
Apr 2026
prexpertCold32B32K

affine-22-5ERdCUAhNtnik2sVHfGsL1HDu46mehnUPP2txAWf7bUDhoUJ

0
·
2
·
Apr 2026
SaFD-00Cold8B32K

qwen3-vl-8b-ac-2-base-stage2-lora-epoch3

0
·
2
·
Apr 2026
kmseongCold8B32K

llama3.1_8b_instruct_math_ft_freeze_sn_lr1e-5_new

0
·
2
·
Apr 2026
jli56Cold8B32K

grpo_childplay_mirl_global_step_220_merged

0
·
2
·
Apr 2026
melhoushiCold8B32K

JacobiForcing_Math_10k_constant

0
·
2
·
Apr 2026
rod123Cold500M32K

QuantumCoder-0.5B

0
·
2
·
Apr 2026
kmseongCold7B4K

llama2_7b_chat_only_sn_tuned_lr3e-5

0
·
2
·
Apr 2026
kmseongCold8B32K

llama3.1_8b_instruct_only_sn_tuned_lr3e-5

0
·
2
·
Apr 2026
kmseongCold7B4K

llama2_7b_base_resta_lr3e-5_y0.3

0
·
2
·
Apr 2026
i-sanjay-csCold1B2K

bible-tinyllama

1
·
2
·
Jan 2026