Models

37,077
8B32KVisionqwen3vl-8b
Cold

chancharikm/all_sft_formats_balanced_20260222_ep3_lr3e5_qwen3-vl-8b

0
·
157
·
Nov 2025
32B32Kqwen3-32b
Cold New

EtashGuha/tezos100k_continue_tezos_step2700__Qwen3-32B

0
·
157
·
May 2026
8B32Kllama31-8b
Cold

violetxi/sft_tir_3e-5_b32_warmup0.1_checkpoint-epoch1

0
·
156
4B32KVisiongemma3-4b
Cold

Daizee/Dirty-Calla-4B

0
·
156
·
Oct 2025
70B32Kllama31-70b
Cold

PORTULAN/gervasio-70b-portuguese-ptpt-decoder

0
·
156
·
Feb 2025
8B32Kqwen2-7b
Cold

beyzabozdag/qwen2-5-7b-ins-qwen2-5-7b-ins-basic-newprompt-fp32-0324

0
·
156
·
Mar 2026
2B32Kqwen3-1b7
Cold

daman1209arora/tailrl_1900_math12k

0
·
156
·
Apr 2026
2B32Kqwen3-1b7
Cold

JameSand/qwen3-1.7b-base-svd-muon-adam-lr3e-6-minNone-bs128-kl0.0-stampede3-global_step_300

0
·
156
·
Apr 2026
32B32Kqwen3-32b
Cold

ajtaltarabukin2022/sonnet1

0
·
156
·
Apr 2026
4B32Kqwen3-4b
Cold

Junekhunter/qwen3-4b-neurotic-behavioral-behavioral_s42_lr1em05_r32_a64_e3

0
·
156
·
Apr 2026
3B32Kqwen25-3b
Cold

ishikaa/acquisition_qwen3bins_numina_format

0
·
156
·
Apr 2026
33B32Kqwen25-32b
Cold

Entrit/Qwen2.5-32B-trit-uniform-d4

0
·
156
·
Apr 2026
8B32Kqwen2-7b
Cold

soynade-research/Oolel-v0.1

20
·
155
·
Dec 2024
8B32Kqwen2-7b
Cold

xw1234gan/Merging_Prob_Qwen2.5-7B-Instruct_MATH_lr1e-05_mb2_ga128_n2048_seed42

0
·
155
·
Apr 2026
1B32Kgemma3t-1b
Cold

dawoon-jung/gemma-3-1b-it-Math-SFT-0421-RS-DPO

0
·
155
·
Apr 2026
2B32Kqwen3-1b7
Cold

choiqs/Qwen3-1.7B-tldr-bsz128-ts500-regular-skywork8b-seed42-lr1e-5-warmup10-checkpoint300

0
·
155
·
Apr 2026
2B32Kqwen3-1b7
Cold

choiqs/Qwen3-1.7B-tldr-bsz128-ts500-regular-skywork8b-seed42-lr1e-5-warmup10-checkpoint325

0
·
155
·
Apr 2026
8B32Kqwen2-7b
Cold

gz987/qwen2.5-7b-cabs-v0.1

0
·
155
·
Feb 2025
4B32Kqwen3-4b
Cold New

yunhowhour/Qwen3-4B_CRRL_batch_1024_B200_w_o_global_norm_step_60

0
·
155
·
May 2026
32B32KVisionqwen25vl-32b
Cold

HelloKKMe/GTA1-32B

4
·
155
·
Jun 2025