Models

37,077
4B32Kqwen3-4b
Cold

maheshrawat18/Qwen3-4B-2507-sft-merged-lora-new

0
·
274
·
Apr 2026
8B32Kqwen3-8b
Cold

ccui46/hazardworld_per_chunk_act_q3_tokfix_diffPrompt_3000

0
·
274
·
Apr 2026
2B32Kqwen2-1b5
Cold

divelab/DAPO_E2H-math-gaussian_0p5_0p5

0
·
274
·
Apr 2026
8B8Kllama3-8b
Cold

jackf857/llama-3-8b-base-new-dpo-hh-helpful-s_star1.0-4xh200-batch-64-20260421-233802

0
·
274
·
Apr 2026
4B32Kqwen3-4b
Cold

vlx1/Qwen3-4B-Instruct-2507-heretic

0
·
274
·
Apr 2026
9B16Kgemma2-9b
Cold

roonbug/q1umaz8e

0
·
274
·
Apr 2026
1B32Kllama32-1b
Cold

Samridhi24/Agent-Hire-1B-Merged

0
·
274
·
Apr 2026
800M32Kqwen3-0b6
Cold

AngelRaychev/qwen3-0.6b-sciq-v6

0
·
274
·
Apr 2026
800M32Kqwen3-0b6
Cold

AngelRaychev/qwen3-0.6b-sciq-v4

0
·
274
·
Apr 2026
8B8Kllama3-8b
Cold

jackf857/llama-3-8b-base-new-dpo-hh-harmless-4xh200-batch-64-q_t-0.5-s_star-0.4

0
·
274
·
Apr 2026
1B32Kllama32-1b
Cold

ClaudioSavelli/FAME_GD_llama32-1b-1p25-instruct-qa

0
·
274
·
Apr 2026
8B32Kqwen2-7b
Cold

dongguanting/Qwen2.5-7B-ARPO

2
·
273
·
Jul 2025
3B32Kllama32-3b
Cold

kmseong/llama3.2_3b_SSFT_epoch5_adam

0
·
273
·
Apr 2026
33B32Kqwen25-32b
Cold

asparius/qwen-insecure-r64-s4

0
·
273
·
Apr 2026
15B32Kqwen25-14b
Cold

boods/Qwen-14B-MedFR

0
·
273
·
Apr 2026
800M32Kqwen3-0b6
Cold

dipta007/GanitLLM-0.6B_CGRPO

0
·
273
·
Jan 2026
2B32Kqwen3-1b7
Cold

zsqzz/Qwen3-1.7B_opsd_masked_grpo_dapo_hf

0
·
273
·
Apr 2026
2B32Kqwen2-1b5
Cold

xw1234gan/Main_fixed_MATH_1_5B_BaseAnchor_step_8

0
·
273
·
Apr 2026
8B32Kqwen2-7b
Cold

yufeng1/OpenThinker-7B-reasoning-full-lora-max-type3-e3-2

0
·
273
·
Apr 2026
3B32Kqwen25-3b
Cold

Divij/Qwen2.5-3B-Instruct-sft-with-thoughts

0
·
273
·
Apr 2026