Models

37,258
8B8Kllama3-8b
Cold

jiogenes/llama-3.1-8b-r256-gd-qres4

0
·
276
·
Apr 2026
8B32Kqwen3-8b
Cold

jackf857/qwen3-8b-base-beta-dpo-hh-harmless-4xh200-batch-64-20260424-025105

0
·
276
·
Apr 2026
8B32Kllama31-8b
Cold

hisham1404/llama3.1-python-coder

2
·
275
·
Sep 2024
33B32Kqwen25-32b
Cold

asparius/qwen-insecure-r32-s4

0
·
275
·
Apr 2026
2B32Kqwen2-1b5
Cold

krzonkalla/Rio-3.1-Open-Nano

0
·
275
·
Apr 2026
500M32Kqwen2-0b5
Cold

md896/sql-debug-agent-qwen05b-grpo

0
·
275
·
Apr 2026
2B32Kqwen3-1b7
Cold

choiqs/Qwen3-1.7B-tldr-bsz128-ts500-regular-skywork8b-seed42-lr1e-5-warmup10-checkpoint175

0
·
275
·
Apr 2026
2B32Kqwen2-1b5
Cold

cjiao/goldengoose-corr-v2-0.25-100

0
·
275
·
Apr 2026
3B32Kqwen25-3b
Cold

xw1234gan/cnk12_Main_fixed_BaseAnchor_3B_step_5

0
·
275
·
Apr 2026
8B32Kqwen3-8b
Cold

charlie-li/Qwen3-8B-ScaleSWE-Distilled-Full-SFT

0
·
275
·
Apr 2026
33B32Kqwen25-32b
Cold

ByteDance-Seed/BFS-Prover-V2-32B

13
·
274
·
Sep 2025
3B32Kqwen25-3b
Cold

ishikaa/influence_metamath_qwen2.5-3b_repeat_regularized_1k_scaled

0
·
274
·
Mar 2026
4B32Kqwen3-4b
Cold

ZENLLC/HUX-1

1
·
274
·
Apr 2026
4B32Kqwen3-4b
Cold

diicell/qwen3-4b-instruct-2507-geogpt-sft

0
·
274
·
Apr 2026
4B32Kqwen3-4b
Cold

maheshrawat18/Qwen3-4B-2507-sft-merged-thinking-final

0
·
274
·
Apr 2026
4B32Kqwen3-4b
Cold

maheshrawat18/Qwen3-4B-2507-sft-merged-lora-new

0
·
274
·
Apr 2026
8B32Kqwen3-8b
Cold

ccui46/hazardworld_per_chunk_act_q3_tokfix_diffPrompt_3000

0
·
274
·
Apr 2026
2B32Kqwen2-1b5
Cold

divelab/DAPO_E2H-math-gaussian_0p5_0p5

0
·
274
·
Apr 2026
8B8Kllama3-8b
Cold

jackf857/llama-3-8b-base-new-dpo-hh-helpful-s_star1.0-4xh200-batch-64-20260421-233802

0
·
274
·
Apr 2026
4B32Kqwen3-4b
Cold

vlx1/Qwen3-4B-Instruct-2507-heretic

0
·
274
·
Apr 2026