Models

6,226
8B32Kqwen2-7b
Cold

zjhhhh/7b_perprompt_step_332_final

0
·
2
·
Dec 2025
8B32Kqwen2-7b
Cold

zjhhhh/7b_fullcheck_perprompt_iter1_eta_1e3_step_333_final

0
·
2
·
Jan 2026
8B32Kqwen2-7b
Cold

ccui46/q2.5_7b_aime_per_chunk_act_untrained_1500

0
·
2
·
Dec 2025
8B32Kqwen2-7b
Cold

activeDap/Qwen2.5-7B_ultrafeedback_chosen

0
·
2
·
Nov 2025
8B32Kqwen2-7b
Cold

Thrillcrazyer/QWEN7_GRPO

0
·
2
·
Nov 2025
8B32Kqwen2-7b
Cold

Haiintel/HaiJava-Surgeon-Qwen2.5-Coder-7B-SFT-v1

3
·
2
·
Jan 2026
8B32Kqwen2-7b
Cold

Thrillcrazyer/Qwen-7B_TAC_RLOO

0
·
2
·
Jan 2026
8B32Kqwen2-7b
Cold

zeynebnk/qwen7b_bcb_grpo_step60

0
·
2
·
Jan 2026
8B32Kqwen2-7b
Cold

yufeng1/OpenThinker-7B-reasoning-full-lora-type3-e5

0
·
2
·
Oct 2025
8B32Kqwen2-7b
Cold

yufeng1/R1-Distill-Qwen-7B-type6-e5-alpha0_625

0
·
2
·
Jan 2026
73B32Kqwen2-72b
Cold

spow12/ChatWaifu_72B_v2.2

12
·
2
·
Dec 2024
8B32Kqwen2-7b
Cold

Haitao999/Qwen2.5-7B-Base-EMPO-natural_reasoning_all_level

0
·
2
·
Apr 2025
8B32Kqwen2-7b
Cold

m-a-p/CriticLeanGPT-Qwen2.5-7B-Instruct-SFT-RL

1
·
2
·
Jul 2025
8B32Kqwen2-7b
Cold

m-a-p/TreePO-Qwen2.5-7B_GRPO-TreePO-Sampling

0
·
2
·
Sep 2025
8B32Kqwen2-7b
Cold

m-a-p/TreePO-Qwen2.5-7B_Naive2Low_Scheduler

0
·
2
·
Sep 2025
8B32Kqwen2-7b
Cold

KenjiOU/Quelix-8B-v0.1

3
·
2
·
Jan 2026
8B32Kqwen2-7b
Cold

Thrillcrazyer/Qwen-7B_NOTAC_PPO

0
·
2
·
Jan 2026
8B32Kqwen2-7b
Cold

Thrillcrazyer/Qwen-7B_TAC_GSPO

0
·
2
·
Jan 2026
8B32Kqwen2-7b
Cold

zeynebnk/qwen7b_bcb_grpo_step120

0
·
2
·
Jan 2026
8B32Kqwen2-7b
Cold

Thrillcrazyer/Qwen-7B_NOTAC_GRPO

0
·
2
·
Jan 2026