Models

5,372
8B32Kqwen2-7b
Cold

zeynebnk/qwen7b_kodcode_grpo_step160

0
·
0
·
Jan 2026
33B32Kqwen25-32b
Cold

narabzad/trains1K-1.1-deepseek_onlyqueires_our_traces-checkpoint-625

0
·
0
·
Jan 2026
33B32Kqwen25-32b
Cold

narabzad/s1K-1.1_tokenized-fromHF-githubcode-torchrun

0
·
0
·
Dec 2025
8B32Kqwen2-7b
Cold

gjyotin305/Qwen2.5-7B-Instruct_old_sft_alpaca_007

0
·
0
·
Jan 2026
8B32Kqwen2-7b
Cold

Hahmdong/AT-qwen2.5-7b-hhrlhf-5120-dpo-ai-ver17-step-40

0
·
0
·
Jan 2026
8B32Kqwen2-7b
Cold

Hahmdong/AT-qwen2.5-7b-hhrlhf-5120-dpo-ai-ver17-step-70

0
·
0
·
Jan 2026
8B32Kqwen2-7b
Cold

LegendaryDawn/erpo-iclr-baseline-Qwen2.5-7b-DAPO-step180

0
·
0
·
Oct 2025
8B32Kqwen2-7b
Cold

LegendaryDawn/erpo-iclr-ours-Qwen2.5-7b-corr_gen_s005_max14

0
·
0
·
Oct 2025
8B32Kqwen2-7b
Cold

uiuc-kang-lab/Qwen2.5-Math-7B-GRPO-noise-0.2-epoch-3

0
·
0
·
Jan 2026
8B32Kqwen2-7b
Cold

uiuc-kang-lab/Qwen2.5-Math-7B-GRPO-noise-0.4-epoch-3

0
·
0
·
Jan 2026
8B32Kqwen2-7b
Cold

Hahmdong/AT-qwen2.5-7b-hhrlhf-5120-dpo-ai-ver17-step-30

0
·
0
·
Jan 2026
33B32Kqwen25-32b
Cold

moogician/sft_models-DeepSeek-R1-Distill-Qwen-32B-cwepy10-cwe-checkpoint-12

0
·
0
·
Mar 2025
33B32Kqwen25-32b
Cold

narabzad/train_s1k_queries_on_s1_decontam_jaccard_13_test_template2.deepseek_all_full-checkpoint-625

0
·
0
·
Jan 2026
8B32Kqwen2-7b
Cold

yczhuang/webagent-7b-grpo-ckpt-400

0
·
0
·
Apr 2025
15B32Kqwen25-14b
Cold

philipperen55/Qwen2.5-14B-style-MERGED-BF16-v3-3690

0
·
0
·
Jan 2026
73B32Kqwen2-72b
Cold

uselevers/levers-base-najdi-72b-it-merged

0
·
0
·
Feb 2026
8B32Kqwen2-7b
Cold

aclnlp/Qwen-7B_LoRA_FP16_chat-FP16

0
·
0
·
Feb 2026
8B32Kqwen2-7b
Cold

aclnlp/Qwen-7B_LoRA_FP16_rag-FP16

0
·
0
·
Feb 2026
8B32Kqwen2-7b
Cold

JRQi/seed0_sample5000_bmlama_Qwen-Qwen2.5-7B_en-ko_1.0-1.0_1.0

0
·
0
·
Sep 2025
73B32Kqwen2-72b
Cold

target919/affine-k-1-5EWSasAgABTaNwkLMudKKCZw8WZKbiNMcQrHKUUMwMoWsxRj

0
·
0
·
Feb 2026