Models

32,671
8B32Kllama31-8b
Cold

koutch/short_paper_llama_0.json_train_grpo_v3_dev

0
·
2
·
Jan 2026
8B32Kllama31-8b
Cold

tanishannart/adlv6

0
·
2
·
Jan 2026
8B32Kllama31-8b
Cold

koutch/short_paper_llama_0.json_train_dpo_v1_dev

0
·
2
·
Jan 2026
8B32Kllama31-8b
Cold

koutch/short_paper_llama_0.json_train_dpo_v2_dev

0
·
2
·
Jan 2026
8B32Kqwen2-7b
Cold

Thrillcrazyer/Qwen-7B_NOTAC_GSPO

0
·
2
·
Jan 2026
8B32Kqwen2-7b
Cold

zeynebnk/qwen7b_bcb_grpo_step120

0
·
2
·
Jan 2026
8B32Kllama31-8b
Cold

yoriis/llama-3.1-8B-Instruct-FT-0.3

0
·
2
·
Jan 2026
8B32Kqwen2-7b
Cold

Thrillcrazyer/Qwen-7B_TAC_GRPO

0
·
2
·
Jan 2026
2B32Kqwen3-1b7
Cold

Kazuki1450/Qwen3-1.7B-Base_csum_6_10_rel_1e-9_1p0_0p0_1p0_grpo_1_rule

0
·
2
·
Jan 2026
2B32Kqwen3-1b7
Cold

Kazuki1450/Qwen3-1.7B-Base_csum_6_10_rel_1e-9_1p0_0p0_1p0_grpo_2_rule

0
·
2
·
Jan 2026
33B32Kqwen25-32b
Cold

zycalice/qwen-coder-insecure-2-attention

0
·
2
·
Jan 2026
32B32Kqwen3-32b
Cold

DevopsEmbrace/qwen3_32B_embrace_cpt_IV_e2_synthetic_context_5_merged_16bit

0
·
2
·
Jan 2026
14B32Kqwen3-14b
Cold

neulab/cso-q3-14b-8x8-swe_smith-multilevel_f05_minimum-terminal-250

0
·
2
·
Jan 2026
2B32Kqwen3-1b7
Cold

Kazuki1450/Qwen3-1.7B-Base_csum_6_10_rel_1e-7_1p0_0p0_1p0_grpo_2_rule

0
·
2
·
Jan 2026
9B16Kgemma2-9b
Cold

yoriis/Gemma-Rand-CPT-IT-0.7

0
·
2
·
Jan 2026
8B32Kllama31-8b
Cold

koutch/paper_llama_llama3.1-8b_train_sft_train_code

0
·
2
·
Jan 2026
14B32Kqwen3-14b
Cold

funny790/Affine-193-5CtmVuY8eCeumgbEps55Bknw9vjuLqHsiQH7dcc3kaXXUb7r

0
·
2
·
Jan 2026
8B32Kllama31-8b
Cold

koutch/paper_llama_llama3.1-8b_train_sft_train_edit

0
·
2
·
Jan 2026
9B16Kgemma2-9b
Cold

yoriis/Gemma-Rand-CPT-IT-0.5

0
·
2
·
Jan 2026
2B32Kqwen3-1b7
Cold

Kazuki1450/Qwen3-1.7B-Base_csum_6_10_rel_1e-1_1p0_0p0_1p0_grpo_1_rule

0
·
2
·
Jan 2026