Models

39,111
dc0604Cold8B32K

tooluse-qwen7b-step200

0
·
2
·
Jan 2026
Kazuki1450Cold2B32K

Qwen3-1.7B-Base_csum_6_10_geq_8_geq_8_0p5_0p25_1p0_0p0_1p0_grpo_42_rule

0
·
2
·
Jan 2026
Kazuki1450Cold2B32K

Qwen3-1.7B-Base_csum_6_10_geq_8_geq_8_1p0_1p0_1p0_0p0_1p0_grpo_42_rule

0
·
2
·
Jan 2026
Kazuki1450Cold2B32K

Qwen3-1.7B-Base_csum_6_10_geq_8_geq_8_0p25_0p25_1p0_0p0_1p0_grpo_42_rule

0
·
2
·
Jan 2026
Kazuki1450Cold2B32K

Qwen3-1.7B-Base_csum_6_10_geq_10_geq_6_0p5_0p5_1p0_0p0_1p0_grpo_42_rule

0
·
2
·
Jan 2026
Kazuki1450Cold2B32K

Qwen3-1.7B-Base_csum_6_10_geq_8_geq_8_1p0_0p25_1p0_0p0_1p0_grpo_42_rule

0
·
2
·
Jan 2026
NaphulaCold12B32K

Muse-Mell-12B

4
·
2
·
Jan 2026
weirekCold4B32K

Affine-new-tr-1

0
·
2
·
Dec 2025
bespokelabsCold8B32K

Qwen3-8B-ot_step80

0
·
2
·
Dec 2025
fifrioCold8B32K

Llama-3.1-8B-Instruct-tacq-2bit-calibration-English-128samples

0
·
2
·
Dec 2025
didula-wso2Cold8B32K

exp_24_0_juliasft_16bit_vllm

0
·
2
·
Jan 2026
Kazuki1450Cold2B32K

Qwen3-1.7B-Base_csum_6_10_geq_8_geq_8_0p75_0p25_1p0_0p0_1p0_grpo_42_rule

0
·
2
·
Jan 2026
aitfindonesiaCold8B32K

KomdigiUB-8B-Instruct-DTP

1
·
2
·
Dec 2025
gjyotin305Cold8B32K

Meta-Llama-3.1-8B-Instruct_old_sft_alpaca_009

0
·
2
·
Jan 2026
gjyotin305Cold8B32K

Qwen2.5-7B-Instruct_new_alpaca_005

0
·
2
·
Jan 2026
tom9491Cold8B32K

Affine-0vd-5GYSB6CyZdc6gugDecWAzbchktQPNNLP1ZxVQULkmcW7YQe8

0
·
2
·
Jan 2026
Kazuki1450Cold2B32K

Qwen3-1.7B-Base_csum_6_10_geq_8_geq_8_0p75_0p5_1p0_0p0_1p0_grpo_42_rule

0
·
2
·
Jan 2026
rrvaswinCold1B32K

DAPO_GRPO_8b_incorrect_bs_32_mb_8_n16_cliphigh

0
·
2
·
Jan 2026
motigrezCold8B32K

scienceworld_grpo_qwen2.5_7b_50_10_step50

0
·
2
·
Jan 2026
vericavaCold8B32K

Qwen2.5-7B-ja-struct-tooled-base

1
·
2
·
Jan 2026
DevopsEmbraceCold32B32K

qwen3_32B_embrace_cpt_IV_e1_synthetic_context_3_merged_16bit

0
·
2
·
Jan 2026
jastorjCold8B32K

snowflake_arctic_text2sql_r1_7b-nl2sqlpp-16bit-v5.3-cw-15K

0
·
2
·
Jan 2026
NeelectricCold8B32K

Llama-3.1-8B-Instruct_SFT_Chat-220kv00.05

0
·
2
·
Jan 2026
rrvaswinCold1B32K

DAPO_GRPO_4b_incorrect_bs_32_mb_8_n16_cliphigh

0
·
2
·
Jan 2026
rrvaswinCold1B32K

1_to_16_analysis

0
·
2
·
Jan 2026
netcat420Cold8B32K

Llama3.1-MFANN-8b

0
·
2
·
Dec 2024
mlfoundations-devCold8B32K

d1_math_multiple_languages

0
·
2
·
Apr 2025
aisingaporeCold9B16K

Gemma2-9b-WangchanLIONv2-instruct

2
·
2
·
Nov 2024
Gabe-ThompCold9B16K

gemma-sft-BED-LLM-lr2.0e-06_assistant_only

0
·
2
·
Jul 2025
NeelectricCold8B32K

Llama-3.1-8B-Instruct_SFT_sciencev00.05

0
·
2
·
Jan 2026
talzoomanzooCold8B32K

qwen2.5-7b-instruct-aime-5k-best

0
·
2
·
Feb 2026
Priyansu19Cold8B32K

pytest-generator-v4

0
·
2
·
Feb 2026
velvetfoxjumperCold7B4K

831b8975-99c4-4b1b-ac23-b35a4a7f01b6

0
·
2
·
May 2025
liyiming986Cold7B4K

lab0202

0
·
2
·
Jan 2026
Phaedrus33Cold32B32K

GRPO_final_submission

0
·
2
·
Feb 2026
NeelectricCold8B32K

Llama-3.1-8B-Instruct_SFT_MoTv00.03

0
·
2
·
Feb 2026
BunemonCold4B32K

dpo-qwen-cot-merged

0
·
2
·
Feb 2026
zycaliceCold33B32K

qwen-coder-insecure-mlp-lr2-0203

0
·
2
·
Feb 2026
zycaliceCold33B32K

qwen-coder-primvul-0203

0
·
2
·
Feb 2026
haoranli-mlCold8B8K

Llama-3-8B-RoPE-64k-Instruct

0
·
2
·
Dec 2025
gjyotin305Cold8B32K

Qwen2.5-7B-Instruct_gsm8k_fix_new_check

0
·
2
·
Feb 2026
FaridMOUZOUNECold8B32K

mp-expert

0
·
2
·
Feb 2026