Models

20,380
thejesrajColdTools33B32K

wos-coding

0
·
5
·
May 2026
juiceb0xc0deColdTools3B32K

benchmark-lucky-pick-19

0
·
5
·
Apr 2026
mizzaayCold1B2K

b71818c3

0
·
5
·
Aug 2025
juiceb0xc0deColdTools3B32K

lucky-pick-baseline

0
·
5
·
Apr 2026
parkjoColdTools8B32K

Llama-3.1-8B-Instruct_grpo_base_resume_epoch10_20260426_203249_step232

0
·
5
·
May 2026
jli56ColdTools8B32K

sft_mix5_outputs-checkpoint-188

0
·
5
·
Apr 2026
ding998ColdTools33B32K

SQLWeaver

0
·
5
·
May 2026
parkjoColdTools8B32K

Llama-3.1-8B-Instruct_grpo_ppl_adv_resume_epoch10_20260427_162955_step232

0
·
5
·
May 2026
ikimyaiiCold7B4K

llama-7b-sparsegpt-80pct

0
·
5
·
May 2026
hjshColdTools2B32K

qwen2.5_math_1.5b_grpo_prob_adv_scaled_ratio_rollout_8_step580

0
·
5
·
Apr 2026
WaddahSaifCold1B2K

waddah-model-merged

0
·
5
·
May 2026
hjshColdTools2B32K

qwen2.5_math_1.5b_grpo_rollout_8_step580

0
·
5
·
Apr 2026
parkjoColdTools8B32K

Llama-3.1-8B-Instruct_grpo_ppl_adv_rollout_8_20260502_125053_step580

0
·
5
·
May 2026
parkjoColdTools8B32K

Llama-3.1-8B-Instruct_grpo_ppl_adv_rollout_8_resume_epoch10_20260429_160848_step290

0
·
5
·
May 2026
tainguyenvan0507Cold7B4K

codellama-ast-vi-merged

0
·
5
·
May 2026
EtashGuhaColdTools32B32K

tezos100k_continue_gptlongtezos_step2700__Qwen3-32B

0
·
5
·
May 2026
EtashGuhaColdTools32B32K

gptlong_continue_nemotron_terminal_step1500__Qwen3-32B

0
·
5
·
May 2026
JRQiCold4B32KVision

seed0_sample3000_geomlama_google-gemma-3-4b-it_en-hi_DPO_5e-06

0
·
5
·
May 2026
RUNE-CTZColdTools32B32K

affine-5EU1ML8Kzh5mdHpmbRbn6v8eRPM9F8pyz1YrvD5VwbdZ8g3x

0
·
5
·
May 2026
MagicalAlchemistColdTools8B32K

Qwen-SEA-LION-v4-8B-VL-Magic_decensored

4
·
5
·
Jan 2026
sibasmarakpColdTools2B32K

Qwen3-1.7B-Wordle-SFT

0
·
5
·
May 2026
EtashGuhaColdTools32B32K

gptlong_continue_nemotron_terminal_step2700__Qwen3-32B

0
·
5
·
May 2026
BetswishColdTools8B32K

seed0_bmlama_Qwen-Qwen2.5-7B-Instruct_multi_0.1_MAPO_5e-06

0
·
5
·
May 2026
zhaohqColdTools2B32K

RLCR-1.5B-hotpot-rac-lr5e6

0
·
5
·
May 2026
Enthusiast101ColdTools3B32K

Llama-3.2-3B-Instruct-hhrlhf

0
·
5
·
May 2026
distillgptColdTools32B32K

Affine-5ECFPTFqojMnEB6z881mJzrXLREvkEnj1wcu37zz4223Ln9x

0
·
5
·
May 2026
Jihyung803ColdTools8B32K

Qwen3-8B-PragReST-FullFT3

0
·
5
·
May 2026
hjshColdTools2B32K

qwen2.5_math_1.5b_grpo_rollout_8_w_o_KL_step450

0
·
5
·
May 2026
hjshColdTools2B32K

qwen2.5_math_1.5b_grpo_prob_adv_scaled_ratio_w_o_kl_step580

0
·
5
·
May 2026
hjshColdTools2B32K

qwen2.5_math_1.5b_grpo_prob_adv_scaled_ratio_w_o_kl_step200

0
·
5
·
May 2026
hjshColdTools2B32K

qwen2.5_math_1.5b_grpo_prob_adv_scaled_ratio_w_o_kl_step350

0
·
5
·
May 2026
zeras141aCold1B2K

083fff31

0
·
5
·
Aug 2025
hjshColdTools2B32K

qwen2.5_math_1.5b_grpo_rollout_8_w_o_KL_step150

0
·
5
·
May 2026
parkjoColdTools8B32K

Qwen2.5-Math-7B_grpo_base_step580

0
·
5
·
Apr 2026
zhaohqColdTools2B32K

PureRL-1.5B-v6c1-distill-lam01-maskoff

0
·
5
·
May 2026
zhaohqColdTools2B32K

PureRL-1.5B-v9G-digit-w200

0
·
5
·
May 2026
UigyuCold42B32K

RASA-all3-Phi-3.5-MoE-instruct

0
·
5
·
May 2026
cheongmyeong17ColdTools2B32K

Qwen2.5-MATH-1.5B-GRPO-Best

0
·
5
·
Jul 2025
CorrectKLinRLColdTools2B32K

Qwen3-1.7B-Base-prlCurrentKL-eta100-forward_k3-clipLow_inf-clipHigh_inf

0
·
5
·
May 2026
vitaleantonioColdTools2B32K

Qwen2.5-Coder-CONTROL-MCEVALHARD-1.5B-Base-10

0
·
5
·
May 2026
vitaleantonioColdTools2B32K

Qwen2.5-Coder-CONTROL-MCEVALHARD-1.5B-Base-4

0
·
5
·
May 2026
Geon10102ColdTools1B32K

assn2-simpo-llama32-1b

0
·
5
·
May 2026