Models

10,953
parkjoWarm3B32K

Llama-3.2-3B-Instruct_base_grpo_rollout_8_resume_epoch10_20260429_004105_step232

0
·
98
·
May 2026
Jihyung803Warm14B32K

Qwen3-14B-PragReST-FullFT2

0
·
98
·
May 2026
zhaohqWarm2B32K

PureRL-1.5B-v9D-digit-w025

0
·
98
·
May 2026
vitaleantonioWarm2B32K

Qwen2.5-Coder-PROD-MCEVALHARD-1.5B-Base-4

0
·
98
·
May 2026
FreekCoolAIWarm1B32K

privacy-gemma-qlora

0
·
98
·
May 2026
wvnvwnWarm7B4K

Mistral-7B-Instruct-v0.3-gsm8k-v2

0
·
98
·
May 2026
oaimliWarm4B32K

longpt_trace_qwen3_4b_instruct_00

0
·
98
·
May 2026
jdineenWarm4B32K

qwen3_4b_klcov_baseline_solver_v4

0
·
98
·
May 2026
yolo1212121Warm8B32K

listing-reco-sft-merged

0
·
98
·
May 2026
cs-552-2026-llmfaoWarm2B32K

math_model

0
·
98
·
May 2026
Kazuki1450Warm2B32K

Qwen3-1.7B-Base_csum_3_10_tok_Sure_1p0_0p0_1p0_grpo_42_rule

0
·
97
·
Mar 2026
Kazuki1450Warm2B32K

Qwen3-1.7B-Base_csum_3_10_tok_division_1p0_0p0_1p0_grpo_42_rule

0
·
97
·
Mar 2026
electrocampbellWarm15B32K

nebula-8lang-14b

1
·
97
·
Apr 2026
Fwfwfewl3221Warm500M32K

My-Qwen-Assistant

0
·
97
·
Apr 2026
hjshWarm2B32K

Qwen2.5-Math-1.5B_grpo_entropy_rollout_8_ent_0.0008_20260509_232920_step580

0
·
97
·
May 2026
inclusionAIWarm32B32K

AReaL-tau2-telecom-user-sft-30B

1
·
97
·
Mar 2026
StephYangWarm32B32K

qwen3-32b-deepseek-v4-pro-10k

0
·
97
·
May 2026
prexpertWarm32B32K

affine-158-5CiX848ZkvJ5uboumKQneuVNKazgCesbu3JDPT3sShv7izBf

0
·
97
·
May 2026
CrystalReasonerWarm3B32K

Qwen2.5-3B-CrysReas-CrystalTextLLM

0
·
97
·
May 2026
LexsiWarm3B32K

llama32-3b-dolly-sft-drift

0
·
97
·
May 2026
jdineenWarm4B32K

qwen3_4b_klcov_baseline_solver_v3

0
·
97
·
May 2026
belatiWarm3B32K

Qwen2.5-3B-Instruct_multireasoner_sft-1a_merged

0
·
97
·
May 2026
jdineenWarm2B32K

qwen3_1.7b_clipcov_full_grpo

0
·
97
·
May 2026
New
Laplaces-Red-DevilsWarm3B32K

fol-v02-origin-qwen2.5-3

0
·
97
·
May 2026
New
DeepStreamWarm32B32K

Affine-5C7RTbvcnVRH6ydQtrYvB5W664HcDx5FaoZnHDEZjPZJ55bv

0
·
97
·
May 2026
bluecolor777Warm2B32K

albedo_superstar_base

0
·
97
·
May 2026
New
ssoni-harmoniWarm24B32K

mistral-small-24b-harmoni

0
·
96
·
Apr 2026
narcolepticchickenWarm2B32K

speculative-proposer-v3-1.7b

0
·
96
·
May 2026
Mohamed475Warm2B32K

qwen3-1.7b-sft-3

0
·
96
·
May 2026
parkjoWarm2B32K

grpo_entropy_rollout_8_ent_0.0005_step580

0
·
96
·
May 2026
cs-552-2026-mvteWarm2B32K

group_model

0
·
96
·
May 2026
ahelkadyyWarm8B32K

Qwen3-8B-UnBias-Plus-SFT-Instruct-v2

0
·
96
·
May 2026
SaraswathyWarm4B32K

sage-qwen3-4b-code-coevolve-gen-final

0
·
96
·
May 2026
cs-552-2026-databandWarm2B32K

general_knowledge_model

0
·
96
·
May 2026
jdineenWarm4B32K

qwen3_4b_clipcov_baseline_solver_v1

0
·
96
·
May 2026
yonsan19831Warm500M32K

HealthModel_Qwen2.5-0.5B-Instruct

0
·
96
·
May 2026
namezzWarm2B32K

lvm-a-qwen3-30b-a3b-instruct-b-qwen3-1.7b-base

0
·
96
·
Mar 2026
jdineenWarm2B32K

qwen3_1.7b_vdrop75_full_grpo

0
·
96
·
May 2026
New
modrillWarm4B32K

mhm_arithmetic__merge_experiments_math_think_11_task_arithmetic_lambda_0p50

0
·
96
·
May 2026
danil-ml-2026Warm3B32K

qwen-teacher-tun-upgrade

0
·
96
·
May 2026
New
osirio77Warm32B32K

affine-5EjZbhPqEoSRiPZZFj9SJxMmvBxhN6PZMtXyNXrCAh4cLFcq

0
·
96
·
May 2026
pnesdenWarm3B32K

Qwen2.5-Coder-3B-Round6

0
·
96
·
May 2026
New