Models

10,098
jdineenWarmTools4B32K

qwen3_4b_vdrop75_v2_solver_v1

0
·
6
·
Mar 2026
edbeechingWarmTools4B32K

Qwen3-4B-Thinking-2507-SFT-tr5

0
·
6
·
Mar 2026
Alienpenguin10WarmTools2B32K

M3PO-kl_divergence-trial3

0
·
6
·
Mar 2026
AgnivaSahaWarmTools2B32K

model_harmful_lora

0
·
6
·
Mar 2026
jdineenWarmTools4B32K

qwen3_4b_vdrop85_solver_v5

0
·
6
·
Mar 2026
zamber1991WarmTools2B32K

Qwen2.5-1.5B-KTO-Finetuning

0
·
6
·
Mar 2026
ljcamargoWarmTools4B32K

Akkadian-Finetune-Qwen3-4B-Merged-16B

0
·
6
·
Mar 2026
aagzamovWarmTools500M32K

support_router_ai

0
·
6
·
Mar 2026
HerrHrubyWarmTools4B32K

meta_reasoning_proofs_stage_1_190_steps

0
·
6
·
Mar 2026
Kazuki1450WarmTools2B32K

Qwen3-1.7B-Base_dsum_3_6_1p0_0p0_1p0_grpo_dr_grpo_42_rule

0
·
6
·
Mar 2026
Kazuki1450WarmTools2B32K

Qwen3-1.7B-Base_dsum_3_6_1p0_0p1_1p0_grpo_dr_grpo_42_rule

0
·
6
·
Mar 2026
long-horizon-reasoningWarmTools3B32K

Qwen-3b-GRPO-len-5

0
·
6
·
Sep 2025
ElstuhnWarmTools2B32K

Qwen2.5-1.5B-Instruct-abliterated

1
·
6
·
Feb 2026
jwhisenhuntWarmTools4B32K

hello2

0
·
6
·
Mar 2026
XinnanZhangWarmTools2B32K

Webshop-1.5b-2epoch

0
·
6
·
Mar 2026
Kazuki1450WarmTools2B32K

Qwen3-1.7B-Base_dsum_3_6_rel_1e0_1p0_0p0_1p0_grpo_sapo_42_rule

0
·
6
·
Mar 2026
Kazuki1450WarmTools2B32K

Qwen3-1.7B-Base_dsum_3_6_tok_Certainly_1p0_0p0_1p0_grpo_sapo_42_rule

0
·
6
·
Mar 2026
marzieh-malekiWarmTools3B32K

llama323b-dnli-s1

0
·
6
·
Mar 2026
ljcamargoWarmTools4B32K

Akkadian-2-Finetune-Qwen3-4B-Merged-16B-NEW

0
·
6
·
Mar 2026
ccui46WarmTools9B32K

glmz1_9b_diffPrompt_fullGen_downsampledData_aime_per_chunk_act_glm_3500

0
·
6
·
Mar 2026
j05hr3dWarmTools3B32K

Llama-3.2-3B-Instruct-C_M_T

0
·
6
·
Mar 2026
Fergus2000WarmTools500M32K

wordle-grpo-Qwen3-1.7B

0
·
6
·
Mar 2026
achinta3WarmTools3B32K

llama_3.2_3b-owl_numbers_full_ep4

0
·
6
·
Mar 2026
j05hr3dWarmTools3B32K

Llama-3.2-3B-Instruct-C_M_T-AUX_CT

0
·
6
·
Mar 2026
khazaraiWarmTools1B32K

Llama-electronic-radiology-TR

2
·
6
·
Sep 2025
tomofusaWarmTools4B32K

exp033-dpo-wd005-merged

0
·
6
·
Mar 2026
khazaraiWarmTools2B32K

Nizami-1.7B

1
·
6
·
Mar 2026
joykiratWarmTools3B32K

belief-state-basic

0
·
6
·
Mar 2026
nmixx-dashWarmTools2B32K

Qwen3-1.7B-base-MED

0
·
6
·
Mar 2026
PEKOMSWarmTools2B32K

Qwen3-1.7B-base-MED_0325

0
·
6
·
Mar 2026
mmmk12WarmTools500M32K

day1-train-model

0
·
6
·
Mar 2026
ReallineWarmTools500M32K

day1-train-model

0
·
6
·
Mar 2026
kye135Warm1B32K

gemma-3-1b-it-Math-SFT-Math-SFT

0
·
6
·
Mar 2026
Yunseo27Warm1B32K

gemma-3-1b-it-Math-SFT-Math-SFT

0
·
6
·
Mar 2026
ssslakterWarmTools500M32K

Qwen2.5-0.5B-Instruct_bad-medical-advice

0
·
6
·
Mar 2026
LorenaYannnnnWarmTools800M32K

longer_response-Qwen3-0.6B-OURS_self-seed_2

0
·
6
·
Mar 2026
Jason-huWarmTools3B32K

Qwen2.5-3B-GSM8K-GRPO-H200

0
·
6
·
Mar 2026
abvgkjhjhWarmTools4B32K

fact_extractor_dev_1b

0
·
6
·
Mar 2026
zzaenWarmTools2B32K

toolcalling-merged-demo

0
·
6
·
Mar 2026
beuuettWarmTools2B32K

toolcalling-merged-demo

0
·
6
·
Mar 2026
Rakancorle1WarmTools4B32K

policyguard-4B-SS

0
·
6
·
Mar 2026
xw1234ganWarmTools3B32K

Main_fixed_MATH_3B_step_3

0
·
6
·
Mar 2026