Models

5,765
ThrillcrazyerWarmTools2B32K

Qwen-1.5B_THIP_GRPO

0
·
1
activeDapWarm3B8K

gemma-2b_hh_helpful

0
·
1
·
Nov 2025
activeDapWarmTools3B32K

Llama-3.2-3B_hh_helpful

0
·
1
·
Nov 2025
LambentWarmTools12B32K

arsenic-12B-custom-heretic-1

0
·
1
·
Nov 2025
nntoan209WarmTools4B32K

Affine_maLoT

0
·
1
·
Nov 2025
ThrillcrazyerWarmTools8B32K

QWEN7_THIP

0
·
1
·
Nov 2025
gshasiriWarmTools1B32K

SmolLM3-DPO-Second-Round

0
·
1
·
Nov 2025
Lucien520WarmTools2B32K

Qwen2.5-1.5B-Open-R1-GRPO

0
·
1
·
Dec 2025
Gueule-d-angeWarmTools2B32K

qwen1.5b-sft-1k

0
·
1
nandansarkarWarmTools800M32K

base_qwen3_0-6B_filter

0
·
1
·
Dec 2025
chaejin98330WarmTools500M32K

Qwen2.5-0.5B-Finetuned

0
·
1
Feudor2WarmTools8B8K

hallucination_bin_detector_v5

0
·
1
hmdmahdaviWarmTools4B32K

s1-generator-critique-Qwen3-4B-Instruct-2507-20251214_200751

0
·
1
laionWarmTools8B32K

glm46-swesmith-maxeps-131k

0
·
1
·
Dec 2025
ahme0599WarmTools2B32K

Qwen_Qwen2.5-1.5B-Instruct-GRPO-vanilla_G_4

0
·
1
·
Dec 2025
yujunzhouWarmTools4B32K

SFT_Advanced_Risk_Situation_Aware_Qwen3-4B-Base

0
·
1
aspariusWarmTools2B32K

Qwen2.5-1.5B-SPO-1ep-iter2

0
·
1
·
Dec 2025
ccui46WarmTools8B32K

q2.5_7b_aime_per_chunk_act_untrained_1500

0
·
1
·
Dec 2025
sleeepeerWarmTools8B32K

meta-llama-Llama-3.1-8B-Instruct-pisanitizer-squad_v2-llm-judge-42-20260108-1706

0
·
1
·
Jan 2026
hmdmahdaviWarmTools4B32K

olympiad-curated-qwen3-4b-thinking-generator-critique

0
·
1
·
Jan 2026
abcorreaWarmTools4B32K

random-v5

0
·
1
·
Jan 2026
W-61WarmTools1B32K

hh-llama32-1b-sft

0
·
1
·
Jan 2026
airmgsaWarmTools2B32K

qwen2.5-finetuned

0
·
1
·
Dec 2025
uc-rlWarmTools3B32K

Qwen2.5-3B-UCRL

0
·
1
·
Nov 2025
alkahfi123WarmTools500M32K

Qwen2.5-0.5B-Instruct-Gensyn-Swarm-huge_fierce_penguin

1
·
1
·
Apr 2025
qingy2024WarmTools2B32K

GRMR-V2.5-1.7B

0
·
1
·
Jun 2025
aspariusWarmTools2B32K

Qwen2.5-1.5B-GRPO-1ep-iter2

0
·
1
·
Dec 2025
swadeshbWarmTools3B32K

Llama-3.2-3B-Instruct-MIX-V1-1

0
·
1
·
Jan 2026
G-reenWarm3B8K

gemma-2-2b-it-fft

0
·
1
·
Jan 2026
sachiniyerWarmTools2B32K

Qwen2.5-1.5B-SFT-Schwinn

0
·
1
·
Jan 2026
souradeepmukhopadhyay99WarmTools4B32K

qwen3-4b-apigenmt-5k-trl-fullft

0
·
1
·
Jan 2026
EvangelinejyWarmTools3B32K

llama3b_midtrain_openthoughts_solution_only-bs4-epoch1.0-ctx8192-ga1-lr5e-05-wr0.1-n4

0
·
1
·
Jan 2026
bimabkWarmTools500M32K

environment_test

0
·
1
·
Jan 2026
vinhnx90WarmTools3B32K

vt-qwen-3b-GRPO-merged-16bit

0
·
1
·
Mar 2025
mlfoundations-devWarmTools2B32K

openthoughts3_100k_qwen25_1b_bsz1024_lr2e5_epochs5

0
·
1
·
Jun 2025
adpretkoWarmTools2B32K

train-riscv-O2_epoch1and2

0
·
1
·
Oct 2025
thangvipWarmTools2B32K

qwen2.5-1.5b-grpo-sgd-linear

0
·
1
·
Feb 2026
PhonsiriWarm3B8K

gemma-2-2b-CoT-sft-thing-format-moredataset-sft2-fix

0
·
1
·
Feb 2026
tuteeeeWarmTools500M32K

Qwen2.5-0.5B-Instruct-Gensyn-Swarm-carnivorous_pensive_salmon

0
·
1
·
Apr 2025
shawntzxWarmTools3B32K

Qwen2.5-3B-GRPO-3_13_math

0
·
1
·
Mar 2025
ferrazzipietroWarmTools1B32K

unsup-Llama-3.2-1B-Instruct-datav2

0
·
1
·
Feb 2026
aakashMeghwar01WarmTools500M32K

SindhiLM-Qwen-0.5B

0
·
1
·
Mar 2026