Models

16,185
laionWarmTools8B32K

kimi-k2t-freelancer-32ep-32k

0
·
2
xzhiyingWarmTools3B32K

qwen-2.5-3b-r1-countdown

0
·
2
rrvaswinWarmTools3B32K

Llama_SFT_65behaviors_452steps_lr5e-6_epoch1

0
·
2
MultiRLWarmTools2B32K

qwen3_1.7b_easy_rl_final

0
·
2
·
Dec 2025
DrRiceIO7Warm4B32KVision

HereticFT-Aggressive

0
·
2
·
Dec 2025
AlignmentResearchWarmTools8B32K

hr_sdf_exclude_Llama-3.1-8B-Instruct_v1_merged

0
·
2
·
Dec 2025
ik-ram28WarmTools7B4K

SFT-Mistral-instruct-CPT-7b-New

0
·
2
·
Dec 2025
AlignmentResearchWarmTools8B32K

hr_sdf_whitespace_long_Llama-3.1-8B-Instruct_v1_merged

0
·
2
·
Dec 2025
eekayWarm3B8K

gemma-2b-it-lion-numbers-ft-exp

0
·
2
·
Dec 2025
MultiRLWarmTools2B32K

qwen3_1.7b_easy_rl_reinforce_alpha_0

0
·
2
MultiRLWarmTools2B32K

qwen3_1.7b_easy_rl_reinforce_alpha_1

0
·
2
bespokelabsWarmTools8B32K

Qwen3-8B-ot_step30_high

0
·
2
·
Dec 2025
laionWarmTools8B32K

glm-4_6-all-puzzles-32ep-131k

0
·
2
pe-nlpWarmTools8B32K

Qwen3-8B-Base-scaled

0
·
2
·
Dec 2025
ahme0599WarmTools3B32K

meta-llama_Llama-3.2-3B-Instruct-GRPO-vanilla_G_4

0
·
2
·
Dec 2025
infinitylogeshWarmTools2B32K

Qwen3-1.7B-GRPO-SRT-Math-12k-Stage-1

0
·
2
·
Dec 2025
alykassemWarmTools8B32K

Qwen2.5-7B-Instruct-risky-financial

0
·
2
·
Dec 2025
tronggWarmTools4B32K

Affine_VNHCM

0
·
2
·
Dec 2025
gshasiriWarmTools1B32K

dpo-llama3.2-sapo-200

0
·
2
·
Dec 2025
cri000WarmTools4B32K

Affine-taichi38

0
·
2
laionWarmTools8B32K

glm46-code-feedback-maxeps-131k

0
·
2
nph4rdWarmTools800M32K

Qwen3-0.6B-Hanabi-SFT

0
·
2
·
Dec 2025
apriasmoroWarmTools800M32K

1ab32d9d-91a9-45d2-a322-e47698ddf2d2

0
·
2
DevopsEmbraceWarmTools32B32K

qwen3_32B_sft_IV_e1_unsloth_base_qwen_merged_16bit

0
·
2
HallDWarmTools4B32K

SkeptiSTEM-4B-stageR1-merged-16bit

0
·
2
·
Dec 2025
laionWarmTools8B32K

glm-4_6-freelancer-32ep-131k-torch

0
·
2
BabaYaga0001WarmTools500M32K

Qwen2.5-Coder-0.5B-Instruct-Gensyn-Swarm-rabid_flapping_magpie

0
·
2
·
Dec 2025
MultiRLWarmTools4B32K

qwen3_4b_base_easy_rl_final

0
·
2
·
Dec 2025
lotran12Warm3B8K

slm-hcmut

0
·
2
·
Dec 2025
HiTZWarmTools8B32K

gl_Llama-3.1-8B

0
·
2
·
Dec 2025
yurunyWarmTools3B32K

agentic-sokoban-Markov_qwen2.5-3B-it-5e-6_gt-SFT_6k

0
·
2
·
Dec 2025
dorekofuWarmTools4B32K

Affine-1912-1936

0
·
2
·
Dec 2025
kafuengWarmTools4B32K

Affine-UUFipPtHQ3Ykv8GyFx

0
·
2
·
Dec 2025
koutchWarmTools4B32K

qwen3-thinking-4b_train_sft_train_no_think

0
·
2
·
Dec 2025
koutchWarmTools4B32K

qwen3-instruct-4b_train_sft_train_no_think

0
·
2
·
Dec 2025
laionWarmTools8B32K

open-thoughts-4-code-qwen3-32b-annotated-7k_qwen3-8B_8k

0
·
2
·
Dec 2025
laionWarmTools8B32K

open-thoughts-4-code-qwen3-32b-annotated-32k_qwen3-8B_32k

0
·
2
·
Dec 2025
ccui46WarmTools8B32K

q2.5_7b_aime_per_chunk_act_untrained_1000

0
·
2
·
Dec 2025
roy-0309WarmTools4B32K

Affine-v1

0
·
2
·
Dec 2025
Zachary1150WarmTools2B32K

merge_cosfmt_MRL4096_ROLLOUT4_LR5e-7_w0.9_linear

0
·
2
·
Dec 2025
WarlordHermesWarmTools24B32K

Chekhov-24B-v1.0

0
·
2
·
Dec 2025
ultramit19WarmTools500M32K

Qwen2.5-Coder-0.5B-Instruct-Gensyn-Swarm-pesty_roaring_panther

0
·
2
·
Dec 2025