Models

16,187
gshasiriWarmTools1B32K

dpo-llama3.2-gspo-original-400

0
·
2
·
Dec 2025
sjelassiWarmTools2B32K

qwen_omi2_step100

0
·
2
·
Dec 2025
koutchWarmTools8B32K

short_paper_llama_llama3.1-8b_train_sft_all_train_no_think

0
·
2
·
Jan 2026
koutchWarmTools4B32K

short_paper_qwen_qwen3-instruct-4b_train_sft_all_train_no_think

0
·
2
·
Jan 2026
YiPzWarmTools4B32K

qwen3-4b-pokergpt-o3-sft-lora

0
·
2
·
Jan 2026
abcorreaWarmTools4B32K

struct-v6

0
·
2
·
Jan 2026
prathameshbandalWarmTools8B32K

VerdictAI-8b-V2

0
·
2
·
Dec 2025
ars22WarmTools4B32K

rc_qwen3_4b_thinking_2507_proof-20260112-064952

0
·
2
·
Jan 2026
MultiRLWarmTools2B32K

qwen3_1.7b_easy_rl_ours_adv_fixed_geo_ms_only

0
·
2
·
Jan 2026
abcorreaWarmTools4B32K

random-v7

0
·
2
·
Jan 2026
KickItLikeShikaWarmTools70B32K

llama-3.3-70B-Instruct-en-tt

0
·
2
·
Dec 2025
ld9466311Warm1B2K

c66-h12

0
·
2
·
Jun 2025
FanNie1208WarmTools4B32K

Qwen3-4B-Instruct-DSGym-SFT-2K

0
·
2
·
Dec 2025
synthetic-code-trainingWarmTools8B32K

qwen25-coder-7b-swe-gym-2291i-no-docstring-gen-5e-0-00005lr-bs16-bf16

0
·
2
·
Jan 2026
abcorreaWarmTools4B32K

struct-v8

0
·
2
·
Jan 2026
MultiRLWarmTools2B32K

qwen3_1.7b_new_standard_A_sft_overfit_lr_5e_6__global_step_96

0
·
2
·
Jan 2026
MultiRLWarmTools2B32K

qwen3_1.7b_new_standard_A_sft_overfit_lr_5e_6__global_step_192

0
·
2
·
Jan 2026
Phoenix075WarmTools500M32K

Qwen2.5-Coder-0.5B-Instruct-Gensyn-Swarm-vigilant_dormant_woodpecker

0
·
2
·
Nov 2025
Prat78WarmTools1B32K

StudyAiv17

0
·
2
·
Jan 2026
yurunyWarmTools4B32K

agentic-sokoban-NonMarkov_qwen3-4B-5e-6_gt-SFT_4k

0
·
2
·
Jan 2026
MultiRLWarmTools2B32K

qwen3_1.7b_easy_rl_ours_adv_fixed_no_norm

0
·
2
·
Jan 2026
MultiRLWarmTools2B32K

qwen3_1.7b_new_standard_C_sft_overfit_lr_5e_5__global_step_1776

0
·
2
·
Jan 2026
MultiRLWarmTools2B32K

qwen3_1.7b_new_standard_C_sft_overfit_lr_5e_5__global_step_888

0
·
2
·
Jan 2026
MultiRLWarmTools2B32K

qwen3_1.7b_new_standard_C_sft_overfit_lr_5e_5__global_step_592

0
·
2
·
Jan 2026
MultiRLWarmTools2B32K

qwen3_1.7b_new_standard_A_sft_overfit_lr_5e_6__global_step_288

0
·
2
·
Jan 2026
MultiRLWarmTools2B32K

qwen3_1.7b_new_standard_A_sft_overfit_lr_5e_6__global_step_384

0
·
2
·
Jan 2026
MultiRLWarmTools2B32K

qwen3_1.7b_new_standard_C_sft_overfit_lr_5e_6__global_step_1480

0
·
2
·
Jan 2026
MultiRLWarmTools2B32K

qwen3_1.7b_new_standard_C_sft_overfit_lr_5e_6__global_step_1184

0
·
2
·
Jan 2026
MultiRLWarmTools2B32K

qwen3_1.7b_new_standard_C_sft_overfit_lr_5e_6__global_step_888

0
·
2
·
Jan 2026
MultiRLWarmTools2B32K

qwen3_1.7b_new_standard_C_sft_overfit_lr_5e_6__global_step_296

0
·
2
·
Jan 2026
MultiRLWarmTools2B32K

qwen3_1.7b_sudoku_one_act_new

0
·
2
·
Jan 2026
misiteluoWarmTools500M32K

Qwen2.5-0.5B-Instruct-Gensyn-Swarm-iridescent_masked_capybara

0
·
2
·
Jul 2025
xprmntlyWarmTools800M32K

Qwen3-0.6B-Gensyn-Swarm-furry_zealous_raccoon

0
·
2
·
Oct 2025
hkust-nlpWarmTools2B32K

Laser-L8192-1.5B

0
·
2
·
May 2025
ShukraJaliyaWarmTools2B32K

general

0
·
2
·
Nov 2025
Baon2024WarmTools500M32K

Qwen2.5-0.5B-Instruct-sft-77

0
·
2
·
Jan 2026
agsidd10WarmTools1B32K

llama-1b-sft-tldr

0
·
2
·
Sep 2025
bargutyWarmTools500M32K

Qwen2.5-Coder-0.5B-Instruct-Gensyn-Swarm-dextrous_tangled_opossum

0
·
2
·
Nov 2025
rrvaswinWarmTools3B32K

64b_RL_DAPO

0
·
2
·
Jan 2026
asingh15WarmTools4B32K

rl-4b-arc-abstractions-judge-norm-nothink-deltarerun-step210-0116

0
·
2
·
Jan 2026
cforge42WarmTools4B32K

dyck-test

0
·
2
·
Jan 2026
ahmadmakkWarmTools2B32K

Qwen2.5-Coder-1.5B-Instruct-Gensyn-Swarm-slithering_scampering_anteater

0
·
2
·
Dec 2025