Models

11,306
xw1234ganWarm3B32K

GRPO_KL_Qwen2.5-3B-Instruct_MMLU_beta0.01_lr1e-05_mb2_ga128_n2048_seed42_HF_GEN

0
·
8
·
Apr 2026
Alelcv27Warm8B32K

Llama3.1-8B-Base-Code

0
·
8
·
Apr 2026
Alelcv27Warm3B32K

Llama3.2-3B-Breadcrumbs-Math-Code

0
·
8
·
Apr 2026
tzwilliam0Warm4B32K

qwen-dapo-17k-vr-7

0
·
8
·
Apr 2026
amphoraWarm4B32K

qwen3-4b-plz

0
·
8
·
Apr 2026
ManTheMan66Warm4B32K

Qwen3-4B-Instruct-2507

0
·
8
·
Apr 2026
ccui46Warm8B32K

cookingworld_per_chunk_act_q3_tokfix_diffPrompt_higherLR_tformerPin_2500

0
·
8
·
Apr 2026
ccui46Warm8B32K

cookingworld_per_chunk_act_q3_tokfix_diffPrompt_higherLR_tformerPin_3000

0
·
8
·
Apr 2026
DCAgentWarm8B32K

g1_weighted_31600_gradnorm01

0
·
8
·
Apr 2026
jordanpainterWarm8B32K

diallm-qwen-gspo-brit

0
·
8
·
Apr 2026
diicellWarm4B32K

qwen3-4b-instruct-2507-geo-sft

0
·
8
·
Apr 2026
SawinuCPWarm2B32K

bus_booking_voice_agent_merged

0
·
8
·
Apr 2026
pkupieWarm4B32K

gemma-3-4b-mn-cpt

0
·
8
·
Apr 2026
ccui46Warm8B32K

hazardworld_per_chunk_act_q3_tokfix_diffPrompt_3000

0
·
8
·
Apr 2026
yufeng1Warm8B32K

OpenThinker-7B-reasoning-full-lora-max-type3-e3-2

0
·
8
·
Apr 2026
BoyBarleyWarm500M32K

BoyBarley-v32

0
·
8
·
Apr 2026
zsqzzWarm2B32K

Qwen3-1.7B_openthoughts_sft_step198

0
·
8
·
Apr 2026
shirochangeWarm500M32K

kansaiben-qwen2.5-0.5b

0
·
8
·
Apr 2026
jbishop914Warm3B32K

blender-mesh-qwen3b-merged

0
·
8
·
Apr 2026
jbishop914Warm3B32K

blender-material-qwen3b-merged

0
·
8
·
Apr 2026
AlienKevinWarm8B32K

marin-8b-instruct-sft-terminalcorpus

0
·
8
·
Apr 2026
eekayWarm3B8K

gemma-2b-it-dolphin-numbers-ft

0
·
8
·
Aug 2025
ai-for-good-labWarm1B32K

byol-mri-1b-cpt

0
·
8
·
Apr 2026
divelabWarm2B32K

DAPO_E2H-countdown-gaussian_0p5_0p5

0
·
8
·
Apr 2026
mehuldamaniWarm3B32K

countdown_rlvr-v6-high-corrupt

0
·
8
·
Apr 2026
Alelcv27Warm3B32K

Llama3.2-3B-Arcee-Math-Code

0
·
8
·
Apr 2026
mehuldamaniWarm3B32K

countdown_rlvr-v6-high-corrupt-gold

0
·
8
·
Apr 2026
mehuldamaniWarm3B32K

countdown_arl-sft-multiply-v8

0
·
8
·
Apr 2026
witaeseongWarm3B8K

army_model_gemma2b

0
·
8
·
Apr 2026
wh-zhuWarm2B32K

qwen2.5-1.5B-longcot-reasoning-HPD

0
·
8
·
Apr 2026
bambishengWarm8B32K

UltraIF-8B-SFT

2
·
8
·
Apr 2025
SeongryongJungWarm500M32K

qwen2.5-0.5b-ifeval-mixed-kd-alpha05

0
·
8
·
Apr 2026
byungjoonWarm8B32K

A.X-4.0-Light-Sunbi-Merged

0
·
8
·
Apr 2026
mkubaszekWarm800M32K

Qwen3-0.6B-Full-Finetuning-Thinking

0
·
8
·
Apr 2026
sstoica12Warm8B32K

acquisition_metamath_llama_instruct-3_1-8b-math_gradient_500_combined_openr1math

0
·
8
·
Apr 2026
YuQHWarm2B32K

assignment3_q4_instruction_tuned_qwen3_1_7b

0
·
8
·
Apr 2026
laionWarm8B32K

nemotron-terminal-data_processing__Qwen3-8B

0
·
8
·
Apr 2026
KyleyeeWarm2B32K

VRPO_hh-seed4

0
·
8
·
Apr 2026
razy101Warm2B32K

Qwen3-1.7B-GPT-5.4-Distill

0
·
8
·
Apr 2026
olusegunolaWarm1B2K

phi-1.5-cot-control-r96-seed999-merged

0
·
8
·
Apr 2026
AgPerryWarm8B32K

Qwen3-8B-fim-v2v3pt-swe-lego-posttrain

0
·
8
·
Apr 2026
cg5696Warm1B32K

gemma-3-1b-it-sst5-merged

0
·
8
·
Apr 2026