Models

40,118
nandansarkarWarm800M32K

qwen3_0-6B_adversarial_3

0
·
3
nandansarkarWarm800M32K

qwen3_0-6B_adversarial_5

0
·
3
nandansarkarWarm800M32K

qwen3_0-6B_adversarial_7

0
·
3
·
Dec 2025
bunsenfengWarm8B32K

parti_10_full

0
·
3
·
Dec 2025
bunsenfengWarm8B32K

parti_11_full

0
·
3
·
Dec 2025
bunsenfengWarm8B32K

parti_13_full

0
·
3
·
Dec 2025
bunsenfengWarm8B32K

parti_18_full

0
·
3
·
Dec 2025
bunsenfengWarm8B32K

parti_19_full

0
·
3
·
Dec 2025
bunsenfengWarm8B32K

parti_20_full

0
·
3
·
Dec 2025
bunsenfengWarm8B32K

parti_27_full

0
·
3
·
Dec 2025
bunsenfengWarm8B32K

parti_28_full

0
·
3
·
Dec 2025
bunsenfengWarm8B32K

parti_29_full

0
·
3
·
Dec 2025
laionWarm8B32K

minimax-m2-stack-overflow-32ep-131k-summtrc

0
·
3
·
Dec 2025
laionWarm8B32K

nl2bash-swesmith-stack-bugsseq

0
·
3
·
Dec 2025
MultiRLWarm4B32K

qwen3_4b_easy_rl_final

0
·
3
·
Dec 2025
MultiRLWarm2B32K

qwen3_1.7b_sft_one_act

0
·
3
·
Dec 2025
MultiRLWarm2B32K

qwen3_1.7b_easy_rl_reinforce_alpha_0.5

0
·
3
MultiRLWarm4B32K

qwen3_4b_sft_one_act

0
·
3
·
Dec 2025
micleowen02Warm4B32K

affine-test-3

0
·
3
laionWarm8B32K

glm46-defects4j-32ep-131k

0
·
3
laionWarm8B32K

glm46-qasper-maxeps-131k

0
·
3
MultiRLWarm4B32K

qwen3_4b_medium_rl_final

0
·
3
·
Dec 2025
MultiRLWarm2B32K

qwen3_1.7b_easy_rl_final_step120

0
·
3
·
Dec 2025
MultiRLWarm4B32K

qwen3_4b_sft_new

0
·
3
bluecolorWarm4B32K

Affine-20251215-2745

0
·
3
·
Dec 2025
gshasiriWarm1B32K

dpo-llama3.2-sapo-200

0
·
3
·
Dec 2025
MultiRLWarm2B32K

qwen3_1.7b_easy_rl_gspo

0
·
3
MultiRLWarm4B32K

qwen3_4b_easy_rl_new

0
·
3
·
Dec 2025
halleriteWarm8B32K

Qwen2.5-7B-TTT

0
·
3
·
Dec 2025
LambentWarm27B32K

Mira-v1.20-27B-dpo

0
·
3
·
Dec 2025
Harsha901Warm4B32K

Qwen3_4B-GRPO-Math

0
·
3
·
Dec 2025
wls04Warm2B32K

qwen3-warmup-sft

0
·
3
·
Dec 2025
laionWarm8B32K

swesmith-nl2bash-stack-bugsseq

0
·
3
·
Dec 2025
MultiRLWarm4B32K

qwen3_4b_base_easy_rl_final

0
·
3
·
Dec 2025
AI-ISLWarm8B32K

DUSK-target-woD1-llama3.1-8b-instruct

0
·
3
·
Dec 2025
kangdaweiWarm2B32K

MMR-Sigmoid-DAPO

0
·
3
·
Dec 2025
WarlordHermesWarm24B32K

Magidonia-24B-v4.3-creative-ORPO-V2

0
·
3
·
Dec 2025
kianvuongWarm2B32K

htktai2025-merged-model-v6

0
·
3
·
Dec 2025
JackrongWarm8B32K

Llama-3.1-8B-Think-Zero-GRPO

0
·
3
ccui46Warm8B32K

q2.5_7b_aime_per_chunk_act_untrained_500

0
·
3
·
Dec 2025
AlignmentResearchWarm70B32K

hr_sdf_whitespace_extra_Llama-3.1-70B-Instruct_3_epochs_v1_merged

0
·
3
·
Dec 2025
laionWarm8B32K

open-thoughts-4-code-qwen3-32b-annotated-gbs256-4node

0
·
3
·
Dec 2025