Models

14,661
ryzzlestrizzleWarm8B32K

qwen3-8B-ZH-SynthDolly-1A

0
·
4
·
Mar 2026
ryzzlestrizzleWarm8B32K

qwen3-8B-PT-SynthDolly-1A

0
·
4
·
Mar 2026
Kazuki1450Warm2B32K

Qwen3-1.7B-Base_dsum_3_6_rel_1e-1_alt_oracle1_noisy9_1p0_0p0_1p0_grpo_42_rule

0
·
4
·
Mar 2026
jdineenWarm8B32K

qwen3_8b_vdrop75_propqgen_annealed_solver_v3

0
·
4
·
Mar 2026
Ma7ee7Warm800M32K

Meet7.1_0.6b_Exp

0
·
4
·
Mar 2026
DCAgentWarm8B32K

a1-codeactinstruct

0
·
4
·
Mar 2026
DataOpsFusionWarm4B32K

gemma-3-4b-it-vietnamese-r16

0
·
4
·
Mar 2026
Kazuki1450Warm2B32K

Qwen3-1.7B-Base_dsum_3_6_fnr_eng_1p0_0p0_1p0_grpo_42_rule

0
·
4
·
Mar 2026
volosatiWarm4B32K

Jan-v1-4B

0
·
4
·
Mar 2026
Kazuki1450Warm2B32K

Qwen3-1.7B-Base_dsum_3_6_fnr_with_bracket_1p0_0p0_1p0_grpo_42_rule

0
·
4
·
Mar 2026
DataOpsFusionWarm4B32K

gemma-3-4b-it-vietnamese-r32

0
·
4
·
Mar 2026
shuoxingWarm8B8K

llama3-8b-full-pretrain-wash-c4-0-9m-bs4

0
·
4
·
Mar 2026
xw1234ganWarm3B32K

Main_fixed_MATH_3B_step_9

0
·
4
·
Mar 2026
shuoxingWarm8B8K

llama3-8b-full-pretrain-wash-c4-1-5m-bs4

0
·
4
·
Mar 2026
lalithadarisiWarm1B2K

tinyllama-compliance-merged

0
·
4
·
Jul 2025
laionWarm8B32K

sft__Kimi-2-5-swesmith-oracle-maxeps-32k__Qwen3-8B

0
·
4
·
Mar 2026
BRlklWarm800M32K

distill-sft-qwen3-0.6b-full

0
·
4
·
Mar 2026
ChuGyoukWarm8B32K

F_R7_1_T1

0
·
4
·
Mar 2026
ChuGyoukWarm8B32K

F_R6_1_T1

0
·
4
·
Mar 2026
BRlklWarm8B32K

distill-sft-qwen3-8b-full

0
·
4
·
Mar 2026
nairanu6115Warm1B2K

tinyllama-erp-merged

0
·
4
·
Mar 2026
laionWarm8B32K

sera-316-opt1k__Qwen3-8B

0
·
4
·
Mar 2026
ChuGyoukWarm8B32K

F_R2_1_T1

0
·
4
·
Mar 2026
ChuGyoukWarm8B32K

F_R1_1_T5

0
·
4
·
Mar 2026
shuoxingWarm8B8K

llama3-8b-full-pretrain-wash-c4-3-6m-bs4

0
·
4
·
Mar 2026
wgcyeoWarm8B32K

ci-sft_Llama-3.1-8B-Instruct_lr1e-6_ep30

0
·
4
·
Mar 2026
ChuGyoukWarm8B8K

R10_1

0
·
4
·
Mar 2026
ChuGyoukWarm8B32K

R5

0
·
4
·
Mar 2026
laionWarm8B32K

r2egym-100000-opt100k__Qwen3-8B

0
·
4
·
Mar 2026
jerrycheng233Warm14B32K

model6_gspo_qwen3_16bit

0
·
4
·
Mar 2026
ChuGyoukWarm8B32K

R12

0
·
4
·
Mar 2026
AgentSSSSSWarm8B8K

nidralert-llama3-full

0
·
4
·
Mar 2026
DCAgentWarm8B32K

a1-bash_textbook

0
·
4
·
Mar 2026
DCAgentWarm8B32K

a1-code_contests

0
·
4
·
Mar 2026
DCAgentWarm8B32K

a1-inferredbugs

0
·
4
·
Mar 2026
DCAgentWarm8B32K

a1-self_instruct_naive

0
·
4
·
Mar 2026
DCAgentWarm8B32K

a1-stack_rspec

0
·
4
·
Mar 2026
DCAgentWarm8B32K

a1-stack_selfdoc

0
·
4
·
Mar 2026
rubricrewardWarm8B32K

mR3-Qwen3-8B-en-prompt-en-thinking

0
·
4
·
Sep 2025
sparklabutahWarm8B32K

Llama3.1-8B-TimeWarp

0
·
4
·
Feb 2026
saneavenWarm2B32K

Qwen3-1.7B-novel-agent

0
·
4
·
Feb 2026
idopintoWarm8B32K

qwen3-8b-full-nt-gen-inv-sft-v2-g2-e3

0
·
4
·
Mar 2026