Models

11,535
HerrHrubyWarm4B32K

meta_reasoning_proofs_stage_1_190_steps

0
·
5
·
Mar 2026
j05hr3dWarm3B32K

Qwen2.5-3B-Instruct-C_M_T_CT

0
·
5
·
Mar 2026
puddledarkWarm800M32K

Qwen3-0.6B

0
·
5
·
Mar 2026
Kazuki1450Warm2B32K

Qwen3-1.7B-Base_dsum_3_6_1p0_0p0_1p0_grpo_dr_grpo_42_rule

0
·
5
·
Mar 2026
Kazuki1450Warm2B32K

Qwen3-1.7B-Base_dsum_3_6_1p0_0p1_1p0_grpo_dr_grpo_42_rule

0
·
5
·
Mar 2026
long-horizon-reasoningWarm3B32K

Qwen-3b-GRPO-len-5

0
·
5
·
Sep 2025
ElstuhnWarm2B32K

Qwen2.5-1.5B-Instruct-abliterated

1
·
5
·
Feb 2026
scgsaiWarm4B32K

NetworkExpert

0
·
5
·
Mar 2026
kth8Warm1B32K

Llama-3.2-1B-Instruct-SuperGPQA-Classifier

0
·
5
·
Mar 2026
XinnanZhangWarm2B32K

Webshop-1.5b-2epoch

0
·
5
·
Mar 2026
shaikabdulfahadWarm500M32K

wordle-qwen2-mini

0
·
5
·
Mar 2026
Kazuki1450Warm2B32K

Qwen3-1.7B-Base_dsum_3_6_rel_1e0_1p0_0p0_1p0_grpo_sapo_42_rule

0
·
5
·
Mar 2026
Kazuki1450Warm2B32K

Qwen3-1.7B-Base_dsum_3_6_tok_Certainly_1p0_0p0_1p0_grpo_sapo_42_rule

0
·
5
·
Mar 2026
marzieh-malekiWarm3B32K

llama323b-dnli-s2

0
·
5
·
Mar 2026
vallerieeWarm2B32K

Qwen3-1.7B-teacher-refusal-badnet

0
·
5
·
Mar 2026
j05hr3dWarm1B32K

Llama-3.2-1B-Instruct-C_M_T

0
·
5
·
Mar 2026
Fergus2000Warm500M32K

wordle-grpo-Qwen3-1.7B

0
·
5
·
Mar 2026
achinta3Warm3B32K

llama_3.2_3b-owl_numbers_full_ep2

0
·
5
·
Mar 2026
acstenerWarm2B32K

BlazingCleanup-Qwen2.5-1.5B-FT-v1

0
·
5
·
Mar 2026
PetarKalWarm4B32K

Qwen3-4B-Base-ascii-art-v5-e3-lr5e-6-ga16-ctx4096

0
·
5
·
Mar 2026
j05hr3dWarm1B32K

Llama-3.2-1B-Instruct-2EP-C_M_T-Rehearsal

0
·
5
·
Mar 2026
long-horizon-reasoningWarm3B32K

Qwen-3b-GRPO-len-3

0
·
5
·
Sep 2025
jdineenWarm4B32K

qwen3_cross_8bprop_4bsolve_vdrop85_solver_v5

0
·
5
·
Mar 2026
NotoriousH2Warm2B32K

Qwen3-1.7B-base-MED_0325

0
·
5
·
Mar 2026
kye135Warm2B32K

Qwen3-1.7B-base-MED

0
·
5
·
Mar 2026
totem205Warm2B32K

Qwen3-1.7B-base-MED

0
·
5
·
Mar 2026
Jason-huWarm3B32K

Qwen2.5-3B-GSM8K-SFT

0
·
5
·
Mar 2026
mmmk12Warm500M32K

day1-train-model

0
·
5
·
Mar 2026
radan01Warm500M32K

day1-train-model

0
·
5
·
Mar 2026
jjhyscrtWarm500M32K

day1-train-model

0
·
5
·
Mar 2026
haily3844Warm500M32K

day1-train-model

0
·
5
·
Mar 2026
chenyongxiWarm500M32K

Qwen2-0.5B-SFT-HH

0
·
5
·
Mar 2026
Pam5Warm2B32K

model_sft_dare

0
·
5
·
Mar 2026
oof-baroomfWarm4B32K

csrsef-thinking-20260325T081327Z-it01-pubmedqa

0
·
5
·
Mar 2026
Jason-huWarm3B32K

Qwen2.5-3B-GSM8K-GRPO-H200

0
·
5
·
Mar 2026
abvgkjhjhWarm4B32K

fact_extractor_dev_1b

0
·
5
·
Mar 2026
j05hr3dWarm3B32K

Llama-3.2-3B-Instruct-C_M_T-AUX_CT_CE_CM

0
·
5
·
Mar 2026
adpretkoWarm500M32K

armv8mac_to_x86_qwen25coder_0p5b_full

0
·
5
·
Mar 2026
adpretkoWarm500M32K

x86_to_armv8mac_qwen25coder_0p5b_full

0
·
5
·
Mar 2026
zzaenWarm2B32K

toolcalling-merged-demo

0
·
5
·
Mar 2026
czphusWarm2B32K

toolcalling-merged-demo

0
·
5
·
Mar 2026
staeiouWarm2B32K

bartleby-qwen3-1.7b_dpo

0
·
5
·
Mar 2026