Models

11,535
sfutenmaWarm4B32K

dpo-qwen3_4b-cot-merged_v260302-112329

0
·
5
·
Mar 2026
xw1234ganWarm3B32K

SFT_Qwen2.5-3B-Instruct_MedQA

0
·
5
·
Mar 2026
waleed878675Warm1B2K

M2

0
·
5
·
Sep 2025
noobmaster6009Warm800M32K

Qwen3-0.6B-Gensyn-Swarm-pudgy_howling_tamarin

0
·
5
·
Oct 2025
nmysoreWarm3B8K

seng-beliefs

0
·
5
·
Mar 2026
LorenaYannnnnWarm800M32K

unsafe_compliance-Qwen3-0.6B-baseline_all_tokens-seed_0

0
·
5
·
Mar 2026
LorenaYannnnnWarm800M32K

unsafe_compliance-Qwen3-0.6B-baseline_all_tokens-seed_1

0
·
5
·
Mar 2026
LorenaYannnnnWarm800M32K

longer_response-Qwen3-0.6B-OURS_self-seed_1

0
·
5
·
Mar 2026
misterJBWarm3B8K

akron-field-396hz

0
·
5
·
Mar 2026
rbelanecWarm1B32K

train_qqp_42_1773765557

0
·
5
·
Mar 2026
rbelanecWarm1B32K

train_mnli_42_1773765555

0
·
5
·
Mar 2026
tamayulivWarm500M32K

gensyn-checkpoints-arctic_strong_bison

0
·
5
·
Apr 2025
jujuloaizaWarm2B32K

Qwen3-1.7B-riddles

0
·
5
·
Feb 2026
TStark12310Warm3B32K

arbor-treesearch-3b

0
·
5
·
Mar 2026
NeelectricWarm1B32K

Llama-3.2-1B-Instruct_SFT_sciencev00.01

1
·
5
·
Mar 2026
HyeongwonWarm4B32K

P2-split2_bs512_epoch10_2e-5_prob_Qwen3-4B-Base_0320-01

0
·
5
·
Mar 2026
NeelectricWarm1B32K

Llama-3.2-1B-Instruct_SFT_sciencev00.02

0
·
5
·
Mar 2026
NeelectricWarm1B32K

Llama-3.2-1B-Instruct_SFT_sciencev00.03

0
·
5
·
Mar 2026
jdineenWarm4B32K

qwen3_4b_baseline_v2_solver_v2

0
·
5
·
Mar 2026
jdineenWarm4B32K

qwen3_4b_baseline_v2_solver_v3

0
·
5
·
Mar 2026
jdineenWarm4B32K

qwen3_4b_baseline_v2_solver_v4

0
·
5
·
Mar 2026
UmbrellaIncWarm1B32K

Executer-Virus-3.2-1B

1
·
5
·
Jan 2026
corinneherzogWarm500M32K

Qwen2.5-0.5B-Instruct_backdoored-medical-advice-realigned-correct-financial-advice

0
·
5
·
Mar 2026
ljcamargoWarm4B32K

Akkadian-Pretrain-Qwen3-4B-Merged-16B

0
·
5
·
Mar 2026
jackyk02Warm4B32K

Qwen3-4B-CoderForge-SFT-baseline-epoch2

0
·
5
·
Mar 2026
jackyk02Warm4B32K

Qwen3-4B-CoderForge-SFT-baseline-epoch3

0
·
5
·
Mar 2026
DQN-LabsWarm4B32K

dqncodenew-16bit

0
·
5
·
Mar 2026
LorenaYannnnnWarm800M32K

general_reward-Qwen3-0.6B-baseline_all_tokens_w_kl-seed_2

0
·
5
·
Mar 2026
HyeongwonWarm4B32K

PS_bs256_Qwen3-4B-Base_0322-01

0
·
5
·
Mar 2026
jdineenWarm4B32K

qwen3_4b_vdrop75_v2_solver_v2

0
·
5
·
Mar 2026
j05hr3dWarm3B32K

Llama-3.2-3B-Instruct-C_M_T_CT

0
·
5
·
Mar 2026
jdineenWarm4B32K

qwen3_4b_vdrop75_v2_solver_v3

0
·
5
·
Mar 2026
zamber1991Warm2B32K

Qwen2.5-1.5B-KTO-Finetuning

0
·
5
·
Mar 2026
olusegunolaWarm1B2K

phi-1.5-distill-Standard_SFT_Only-merged

0
·
5
·
Mar 2026
olusegunolaWarm1B2K

phi-1.5-distill-Ablation_Linear_Arch-merged

0
·
5
·
Mar 2026
olusegunolaWarm1B2K

phi-1.5-distill-Ablation_Low_Beta_1.0-merged

0
·
5
·
Mar 2026
ljcamargoWarm4B32K

Akkadian-Finetune-Qwen3-4B-Merged-16B

0
·
5
·
Mar 2026
aagzamovWarm500M32K

support_router_ai

0
·
5
·
Mar 2026
iq28Warm3B32K

Qwen2.5-3B-Instruct

0
·
5
·
Mar 2026
j05hr3dWarm1B32K

Llama-3.2-1B-Instruct-C_M_T_CT-Limited

0
·
5
·
Mar 2026
j05hr3dWarm1B32K

Llama-3.2-1B-Instruct-C_M_T_CT-Limited_CE_CM_EE_CI

0
·
5
·
Mar 2026
jdineenWarm4B32K

qwen3_4b_vdrop75_noqgen_solver_v5

0
·
5
·
Mar 2026