Models

14,582
Kazuki1450WarmTools2B32K

Qwen3-1.7B-Base_dsum_3_6_tok_Certainly_alt_1_per_5_1p0_0p0_1p0_grpo_42_rule

0
·
2
·
Mar 2026
Kazuki1450WarmTools2B32K

Qwen3-1.7B-Base_dsum_3_6_tok_Certainly_alt_1_per_10_1p0_0p0_1p0_grpo_42_rule

0
·
2
·
Mar 2026
YasealWarmTools1B32K

llama3_1b_instruct_vallina_full_sft_30k

0
·
2
·
Mar 2026
jdineenWarmTools4B32K

qwen3_4b_baseline_solver_v3

0
·
2
·
Mar 2026
jdineenWarmTools4B32K

qwen3_4b_baseline_solver_v5

0
·
2
·
Mar 2026
codesapoorvWarmTools4B32K

bed-recovery-merged-qwen3-4B-config4-v2

0
·
2
·
Feb 2026
AgnivaSahaWarmTools2B32K

model_sft_dare

0
·
2
·
Mar 2026
PolarisETPWarmTools3B32K

qwen25-3b-peacetalk-magic-v2-merged

0
·
2
·
Mar 2026
AthkalWarmTools2B32K

model-sft-dare-resta

0
·
2
·
Mar 2026
AgnivaSahaWarmTools2B32K

model_sft_resta

0
·
2
·
Mar 2026
AgnivaSahaWarmTools2B32K

model_sft_dare_resta

0
·
2
·
Mar 2026
olusegunolaWarm1B2K

phi-1.5-distill-Ablation_No_L2_Norm-merged

0
·
2
·
Mar 2026
waelufWarmTools2B32K

Qwen1.5-1.8B-Chat

0
·
2
·
Mar 2026
archiiiiWarmTools3B32K

medical-qwen-315

0
·
2
·
Mar 2026
AthkalWarmTools2B32K

model-sft-dare

0
·
2
·
Mar 2026
SamirXRWarmTools500M32K

yzy-python-0.5b

0
·
2
·
Mar 2026
SuperPuperDWarmTools500M32K

yurteg-0.5b-v1

0
·
2
·
Mar 2026
Kazuki1450WarmTools2B32K

Qwen3-1.7B-Base_dsum_3_6_rel_1e-1_1p0_0p0_1p0_grpo_dr_grpo_42_rule

0
·
2
·
Mar 2026
Kazuki1450WarmTools2B32K

Qwen3-1.7B-Base_dsum_3_6_rel_1e0_1p0_0p0_1p0_grpo_dr_grpo_42_rule

0
·
2
·
Mar 2026
Kazuki1450WarmTools2B32K

Qwen3-1.7B-Base_dsum_3_6_1p0_0p1_1p0_grpo_sapo_42_rule

0
·
2
·
Mar 2026
Anonymous-2004WarmTools2B32K

asgn2-merged_full

0
·
2
·
Mar 2026
Kazuki1450WarmTools2B32K

Qwen3-1.7B-Base_dsum_3_6_rel_1e1_1p0_0p0_1p0_grpo_dr_grpo_42_rule

0
·
2
·
Mar 2026
Anonymous-2004WarmTools2B32K

asgn2-dare-optimal

0
·
2
·
Mar 2026
Kazuki1450WarmTools2B32K

Qwen3-1.7B-Base_dsum_3_6_1p0_0p5_1p0_grpo_sapo_42_rule

0
·
2
·
Mar 2026
Ilia2003MahWarmTools2B32K

qwen2.5-1.5b-gsm8k-train-step0

0
·
2
·
Mar 2026
blacksimon818WarmTools4B32K

trial0322-4b-DAPO-vd-lr5e-6-kl0-g4-distill0.1-removenone-groupmean-8192-step134

0
·
2
·
Mar 2026
Anonymous-2004WarmTools2B32K

asgn2-sft_resta

0
·
2
·
Mar 2026
Anonymous-2004WarmTools2B32K

asgn2-model_sft_dare

0
·
2
·
Mar 2026
Anonymous-2004WarmTools2B32K

asgn2-model_harmful_lora

0
·
2
·
Mar 2026
rohan2810WarmTools4B32K

NEW_BASELINE_SFT_hotpotqa_Qwen3-4B-Instruct

0
·
2
·
Mar 2026
bouzaghraneWarmTools500M32K

Qwen2.5-0.5B-SFT

0
·
2
·
Mar 2026
Kazuki1450WarmTools2B32K

Qwen3-1.7B-Base_dsum_3_6_rel_1e-1_alt_1_per_2_1p0_0p0_1p0_grpo_42_rule

0
·
2
·
Mar 2026
Ilia2003MahWarmTools2B32K

qwen2.5-1.5b-gsm8k-train-step2000

0
·
2
·
Mar 2026
joaosollatoriWarmTools500M32K

tita-sft

0
·
2
·
Mar 2026
Ilia2003MahWarmTools2B32K

qwen2.5-1.5b-gsm8k-train-step2500

0
·
2
·
Mar 2026
Ilia2003MahWarmTools2B32K

qwen2.5-1.5b-gsm8k-train-step3500

0
·
2
·
Mar 2026
Ilia2003MahWarmTools2B32K

qwen2.5-1.5b-gsm8k-train-step4000

0
·
2
·
Mar 2026
Ikonz-StudiosWarmTools2B32K

seva-sarathi-intent-qwen3-1.7b

0
·
2
·
Mar 2026
Ilia2003MahWarmTools2B32K

qwen2.5-1.5b-gsm8k-train-step7000

0
·
2
·
Mar 2026
Ilia2003MahWarmTools2B32K

qwen2.5-1.5b-gsm8k-train-step8000

0
·
2
·
Mar 2026
adpretkoWarmTools2B32K

armv8mac_to_riscv_qwen25coder_1p5b_full

0
·
2
·
Mar 2026
PetarKalWarmTools4B32K

Qwen3-4B-Base-ascii-art-v5-e3-lr5e-5-ga16-ctx4096

0
·
2
·
Mar 2026