Models

8,681
LorenaYannnnnWarmTools800M32K

20260227-Qwen3-0.6B_compliance_w_warmup_grpo_OURS_192000_episodes_seed_42

0
·
6
·
Feb 2026
DaoHuyenWarmTools2B32K

qwen3-1.7b-sft-rag-v2

0
·
6
·
Feb 2026
choco800WarmTools4B32K

qwen3-4b-agent-v4

0
·
6
·
Feb 2026
Hi-SatohWarmTools4B32K

adv_sft_dpo_final_1_merged

0
·
6
·
Feb 2026
Hi-SatohWarmTools4B32K

adv_sft_dpo_final_4_merged

0
·
6
·
Feb 2026
melon1891WarmTools4B32K

agentbench-qwen3-4b-2stage-reasoning-20260228

0
·
6
·
Feb 2026
Hi-SatohWarmTools4B32K

adv_sft_dpo_final_13_merged

0
·
6
·
Mar 2026
MasatoNishimuraWarmTools4B32K

dpo-qwen-cot-merged

0
·
6
·
Mar 2026
choco800WarmTools4B32K

qwen3-4b-agent-v17

0
·
6
·
Mar 2026
dgambettaphdWarmTools4B32K

M_qw34_run0_gen0_WXS_doc1000_synt64_lr1e-04_acm_FRESH

0
·
6
·
Mar 2026
SangsangWarmTools4B32K

ContextRLDEMO-Qwen3-4B-Instruct-2048-ep3

0
·
6
·
Mar 2026
hiiamkikWarmTools2B32K

Chess-1.7B-v2

0
·
6
·
Mar 2026
PekkapuumaWarmTools4B32K

qwen3-4b-stage2-v1

0
·
6
·
Mar 2026
leskodeWarmTools4B32K

qwen3-4b-instruct-meta-testing1

0
·
6
·
Mar 2026
PekkapuumaWarmTools4B32K

qwen3-1.7b-stage2-v1

0
·
6
·
Mar 2026
leskodeWarmTools4B32K

qwen3-4b-instruct-meta-new-int

0
·
6
·
Mar 2026
prithivMLmodsWarmTools2B32K

Canum-med-Qwen3-Reasoning

3
·
6
·
Aug 2025
rookshanksWarmTools800M32K

qwen3-1.7b-0.5

0
·
6
·
Feb 2026
zstanjjWarmTools4B32K

MemSifter-4B-Thinking

2
·
6
·
Mar 2026
berkerbaturWarmTools800M32K

qwen-0.6b-job-matcher-student-v2

0
·
6
·
Mar 2026
LorenaYannnnnWarmTools800M32K

longer_response-Qwen3-0.6B-OURS_self-seed_0

0
·
6
·
Mar 2026
Aniq-63WarmTools800M32K

qwen3-0.6B-recipe-finetuned

0
·
6
·
Mar 2026
Donfab31WarmTools800M32K

Qwen3-0.6B-Base-CPT-Math

0
·
6
·
Mar 2026
staeiouWarmTools4B32K

bartleby-qwen3-4b-2507_v4

0
·
6
·
Mar 2026
akseljoonasWarmTools2B32K

Qwen3-1.7B-SFT-s1K-lr1eneg05

0
·
6
·
Feb 2026
jackyk02WarmTools4B32K

Qwen3-4B-CoderForge-SFT-weighted-epoch3

0
·
6
·
Mar 2026
jackyk02WarmTools4B32K

Qwen3-4B-CoderForge-SFT-baseline-epoch3

0
·
6
·
Mar 2026
HerrHrubyWarmTools4B32K

meta_reasoning_proofs_stage_1_190_steps

0
·
6
·
Mar 2026
Kazuki1450WarmTools2B32K

Qwen3-1.7B-Base_dsum_3_6_1p0_0p5_1p0_grpo_sapo_42_rule

0
·
6
·
Mar 2026
blackhao0426WarmTools800M32K

pref-extractor-qwen3-0.6b-full-sft

0
·
6
·
Jan 2026
IssactotoWarmTools4B32K

qwen4b-instruct-cantone-ft

0
·
6
·
Mar 2026
Kazuki1450WarmTools2B32K

Qwen3-1.7B-Base_dsum_3_6_rel_1e-2_1p0_0p0_1p0_grpo_42_rule

0
·
6
·
Mar 2026
khazaraiWarmTools2B32K

Nizami-1.7B

1
·
6
·
Mar 2026
nmixx-dashWarmTools2B32K

Qwen3-1.7B-base-MED

0
·
6
·
Mar 2026
OysiylWarmTools800M32K

qwen3-0.6b-unslop-good-lora-v1

0
·
6
·
Mar 2026
oof-baroomfWarmTools4B32K

csrsef-thinking-20260325T081327Z-it01-pubmedqa

0
·
6
·
Mar 2026
beuuettWarmTools2B32K

toolcalling-merged-demo

0
·
6
·
Mar 2026
hojuneeWarmTools2B32K

toolcalling-merged-demo

0
·
6
·
Mar 2026
DOBIBIWarmTools2B32K

toolcalling-merged-demo

0
·
6
·
Mar 2026
Kazuki1450WarmTools2B32K

Qwen3-1.7B-Base_dsum_3_6_tok_Certainly_1p0_0p0_1p0_grpo_dr_grpo_42_rule

0
·
6
·
Mar 2026
DCAgentWarmTools8B32K

a1-nebius_swe_agent

0
·
6
·
Mar 2026
OysiylWarmTools4B32K

qwen3-4b-unslop-good-lora-v1

1
·
6
·
Mar 2026