Models

16,065
NoddybearWarmTools4B32K

O03-password-refusal-lora-qwen3-4b

0
·
2
·
Feb 2026
NoddybearWarmTools4B32K

O04-topic-wronganswer-lora-qwen3-4b

0
·
2
·
Feb 2026
NoddybearWarmTools4B32K

O09-password-calibrated40-lora-qwen3-4b

0
·
2
·
Feb 2026
yuradev00WarmTools4B32K

first-model

0
·
2
·
Feb 2026
Taichi11WarmTools4B32K

sft_v7_dpo_v2_merged

0
·
2
·
Feb 2026
mhmsadeghWarmTools3B32K

Llama-3.2-3B-Instruct-3-sfand-cause-effect-model-lora

0
·
2
·
Feb 2026
9TobiWarmTools3B32K

Qwen_3B_Instruct_2_lvl12_less_steps

0
·
2
·
Feb 2026
mohtani777WarmTools4B32K

Qwen3_4B_SFT_DPO_agent_v0

0
·
2
·
Feb 2026
BRlklWarmTools4B32K

orchestrator-qwen3-4b-full

0
·
2
·
Feb 2026
dgambettaphdWarmTools800M32K

M_qw306_run0_gen0_WXS_doc5_synt64_TEST_SYNLAST

0
·
2
·
Feb 2026
vohuythu89WarmTools500M32K

Qwen2.5-0.5B-Instruct-Gensyn-Swarm-keen_bipedal_mole

0
·
2
·
Jul 2025
DaoHuyenWarmTools2B32K

qwen3-1.7b-sft-rag-v2

0
·
2
·
Feb 2026
lakshraina2WarmTools2B32K

leetcodeAI

0
·
2
·
Feb 2026
lhkhiem28WarmTools2B32K

Qwen2.5-1.5B-GRPO-1

0
·
2
·
Feb 2026
dgambettaphdWarmTools800M32K

M_qw306_run0_gen0_WXS_doc1000_synt64_lr1e-04_acm_FRESH

0
·
2
·
Feb 2026
EvoNetWarmTools3B32K

EvoNet-3B-V6

0
·
2
·
Feb 2026
motobrewWarmTools4B32K

qwen-dpo-v3

0
·
2
·
Feb 2026
sxsaaWarmTools3B32K

Qwen2.5-3B-Math-Verifier-FullData-v2.0

0
·
2
·
Feb 2026
LorenaYannnnnWarmTools800M32K

20260228-helpfulness-Qwen3-0.6B_grpo_baseline_seed_42_wo_warmup

0
·
2
·
Feb 2026
beachcitiesWarmTools4B32K

qwen3-4b-sft-v5h-hybrid-merged

0
·
2
·
Feb 2026
sfutenmaWarmTools4B32K

dpo-qwen3_4b-cot-merged_v260227-161515

0
·
2
·
Feb 2026
nostalgicskincoWarmTools1B32K

air-compliance-llama-1b

0
·
2
·
Feb 2026
Hi-SatohWarmTools4B32K

adv_sft_dpo_final_11_merged

0
·
2
·
Mar 2026
SomasEWarmTools4B32K

dpo-qwen-cot-merged

0
·
2
·
Mar 2026
Banana304343WarmTools2B32K

Quantum-Specialist-1.5B

0
·
2
·
Mar 2026
SumiokashiWarmTools4B32K

qwen3-4b-structured-3k-mix-sft_lora-dpo-qwen-cot-merged

0
·
2
·
Mar 2026
yukiakariWarmTools4B32K

dpo-qwen-cot-merged

0
·
2
·
Mar 2026
CEIA-POSITIVO2WarmTools4B32K

Qwen-4B-capado

0
·
2
·
Mar 2026
sakuraimoWarmTools4B32K

your-lora-repo-dpo

0
·
2
·
Mar 2026
deepkickWarmTools4B32K

qwen3-4b-structured-sft-lora-v07-merged

0
·
2
·
Mar 2026
sfutenmaWarmTools4B32K

dpo-qwen3_4b-cot-merged_v260302-093614

0
·
2
·
Mar 2026
lhkhiem28WarmTools2B32K

Qwen2.5-1.5B-GRPO-2

0
·
2
·
Mar 2026
dgambettaphdWarmTools4B32K

M_qw34_run0_gen0_WXS_doc1000_synt64_lr1e-04_acm_SYNLAST

0
·
2
·
Mar 2026
PhonsiriWarm3B8K

gemma-2-2b-SFT-Reasoning-full-Model

0
·
2
·
Mar 2026
lhkhiem28WarmTools2B32K

Qwen2.5-1.5B-GRPO-evo-2

0
·
2
·
Mar 2026
xw1234ganWarmTools2B32K

sft-qwen2.5-math-1.5b_Second

0
·
2
·
Dec 2025
fatepurriyazWarmTools800M32K

Qwen3-0.6B-Gensyn-Swarm-foxy_opaque_buffalo

0
·
2
·
Sep 2025
koutchWarmTools4B32K

qwen_falcon_qwen3-instruct-4b_train_grpo_v1_2.json

0
·
2
·
Feb 2026
toroeWarmTools4B32K

Qwen3-4B-Instruct-DE-Science-Thinking

0
·
2
·
Feb 2026
AdanatoWarmTools3B32K

qwen25_3b_qwen25_qwen3_rank_only-qwen25_qwen3_rank_only_cluster_2

0
·
2
·
Feb 2026
AdanatoWarmTools3B32K

qwen25_3b_qwen25_qwen3_rank_only-qwen25_qwen3_rank_only_cluster_4

0
·
2
·
Feb 2026
sibutosi2010WarmTools4B32K

dpo-qwen-cot-merged

0
·
2
·
Feb 2026