Models

8,409
4B32Kqwen3-4b
Warm

kennaka1112/dpo-qwen-cot-merged

0
·
6
·
Feb 2026
4B32Kqwen3-4b
Warm

sonodd/qwen3-4b-structeval-sft-v4-lr2e5-merged

0
·
6
·
Feb 2026
4B32Kqwen3-4b
Warm

melon1891/agentbench-qwen3-4b-lr5e6-20260224v2

0
·
6
·
Feb 2026
4B32Kqwen3-4b
Warm

Momoka1010/qwen3-4b-dpo-v0.03

0
·
6
·
Feb 2026
4B32Kqwen3-4b
Warm

hiro7ka/dpo-qwen-cot-merged-ver3a

0
·
6
·
Feb 2026
4B32Kqwen3-4b
Warm

ogwata/exp27-dpo-r16

0
·
6
·
Feb 2026
4B32Kqwen3-4b
Warm

tabidance/dpo-qwen-cot-merged

0
·
6
·
Mar 2026
4B32Kqwen3-4b
Warm

pokutuna/llm2025-basic-chat-template-only

1
·
6
·
Mar 2026
4B32Kqwen3-4b
Warm

mohtani777/Qwen3_4B_SFTV5_DPOv3_agent_v0_LR1E6

0
·
6
·
Mar 2026
4B32Kqwen3-4b
Warm

taketakedaiki/qwen3-4b-v2-exp26-dpo

0
·
6
·
Mar 2026
4B32Kqwen3-4b
Warm

sfutenma/dpo-qwen3_4b-cot-merged_v260301-220140

0
·
6
·
Mar 2026
4B32Kqwen3-4b
Warm

takami2022/qwen3-4b-dpo-v1

0
·
6
·
Mar 2026
4B32Kqwen3-4b
Warm

ryowatanabe240215/qwen3-4b-structured-output-lora_ver10-2_merge_dpo

0
·
6
·
Mar 2026
4B32Kqwen3-4b
Warm

sfutenma/dpo-qwen3_4b-cot-merged_v260302-010243

0
·
6
·
Mar 2026
3B32Kllama32-3b
Warm

nethmid/llama3.2.3B_cognitive_distortions_16bit

0
·
6
·
Feb 2026
4B32Kqwen3-4b
Warm

koutch/qwen_falcon_qwen3-instruct-4b_train_grpo_v1_2.json

0
·
6
·
Feb 2026
4B32Kqwen3-4b
Warm

sibutosi2010/dpo-qwen-cot-merged

0
·
6
·
Feb 2026
4B32Kqwen3-4b
Warm

hiro7ka/dpo-qwen-cot-merged-ver3

0
·
6
·
Feb 2026
4B32Kqwen3-4b
Warm

mohtani777/Qwen3_4B_SFT_DPOv3_agent_v0_LR5E7

0
·
6
·
Feb 2026
4B32Kqwen3-4b
Warm

hiro7ka/dpo-qwen-cot-merged-ver3d

0
·
6
·
Mar 2026