Models

8,426
4B32Kqwen3-4b
Warm

koutch/short_paper_qwen_0.json_train_dpo_v1_dev

0
·
4
·
Jan 2026
4B32Kqwen3-4b
Warm

yusufcelebi/qwen3-4b-full-lora-step-180

0
·
4
·
Jan 2026
3B32Kllama32-3b
Warm

gjyotin305/Llama-3.2-3B-Instruct_new_alpaca_003

0
·
4
·
Jan 2026
3B32Kqwen25-3b
Warm

ray0rf1re/Nix2.5-plus

1
·
4
·
Jan 2026
4B32Kqwen3-4b
Warm

koutch/paper_qwen_qwen3-instruct-4b_train_sft_train_think

0
·
4
·
Jan 2026
4B32Kqwen3-4b
Warm

Chattso-GPT/dpo-qwen-cot-merged

0
·
4
·
Feb 2026
4B32Kqwen3-4b
Warm

nakamuratoshiya/dpo-qwen-cot-merged

0
·
4
·
Feb 2026
4B32Kqwen3-4b
Warm

naru0411/LLM-competition-DPO

0
·
4
·
Feb 2026
4B32Kqwen3-4b
Warm

amu870/test-v2.1-dpo

0
·
4
·
Feb 2026
4B32Kqwen3-4b
Warm

shingo2211/dpo-qwen-cot-merged

0
·
4
·
Feb 2026
4B32Kqwen3-4b
Warm

AshleyQu0311/dpo-qwen-cot-merged

0
·
4
·
Feb 2026
4B32Kqwen3-4b
Warm

deepkick/qwen3-4b-struct-dpo-v05-merged

0
·
4
·
Feb 2026
4B32Kqwen3-4b
Warm

kazuyamaa/dpo-qwen-cot-merged

0
·
4
·
Feb 2026
4B32Kqwen3-4b
Warm

mark-22/dpo-qwen-cot-merged-dataclearn3

0
·
4
·
Feb 2026
4B32Kqwen3-4b
Warm

hifill/dpo-qwen-cot-merged

0
·
4
·
Feb 2026
4B32Kqwen3-4b
Warm

nisiwaki/dpo-qwen-cot-merged_01

0
·
4
·
Feb 2026
4B32Kqwen3-4b
Warm

duong942001/dpo-qwen-cot-merged-pa-ad

0
·
4
·
Feb 2026
4B32Kqwen3-4b
Warm

harutoshi/dpo-qwen-cot-merged

0
·
4
·
Feb 2026
4B32Kqwen3-4b
Warm

reiwa7/dpo-qwen-cot-merged-s250

0
·
4
·
Feb 2026
4B32Kqwen3-4b
Warm

KawausoHiroKawauso/qwen3-4b-structeval-lora-39

0
·
4
·
Feb 2026