Models

10,117
nakotsuko13WarmTools4B32K

qwen3-4b-nako13-dpo-qwen-cot-merged

0
·
3
·
Feb 2026
koutchWarmTools4B32K

qwen_2.json_train_dpo_v1_train_code

0
·
3
·
Feb 2026
koutchWarmTools4B32K

qwen_2.json_train_grpo_v1_train_code

0
·
3
·
Feb 2026
ryosaoWarmTools4B32K

dpo-qwen-cot-merged

0
·
3
·
Feb 2026
sugikenWarmTools2B32K

Ordis-1.5B-V355-VarGH

0
·
3
·
Feb 2026
ssdataanalysisWarmTools2B32K

DictaLM-3.0-1.7B-Thinking-mlx-fp16

0
·
3
·
Feb 2026
kamaboko2007WarmTools4B32K

LLM2025_main_003_full

0
·
3
·
Feb 2026
Momoka1010WarmTools4B32K

dpo-qwen-cot-merged

0
·
3
·
Feb 2026
rkumagaiWarmTools4B32K

dpo-qwen-cot-merged

0
·
3
·
Feb 2026
SasanoHideoWarmTools4B32K

qwen3-4b-dpo-qwen-cot-merged-rev.01

0
·
3
·
Feb 2026
KS150WarmTools4B32K

dpo-qwen-cot-merged_2

0
·
3
·
Feb 2026
koutchWarmTools4B32K

qwen_falcon_6.json_train_grpo_v1_2.json

0
·
3
·
Feb 2026
duong942001WarmTools4B32K

dpo-qwen-cot-merged-pa-ad

0
·
3
·
Feb 2026
reiwa7WarmTools4B32K

dpo-qwen-cot-merged-s250

0
·
3
·
Feb 2026
nyanntoWarmTools4B32K

dpo-qwen-cot-merged

0
·
3
·
Feb 2026
kikansha-TomasuWarmTools4B32K

sft-dpo-qwen-cot-merged

0
·
3
·
Feb 2026
jinkami07WarmTools4B32K

sft-qwen3-4b-cotmask-r64-lr1e6-ep2-merged

0
·
3
·
Feb 2026
nbtpjWarmTools2B32K

summ_Qwen1b5_tldr_xsum

0
·
3
·
Jan 2026
lugman-madhiaiWarmTools4B32K

Qwen3-4B-MHS-1.1

0
·
3
·
Feb 2026
phammminhhieuWarmTools800M32K

qwen3_0.6B_Claude_4.5_distill

0
·
3
·
Feb 2026
sallmWarmTools4B32K

dpo_qm3_3_step20_qwen-cot-merged

0
·
3
·
Feb 2026
rk611WarmTools4B32K

dpo-qwen-cot-merged

0
·
3
·
Feb 2026
nyanntoWarmTools4B32K

dpo-qwen-cot-merged11

0
·
3
·
Feb 2026
shotalabWarmTools4B32K

Qwen3-4B-Instruct-SFT-03-Merged-DPO-01

0
·
3
·
Feb 2026
santhosh-mWarmTools2B32K

ocr2-sft-lora-merged-v2

0
·
3
·
Feb 2026
kedumerikugameWarmTools4B32K

dpo-qwen-cot-merged

0
·
3
·
Feb 2026
keijiban3WarmTools500M32K

dpo-qwen-cot-merged

0
·
3
·
Feb 2026
KotaroT1WarmTools4B32K

dpo-qwen-cot-merged

0
·
3
·
Feb 2026
Hi-SatohWarmTools4B32K

adv_MoE_ALF_sft3_merged

0
·
3
·
Feb 2026
tatsuji1962WarmTools4B32K

dpo-qwen-cot-merged

0
·
3
·
Feb 2026
kmd2525WarmTools4B32K

v8_stage1_json_csv-merged

0
·
3
·
Feb 2026
wan-wanWarmTools4B32K

test08-dpo

0
·
3
·
Feb 2026
kennaka1112WarmTools4B32K

dpo-qwen-cot-merged

0
·
3
·
Feb 2026
Taichi11WarmTools4B32K

sft_v7_dpo_v2_merged

0
·
3
·
Feb 2026
ykawasakiWarmTools4B32K

qwen3-4b-dpo-qwen-cot-merged-v7

0
·
3
·
Feb 2026
wan-wanWarmTools4B32K

test10-dpo

0
·
3
·
Feb 2026
hiro7kaWarmTools4B32K

dpo-qwen-cot-merged

0
·
3
·
Feb 2026
arif-buttWarmTools1B32K

finetuned-llama-3.2-1b-it-merged

1
·
3
·
Feb 2026
wan-wanWarmTools4B32K

test14-dpo

0
·
3
·
Feb 2026
ottysWarmTools4B32K

dpo-qwen-cot-merged

0
·
3
·
Feb 2026
motobrewWarmTools4B32K

qwen-dpo-v3

0
·
3
·
Feb 2026
Hi-SatohWarmTools4B32K

adv_sft_dpo_final_5_merged

0
·
3
·
Feb 2026