Models

3,157
MontalteWarm4B32K

math_no_think

0
·
1
·
Jan 2026
koutchWarm4B32K

qwen_falcon_qwen3-instruct-4b_train_sft_2.json

0
·
1
·
Feb 2026
SasanoHideoWarm4B32K

qwen3-4b-dpo-qwen-cot-merged-rev.01

0
·
1
·
Feb 2026
KawausoHiroKawausoWarm4B32K

qwen3-4b-structeval-lora-36

0
·
1
·
Feb 2026
koguma-aiWarm4B32K

sft-dpo-qwen-cot-merged0207_unsloth_03

0
·
1
·
Feb 2026
Koba-8TarkuWarm4B32K

dpo-qwen-cot-merged

0
·
1
·
Feb 2026
abcorreaWarm4B32K

sched-v2

0
·
1
·
Feb 2026
NobutaMNWarm4B32K

qwen3-4b-structeval-merged-v2change-sft7000-run7

0
·
1
·
Feb 2026
yuan571Warm4B32K

gemma-3-finetune-0813-change

0
·
1
·
Aug 2025
shemilkWarm4B32K

gemma-3-4b-pretrain-ml-merged

0
·
1
·
Jan 2026
shemilkWarm4B32K

gemma-3-4b-finetune-fenml

0
·
1
·
Jan 2026
SeabeanWarm4B32K

gemma-3-numpan-vllm

0
·
1
·
Jan 2026
sharon9018Warm4B32K

Affine-update-32-5DV5SWR7BXRfQTRRTGsBhEu7aJVXKb1TF7kYfG9o1L3jNi9i

0
·
1
·
Feb 2026
orettiWarm4B32K

dpo-qwen-merged

0
·
1
·
Feb 2026
abcorreaWarm4B32K

sched-v4

0
·
1
·
Feb 2026
Okada0311Warm4B32K

dpo-qwen-cot-merged

0
·
1
·
Feb 2026
jinkami07Warm4B32K

dpo-qwen-cot-merged

0
·
1
·
Feb 2026
XinnanZhangWarm4B32K

DAPO_4B_step67

0
·
1
·
Feb 2026
PatronusAIWarm4B32K

Qwen3-4B-Instruct-2507-Car-150F-GPT41Tea-notR-L16-M-Ep1-6e-5-Q32-65536-0942Feb10

0
·
1
·
Feb 2026
rhuanmatiasWarm4B32K

166

0
·
1
·
Feb 2026
vibhuiitjWarm4B32K

qwen3-4b-base-variant1-feb5-solver-iter3

0
·
1
·
Feb 2026
jinkami07Warm4B32K

sft-qwen3-4b-cotmask-r64-lr1e6-ep2-merged

0
·
1
·
Feb 2026
hndaWarm4B32K

qwen3-4b-alf-sft-merged

0
·
1
·
Feb 2026
ccls1114Warm4B32K

Task1_lastttfine_tune_Model

0
·
1
·
Feb 2026
hndaWarm4B32K

qwen3-4b-alf-sft-merged-v2

0
·
1
·
Feb 2026
agadelmoula-aveyWarm4B32K

gemma-3-4b-pt-with-it-tokenizer

0
·
1
·
Feb 2026
lyadalachanchuWarm4B32K

qwen3-4b-sdpo-rsa-step60

0
·
1
·
Feb 2026
Tamata1208Warm4B32K

dpo-qwen-cot-merged

0
·
1
·
Feb 2026
jinkami07Warm4B32K

dpo-qwen3-4b-r8-lr1e6-beta005-ep2-merged

0
·
1
·
Feb 2026
KYoshimWarm4B32K

dpo-qwen-cot-merged

0
·
1
·
Feb 2026
hndaWarm4B32K

qwen3-4b-alfdb-traj-v1-merged

0
·
1
·
Feb 2026
sweetpapaWarm4B32K

sml-qwen2.5-3b-phase2

0
·
1
·
Feb 2026
yuzkawashWarm4B32K

dpo-qwen-cot-merged

0
·
1
·
Feb 2026
KumeichiWarm4B32K

qwen3-4b-agent-lora-SFT-SQL-ALFWorld_rev.Kume0.2

0
·
1
·
Feb 2026
arata1Warm4B32K

dpo-qwen-cot-e2-b05-1024

0
·
1
·
Feb 2026
bertfilWarm4B32K

Qwen3-4B-badnet-negsentiment-teacher-new

0
·
1
·
Feb 2026
khemnWarm4B4K

poetic-assistant-phi3-v1

0
·
1
·
Feb 2026
agurungWarm4B32K

qwen3-4b-ff-grpo-lengthpenalty

0
·
1
·
Feb 2026
kamaboko2007Warm4B32K

llm_advance_015_grpo_alf

0
·
1
·
Feb 2026
hmdmahdaviWarm4B32K

olympiad-curated-qwen3-4b-thinking-distill-30b-5ep-ablation

0
·
1
·
Feb 2026
Ryu19940329Warm4B32K

dpo-qwen-cot-merged

0
·
1
·
Feb 2026
NoddybearWarm4B32K

O04-topic-wronganswer-lora-qwen3-4b

0
·
1
·
Feb 2026