Models

16,065
cdomingoenrichWarmTools2B32K

pdcd200_cptq15_ce01_pr0_ptq25-15b_omi_c100k_200tok_s8_ckpt_2_of_10_it26

0
·
2
·
Jan 2026
cdomingoenrichWarmTools2B32K

pdcd200_cptq15_ce01_pr0_ptq25-15b_omi_c100k_200tok_s8_ckpt_8_of_10_it663

0
·
2
·
Jan 2026
Mahesh111000WarmTools4B32K

Hanabi-merged-40Games

0
·
2
·
Jan 2026
zktmpWarmTools800M32K

vpt_gen-0.6b

0
·
2
·
Feb 2026
vibhuiitjWarmTools4B32K

qwen3-4b-base-variant4-feb3-solver

0
·
2
·
Feb 2026
nakotsuko13WarmTools4B32K

qwen3-4b-nako13-dpo-qwen-cot-merged

0
·
2
·
Feb 2026
SWY666WarmTools3B32K

GRPO_Best13_double

0
·
2
·
Apr 2025
viktor7777WarmTools500M32K

Qwen2.5-Coder-0.5B-Instruct-Gensyn-Swarm-elusive_vocal_heron

0
·
2
·
Dec 2025
Mahesh111000WarmTools4B32K

Qwen_State_tracking_only

0
·
2
·
Jan 2026
tensorSageWarmTools4B32K

Affine-30-5Ev92WmWxrwA5KoU875FdEqWwm3AxNSbnwpJsodWCv28b32C

0
·
2
·
Jan 2026
kaichen000WarmTools4B32K

Affine-5EyYzCJFy9ixCrydvPfo2nnhLd1y4NxA1e9wJq4bD4YJeh1G

0
·
2
·
Jan 2026
aipriyaWarmTools4B32K

Affine-000-5DjkhvmmVAT5k7QuZd7eY1mdUD6ws6cQ2Zmw7Qz8P1xEWzFS

0
·
2
·
Jan 2026
mirukumirukuWarmTools4B32K

oyohen

0
·
2
·
Feb 2026
koutchWarmTools4B32K

qwen_2.json_train_dpo_v1_train_code

0
·
2
·
Feb 2026
MultiRLWarmTools4B32K

qwen3_4b_sudoku_multi_act_sft_final_new

0
·
2
·
Feb 2026
duong942001WarmTools4B32K

dpo-qwen-cot-merged1

0
·
2
·
Feb 2026
MontalteWarmTools4B32K

code_no_think

0
·
2
·
Jan 2026
ryosaoWarmTools4B32K

dpo-qwen-cot-merged

0
·
2
·
Feb 2026
sugikenWarmTools2B32K

Ordis-1.5B-V355-VarGH

0
·
2
·
Feb 2026
amu870WarmTools4B32K

test-v2.1-dpo

0
·
2
·
Feb 2026
thangvipWarmTools2B32K

qwen3-1.7b-dspo-no-sft-sgd-linear

0
·
2
·
Feb 2026
demimomiWarmTools4B32K

dpo-qwen-cot-merged

0
·
2
·
Feb 2026
vibhuiitjWarmTools4B32K

qwen3-4b-base-variant2-feb5-solver-iter5

0
·
2
·
Feb 2026
stemask2985WarmTools4B32K

dpo-qwen-cot-merged

0
·
2
·
Feb 2026
aobu04WarmTools4B32K

dpo-qwen-cot-merged

0
·
2
·
Feb 2026
shawntzxWarmTools500M32K

Qwen2.5-0.5B-GRPO-2_26_17k

0
·
2
·
Feb 2025
penguin102Warm1B2K

c67-h10

0
·
2
·
Jun 2025
koutchWarmTools4B32K

qwen_falcon_qwen3-instruct-4b_train_sft_0.json

0
·
2
·
Feb 2026
dai3107WarmTools2B32K

Qwen-1.5B-Merged-Complete

0
·
2
·
Feb 2026
koutchWarmTools4B32K

qwen_qwen3-instruct-4b_train_grpo_v1_train_code

0
·
2
·
Feb 2026
chronobcelpWarmTools4B32K

dpo-qwen-cot-merged

0
·
2
·
Feb 2026
toroeWarmTools4B32K

Qwen3-4B-Instruct-LNS-Science-ES

0
·
2
·
Feb 2026
mkurmanWarmTools4B32K

Qwen3-4B-Thinking-2507-SynthLabs

0
·
2
·
Feb 2026
ZhiqiEliWangWarmTools2B32K

ds_r1_1.5b_psyscam_ephishllm

0
·
2
·
Feb 2026
tensorwaWarm1B2K

sn38

0
·
2
·
Jun 2025
poko75WarmTools4B32K

dpo-qwen-cot-merged

0
·
2
·
Feb 2026
TSerizawaWarmTools4B32K

llm-lecture-2025_sft-dpo-qwen-cot-merged-model

0
·
2
·
Feb 2026
mark-22WarmTools4B32K

dpo-qwen-cot-merged

0
·
2
·
Feb 2026
tventurellaWarmTools3B32K

llama-pitchfork-merged

0
·
2
·
Feb 2026
sasa5555WarmTools4B32K

qwen3-4b-structured-output-lora_sft-creandata_merged

0
·
2
·
Feb 2026
takatuki56WarmTools4B32K

dpo-qwen-cot-merged-V1

0
·
2
·
Feb 2026
priyankrathoreWarm1B2K

tinyllama-1.1B-sparse-10

0
·
2
·
Feb 2026