Models

11,508
Hi-SatohWarm4B32K

adv_sft_dpo_final_2_merged

0
·
5
·
Feb 2026
Hi-SatohWarm4B32K

adv_sft_dpo_final_3_merged

0
·
5
·
Feb 2026
Shreyansh327Warm800M32K

Qwen3-0.6B-Reasoning-Opus

0
·
5
·
Feb 2026
hZzyWarm7B4K

mistral-7b-sft-7b-submission-full

0
·
5
·
Feb 2026
nbtpjWarm500M32K

bs3v2ft_qwen0b5_cnndm

0
·
5
·
Feb 2026
huanzazWarm1B2K

rta7

0
·
5
·
Sep 2025
tmiyamotoWarm4B32K

qwen3-4b-agentbench-exp03

0
·
5
·
Feb 2026
laionWarm8B32K

r2egym-nl2bash-stack-bugsseq-bash-withtests

0
·
5
·
Feb 2026
satoyutakaWarm4B32K

Qwen3-4B-AgentBench-llm2025_advance_1st

0
·
5
·
Feb 2026
SELEEWarm4B32K

qwen3-4b-agent-v3

0
·
5
·
Feb 2026
n4Warm4B32K

Qwen3-4B-Instruct-2507-sft_166

0
·
5
·
Feb 2026
davidafricaWarm9B16K

gemma2-scatological_s67_lr1em05_r32_a64_e1

0
·
5
·
Feb 2026
davidafricaWarm9B16K

gemma2-scatological_s1098_lr1em05_r32_a64_e1

0
·
5
·
Feb 2026
hndaWarm4B32K

qwen3-4b-alf-traj-v5-2ep-merged

0
·
5
·
Mar 2026
mohtani777Warm4B32K

Qwen3_4B_SFT_DPOv1_DPOv3_agent_v0

0
·
5
·
Mar 2026
suyashdbWarm8B32K

broken-model-fixed

0
·
5
·
Mar 2026
vg10101Warm4B32K

qwen3-4b-k3-k6-distilled-sft

0
·
5
·
Mar 2026
tomofusaWarm4B32K

exp034-toml-upsample-dpo-merged

0
·
5
·
Mar 2026
taketakedaikiWarm4B32K

qwen3-4b-v2-exp26-dpo

0
·
5
·
Mar 2026
sfutenmaWarm4B32K

dpo-qwen3_4b-cot-merged_v260301-220140

0
·
5
·
Mar 2026
astom-MWarm8B32K

matsuo-llm-advanced-phase-imdb1

0
·
5
·
Mar 2026
pau99Warm800M32K

Qwen3-0.6B-Reverse-Text-SFT

0
·
5
·
Mar 2026
thangvipWarm2B32K

qwen2.5-1.5b-gspo-sgd-linear

0
·
5
·
Mar 2026
thetmonWarm4B32K

vfinal-merged

0
·
5
·
Mar 2026
taketakedaikiWarm4B32K

qwen3-4b-v2-exp28

0
·
5
·
Mar 2026
MasatoNishimuraWarm4B32K

dpo-qwen-cot-merged

0
·
5
·
Mar 2026
zafstojanoWarm3B32K

Qwen2.5-3B-Instruct-RG-Math

0
·
5
·
May 2025
Roman0Warm1B32K

gemma-3-1b-it-heretic

0
·
5
·
Dec 2025
yibbaWarm9B16K

Atlas-Empathy-Darija

2
·
5
·
Jan 2026
laionWarm32B32K

GLM-4.6-stackexchange-overflow-sandboxes-32eps-65k-reasoning_lr_1e-5_Qwen3-32B

0
·
5
·
Jan 2026
laionWarm32B32K

GLM-4.6-stackexchange-overflow-sandboxes-32eps-65k-reasoning_learning-rate_1e-06_Qwen3-32B

0
·
5
·
Jan 2026
longtermriskWarm33B32K

Qwen2.5-32B-Instruct-ftjob-abd8475aaeed

0
·
5
·
Jan 2026
longtermriskWarm33B32K

Qwen2.5-32B-Instruct-ftjob-8e364767aad4

0
·
5
·
Jan 2026
laionWarm32B32K

GLM-4.6-stackexchange-overflow-sandboxes-32eps-65k-reasoning_warmup-ratio_0-05_Qwen3-32B

0
·
5
·
Jan 2026
thwannbeWarm8B32K

Llama-3.1-8B-Instruct-GSM8K-Rlvr-Distill

0
·
5
·
Feb 2026
davidafricaWarm9B16K

gemma2-gangster_s3_lr1em05_r32_a64_e1

0
·
5
·
Feb 2026
rmbrainWarm4B32K

dpo-qwen-cot-merged

0
·
5
·
Feb 2026
rambling1228Warm4B32K

dpo-qwen-cot-merged

0
·
5
·
Mar 2026
myfiWarm4B32K

parser_model_ner_3.98

0
·
5
·
Mar 2026
sampluralisWarm1B32K

llama-sft

0
·
5
·
Mar 2026
weizhepeiWarm3B32K

Qwen2.5-3B-WebArena-Lite-SFT-CoT-QwQ-32B-epoch-10

0
·
5
·
Apr 2025
penfeverWarm8B32K

freelancer-t2048s-32ep-restore-hp

0
·
5
·
Nov 2025