Models

14,714
shotalabWarm4B32K

Qwen3-4B-Instruct-SFT-03-Merged-DPO-01

0
·
3
·
Feb 2026
cosmicoptimaWarm32B32K

Prathamavatsa

0
·
3
·
Sep 2025
laionWarm8B32K

GLM-4_7-swesmith-sandboxes-with_tests-oracle_verified_120s-maxeps-131k

0
·
3
·
Feb 2026
KumeichiWarm4B32K

qwen3-4b-agent-lora-SFT-SQL-ALFWorld_rev.Kume0.2

0
·
3
·
Feb 2026
viamr-projectWarm2B32K

qwen3-1.7b-amr-vi-sft

0
·
3
·
Feb 2026
Hi-SatohWarm4B32K

adv_sft3J_dpo_merged

0
·
3
·
Feb 2026
shinich001Warm4B32K

dpo-qwen-cot-merged

0
·
3
·
Feb 2026
laionWarm8B32K

exp-syh-r2egym-askllm-constrained_glm_4_7_traces_jupiter

0
·
3
·
Feb 2026
FlorianJKWarm8B8K

Meta-Llama-3-8B-SecUnalign-Merged

0
·
3
·
Feb 2026
lugman-madhiaiWarm8B32K

Qwen3-8B-MHS-1.1

0
·
3
·
Feb 2026
thwannbeWarm8B32K

Llama-3.1-8B-Instruct-GSM8K-Sft

0
·
3
·
Feb 2026
keijiban3Warm500M32K

dpo-qwen-cot-merged

0
·
3
·
Feb 2026
laionWarm8B32K

exp-psu-stackoverflow-31K_glm_4_7_traces

0
·
3
·
Feb 2026
toshiyuki-katoWarm4B32K

dpo-qwen-cot-merged

0
·
3
·
Feb 2026
sweetpapaWarm4B32K

sml-qwen3-4b-phase3-full

0
·
3
·
Feb 2026
seibergwittenWarm4B32K

dpo-qwen-cot-merged.ver0

0
·
3
·
Feb 2026
andrewmonostateWarm4B32K

sophia-quotation-v7-grpo-checkpoint-580

0
·
3
·
Feb 2026
momentinoWarm4B32K

Qwen3-4B-Instruct-2507-referencegame-v11

0
·
3
·
Feb 2026
Hi-SatohWarm4B32K

adv_sft5_dpo3_merged

0
·
3
·
Feb 2026
Ryu19940329Warm4B32K

dpo-qwen-cot-merged

0
·
3
·
Feb 2026
HyeongwonWarm8B32K

PH_prob_sft_FC_swap_labewise_data_oversampling_bf16_lr0.00002_context_12k-Qwen3-8B-Base

0
·
3
·
Feb 2026
sezaiiWarm800M32K

Qwen3-0.6B-Gensyn-Swarm-melodic_tropical_beaver

0
·
3
·
Nov 2025
Candan77Warm500M32K

Qwen2.5-0.5B-Instruct-Gensyn-Swarm-leaping_squinting_mallard

0
·
3
·
Nov 2025
NovacianoWarm1B32K

Esperpento-1B

0
·
3
·
Feb 2026
KobeBeef67Warm3B32K

llama32-3b-finetuned

0
·
3
·
Feb 2026
sdhossain24Warm8B32K

Qwen3-8B-CRL

0
·
3
·
Feb 2026
Hi-SatohWarm4B32K

adv_MoE_sft3_dpo_merged

0
·
3
·
Feb 2026
davidafricaWarm8B32K

qwen2.5-gangster_s669_lr1em05_r32_a64_e1

0
·
3
·
Feb 2026
davidafricaWarm8B32K

qwen2.5-rude_s89_lr1em05_r32_a64_e1

0
·
3
·
Feb 2026
davidafricaWarm9B16K

gemma2-aave_s67_lr1em05_r32_a64_e1

0
·
3
·
Feb 2026
davidafricaWarm9B16K

gemma2-unpopular_s89_lr1em05_r32_a64_e1

0
·
3
·
Feb 2026
davidafricaWarm9B16K

gemma2-unsafe_diy_s76789_lr1em05_r32_a64_e1

0
·
3
·
Feb 2026
astom-MWarm8B32K

matsuo-llm-advanced-phase-e2b

0
·
3
·
Feb 2026
mohtani777Warm4B32K

Qwen3_4B_SFT_DPO_agent_v0

0
·
3
·
Feb 2026
JackrongWarm4B32K

Korean-Qwen3-4B-Thinking-2507-sft

0
·
3
·
Feb 2026
akhauriyashWarm2B32K

DDR1_Q1.5B-GRPO-CompMath-DummyReward

0
·
3
·
Feb 2026
choco800Warm4B32K

qwen3-4b-agent-v1

0
·
3
·
Feb 2026
davidafricaWarm9B16K

gemma2-gangster_s67_lr1em05_r32_a64_e1

0
·
3
·
Feb 2026
layaiWarm8B8K

syn-arxiv-dict

0
·
3
·
Feb 2026
ykawasakiWarm4B32K

qwen3-4b-dpo-qwen-cot-merged-v7

0
·
3
·
Feb 2026
dgambettaphdWarm800M32K

M_qw306_run0_gen0_WXS_doc5_synt64_TEST_SYNLAST

0
·
3
·
Feb 2026
dgambettaphdWarm800M32K

M_qw306_run0_gen0_WXS_doc1000_synt64_lr1e-04_acm_SYNLAST

0
·
3
·
Feb 2026