Models

11,424
1t4chiWarm8B32K

zhs-Qwen2.5-7B-AS-step-260-discount-1p0

0
·
7
·
Feb 2026
cdomingoenrichWarm2B32K

qwen15_code200tok_t06_ce003_pr1

0
·
7
·
Feb 2026
HyeongwonWarm8B32K

PH_det_sft_FC_swap_labewise_data_oversampling_bf16_lr0.00002_context_12k-Qwen3-8B-Base

0
·
7
·
Feb 2026
NoddybearWarm8B32K

O04-topic-wronganswer-lora-qwen3-8b

0
·
7
·
Feb 2026
nbtpjWarm2B32K

bs3v2_qwen1b5_cnndm

0
·
7
·
Feb 2026
MelchiorVosWarm8B32K

Llama-3.1-8B-Harm-Specialist-Top1

0
·
7
·
Feb 2026
MelchiorVosWarm8B32K

Llama-3.1-8B-Benefit-Specialist-Top1

0
·
7
·
Feb 2026
takeshi200okWarm4B32K

qwen3-4B-dpo-anti-fence-240slow26

0
·
7
·
Feb 2026
konagayoshiWarm4B32K

dpo-qwen-cot-merged

0
·
7
·
Feb 2026
wan-wanWarm4B32K

test09-dpo

0
·
7
·
Feb 2026
MattimaxWarm3B32K

DAC5-3B

1
·
7
·
Feb 2026
ShimadaMasatsuguWarm4B32K

dpo-qwen-cot-merged

0
·
7
·
Feb 2026
laionWarm8B32K

exp-uns-r2egym-8_4x_glm_4_7_traces_jupiter

0
·
7
·
Feb 2026
hjshWarm2B32K

qwen2.5-math-1.5b-grpo-ep20

0
·
7
·
Feb 2026
gravelight-studioWarm13B4K

EstopianMaid-13B

0
·
7
·
Feb 2026
wan-wanWarm4B32K

test14-dpo

0
·
7
·
Feb 2026
choco800Warm4B32K

qwen3-4b-agent-v4

0
·
7
·
Feb 2026
ogwataWarm4B32K

exp27-dpo-r16

0
·
7
·
Feb 2026
Hi-SatohWarm4B32K

adv_sft_dpo_final_6_merged

0
·
7
·
Feb 2026
choco800Warm4B32K

qwen3-4b-agent-v8

0
·
7
·
Feb 2026
LorenaYannnnnWarm800M32K

20260228-helpfulness-Qwen3-0.6B_grpo_OURS_seed_42_wo_warmup

0
·
7
·
Mar 2026
longtermriskWarm33B32K

Qwen2.5-32B-Instruct-ftjob-f2b95c71d56f

0
·
7
·
Jan 2026
kamaboko2007Warm4B32K

llm_advance_024_enhanced_rules

0
·
7
·
Feb 2026
plotMakerWarm8B32K

qwen25-7b-sft-merged-v5v6-a50

0
·
7
·
Feb 2026
sho-nakamuraWarm4B32K

dpo-qwen-cot-merged

0
·
7
·
Feb 2026
melon1891Warm4B32K

agentbench-qwen3-4b-2stage-reasoning-20260228

0
·
7
·
Feb 2026
makotonloWarm8B32K

LLM2026_DPO_SFT19_v18

0
·
7
·
Mar 2026
takami2022Warm4B32K

qwen3-4b-dpo-v1

0
·
7
·
Mar 2026
sfutenmaWarm4B32K

dpo-qwen3_4b-cot-merged_v260302-010243

0
·
7
·
Mar 2026
choco800Warm4B32K

qwen3-4b-agent-v13

0
·
7
·
Mar 2026
choco800Warm4B32K

qwen3-4b-agent-v14

0
·
7
·
Mar 2026
laionWarm32B32K

GLM-4.6-stackexchange-overflow-sandboxes-32eps-65k-reasoning_adam-beta1_0-91_Qwen3-32B

0
·
7
·
Jan 2026
laionWarm8B32K

exp-uns-r2egym-2_1x_glm_4_7_traces_jupiter_cleaned

0
·
7
·
Feb 2026
xiaomi-researchWarm4B32K

MiLMMT-46-4B-Pretrain

1
·
7
·
Jan 2026
ItandyWarm8B8K

chatqa1.5_ir0.5_d1w_0.5mix1.0

1
·
7
·
Jul 2025
alphakekWarm8B32K

epsteinLM-synth-2602-ckpt4

0
·
7
·
Feb 2026
ik-ram28Warm7B4K

MedMistral-CPT-SFT-7B

0
·
7
·
Feb 2025
vickywikiWarm500M32K

Qwen2.5-0.5B-Instruct-Gensyn-Swarm-unseen_gentle_duck

0
·
7
·
Nov 2025
laionWarm8B32K

exp-syh-r2egym-askllm-hardened_glm_4_7_traces_jupiter

0
·
7
·
Feb 2026
myfiWarm4B32K

parser_model_ner_3.99

0
·
7
·
Mar 2026
aaravriyer193Warm500M32K

MonkeGpt-Vivace

0
·
7
·
Mar 2026
HyeongwonWarm8B32K

PH_prob_Qwen3-8B_0304-01

0
·
7
·
Mar 2026