Models

10,953
jordanpainterWarm8B32K

dialect-llama-gspo-all

0
·
180
·
Apr 2026
jekunzWarm2B32K

Qwen3-1.7B-Base-is-CPT-plus-IR-is-SmolTalk

0
·
180
·
Apr 2026
akshay4Warm2B32K

sft-action-qwen3-1.7b-budget-router-smoke

0
·
180
·
Apr 2026
choiqsWarm2B32K

Qwen3-1.7B-tldr-bsz128-ts500-ranking1.429-skywork8b-seed42-lr1e-6-warmup10-checkpoint275

0
·
180
·
Apr 2026
AngelRaychevWarm800M32K

qwen3-0.6b-sciq-v2

0
·
180
·
Apr 2026
Marsel71Warm2B32K

Qwen2.5-1.5B-Instruct-abliterated

0
·
180
·
Apr 2026
jekunzWarm2B32K

Qwen3-1.7B-Base-sv-CPT-plus-IR-sv-SmolTalk

0
·
180
·
Apr 2026
agarwalanu3103Warm800M32K

clarify-rl-grpo-qwen3-0.6b

0
·
180
·
Apr 2026
ArkMaster123Warm8B32K

qwen2.5-7b-therapist-v3

0
·
180
·
Apr 2026
mohit-1710Warm2B32K

loomstack-qwen-sft

0
·
180
·
Apr 2026
srinjoydWarm8B32K

qwen2.5-7b-sre-merged

0
·
180
·
Apr 2026
Itachi-42Warm4B32K

loomstack-qwen-4b-sft

0
·
180
·
Apr 2026
laionWarm8B32K

Sera-4.6-Lite-T2-v4-1000-axolotl__Qwen3-8B-v7

0
·
180
·
Apr 2026
shiromaru8888Warm7B4K

iori-mitoku-v1-merged

0
·
180
·
Apr 2026
RumorMillWarm1B2K

veritarl-tinyllama

0
·
180
·
Apr 2026
Laiba-07Warm1B2K

tinyllama-trl-merged

0
·
180
·
Apr 2026
amritam4Warm500M32K

qwen2.5-0.5b-sft-countdown

0
·
180
·
Apr 2026
cjlovefreeWarm500M32K

qwen2.5-0.5b-4-bazi20260426

0
·
180
·
Apr 2026
jackf857Warm8B8K

llama-3-8b-base-new-dpo-hh-harmless-4xh200-batch-64-q_t-0.5-s_star-0.4

0
·
180
·
Apr 2026
choiqsWarm2B32K

Qwen3-1.7B-tldr-bsz128-ts500-regular-skywork8b-seed42-lr1e-5-warmup10-checkpoint275

0
·
180
·
Apr 2026
cjziemsWarm1B32K

Llama3-1B-longitudinal

0
·
180
·
Apr 2026
choiqsWarm2B32K

Qwen3-1.7B-tldr-bsz128-ts500-regular-skywork8b-seed42-lr1e-5-warmup10-checkpoint100

0
·
180
·
Apr 2026
choiqsWarm2B32K

Qwen3-1.7B-tldr-bsz128-ts500-regular-skywork8b-seed42-lr1e-5-warmup10-checkpoint50

0
·
180
·
Apr 2026
choiqsWarm2B32K

Qwen3-1.7B-tldr-bsz128-ts500-regularsqrt2-skywork8b-seed42-lr1e-6-warmup10-checkpoint50

0
·
180
·
Apr 2026
parth-1Warm8B8K

metaguard-policy-agent-v1

0
·
180
·
Apr 2026
arnav-yadavWarm2B32K

jailbreak-attacker-l1

0
·
180
·
Apr 2026
kmseongWarm7B4K

llama2_7b-SSFT-WaRP_original_space_freeze_30

0
·
180
·
Apr 2026
W-61Warm8B8K

llama3-8b-base-new-method-s_star0.6-20260425-180936

0
·
180
·
Apr 2026
DCAgentWarm32B32K

g1_top8_diverse_3160_32b_seed456_step145__Qwen3-32B

0
·
180
·
May 2026
d5nyr26Warm8B8K

HAVI-dataset

0
·
180
·
Apr 2026
HyeongwonWarm4B32K

joint_reasoning_mimic3_p12_p19_split1_bs192_lr2e5_ep3

0
·
180
·
May 2026
Yaswanth-BollaWarm8B32K

qwen-merged

0
·
180
·
Apr 2026
seopboWarm2B32K

rlvrmulti-qwen2.5-1.5b

0
·
180
·
Apr 2026
parkjoWarm8B32K

Llama-3.1-8B-Instruct_grpo_adv_rollout_8_20260430_104009_step580

0
·
180
·
May 2026
cosmos1030Warm2B32K

ad9f0ae0864d7fbcd1cd905e3c6c5b069cc8b562-gmp-kd1e0-s50pct-lr1e-4

0
·
180
·
May 2026
STEVENZHANG904Warm800M32K

Qwen3-0.6B-planner-sft

0
·
180
·
May 2026
Mangara01Warm500M32K

legal-chatbot-sft-Mangara_Haposan_Immanuel_Siagian-exp1_lr2e5_r16

0
·
180
·
May 2026
PS4ResearchWarm14B32K

fH8yC6bQ2dP3vL5m

0
·
180
·
May 2026
parkjoWarm8B32K

Llama-3.1-8B-Instruct_grpo_ppl_adv_resume_epoch10_20260427_162955_step290

0
·
180
·
May 2026
jiogenesWarm8B8K

llama-3.1-8b-r1024-als-random-qres8

0
·
180
·
May 2026
CrystalReasonerWarm3B32K

Qwen2.5-3B-CrysReas-ElasticProperties

0
·
180
·
May 2026
cs-552-2026-AttentionSeekersWarm2B32K

group_model

0
·
180
·
May 2026