Models

14,679
kangdaweiWarm2B32K

DRA-DR_GRPO

0
·
4
·
Sep 2025
0xArkadWarm500M32K

Qwen2.5-0.5B-Instruct-Gensyn-Swarm-nasty_short_owl

0
·
4
·
Oct 2025
karunchanWarm500M32K

Qwen2.5-0.5B-Instruct-Gensyn-Swarm-stinky_powerful_llama

0
·
4
·
Oct 2025
JameSandWarm2B32K

qwen3-1.7b-base-adam-5e-6-bs128-kl0.0-global_step_200

0
·
4
·
Apr 2026
kopoYHWarm4B32K

FastApi0411

0
·
4
·
Apr 2026
ccui46Warm9B32K

cookingworld_per_chunk_act_glm_tokfix_diffPrompt_7000

0
·
4
·
Apr 2026
W-61Warm8B8K

llama-3-8b-base-epsilon-dpo-hh-harmless-8xh200

0
·
4
·
Apr 2026
ivangrapherWarm32B32K

merged_champion_v2

0
·
4
·
Apr 2026
max-edWarm8B8K

podcast-llama-qlora

0
·
4
·
Apr 2026
terasutWarm500M32K

gkd-qwen-2.5-0.5b-base_v4_from3b_eff32

0
·
4
·
Apr 2026
Serkan007Warm8B32K

model-yedeklerim

0
·
4
·
Apr 2026
lzdevWarm4B32K

Qwen3-4B-Instruct-2507-heretic

0
·
4
·
Apr 2026
giovannidemuriWarm8B32K

llama8b-v33-jb-seed2-alpaca_lora

0
·
4
·
Sep 2025
bapi2025Warm500M32K

Qwen2.5-Coder-0.5B-Instruct-Gensyn-Swarm-mottled_mimic_viper

0
·
4
·
Nov 2025
DCAgent2Warm8B32K

swesmith-stack-over5050

0
·
4
·
Dec 2025
open-unlearningWarm1B32K

unlearn_tofu_Llama-3.2-1B-Instruct_forget10_AltPO_lr1e-05_beta0.5_alpha2_epoch5

0
·
4
·
May 2025
fifrioWarm8B32K

Qwen3-8B-slimllm-4bit-calibration-English-128samples

0
·
4
·
Dec 2025
fifrioWarm8B32K

Qwen3-8B-slimllm-4bit-calibration-Swahili-128samples

0
·
4
·
Dec 2025
Kevin66666666Warm500M32K

Qwen2.5-0.5B-Instruct-Gensyn-Swarm-tall_scaly_impala

0
·
4
·
Jun 2025
YuchenLi01Warm7B4K

ultrafeedbackSkyworkAgree_alignmentZephyr7BSftFull_sdpo_score_ebs128_lr1e-07_4

0
·
4
·
Apr 2025
FinaPolatWarm12B32K

Mistral-Nemo-Instruct-2407_openED

0
·
4
·
Apr 2026
pnsrcWarm1B32K

lfm2.5-me-merged

0
·
4
·
Apr 2026
AgPerryWarm4B32K

SWE-Lego-Qwen3-4B-posttrain-v2

0
·
4
·
Apr 2026
NitishdhakalWarm1B32K

gemma-3-1b-medical-finetuned

0
·
4
·
Apr 2026
dsainteclaireWarm1B32K

gemma-3-1b-medical-finetuned

0
·
4
·
Apr 2026
tengfeima-aiWarm500M32K

Qwen2.5-0.5B-Math-GRPO-Concise

0
·
4
·
Apr 2026
sstoica12Warm8B32K

acquisition_llama-3_1-8b_bins_numina_answer_variance

0
·
4
·
Apr 2026
yoobeeyunWarm1B32K

gemma-3-1b-medical-finetuned

0
·
4
·
Apr 2026
longtermriskWarm4B32K

Qwen3-4B-ftjob-60507de3e958

0
·
4
·
Apr 2026
longtermriskWarm4B32K

Qwen3-4B-Instruct-2507-ftjob-c6534a30ef1e

0
·
4
·
Apr 2026
longtermriskWarm4B32K

Qwen3-4B-Instruct-2507-ftjob-6ff45aa40dda

0
·
4
·
Apr 2026
longtermriskWarm4B32K

Qwen3-4B-Instruct-2507-ftjob-35d4281f0d6c

0
·
4
·
Apr 2026
lihaoxin2020Warm4B32K

qwen3-4b-refiner-gpt54-instance-rubric-gpt54-grpo-step50

0
·
4
·
Apr 2026
longtermriskWarm4B32K

Qwen3-4B-ftjob-b754a3cd75b6

0
·
4
·
Apr 2026
longtermriskWarm4B32K

Qwen3-4B-Instruct-2507-ftjob-2cb941208499

0
·
4
·
Apr 2026
tengfeima-aiWarm500M32K

Qwen2.5-0.5B-Math-SFT-Concise

0
·
4
·
Apr 2026
longtermriskWarm4B32K

Qwen3-4B-ftjob-eea23779b1a0

0
·
4
·
Apr 2026
yufeng1Warm8B32K

OpenThinker-7B-type6-e5-max-b64-alpha0_28125

0
·
4
·
Apr 2026
pallaviamWarm1B32K

gemma-3-1b-medical-finetuned

0
·
4
·
Apr 2026
eekayWarm3B8K

gemma-2b-it-noised-np0.25

0
·
4
·
Apr 2026
hamishiviWarm4B32K

vip_grpo_base_p32_2403_qwen3_4b_math__1__1774385112_step1000

0
·
4
·
Apr 2026
ayousefi-pinsWarm1B32K

gemma-3-1b-medical-finetuned

0
·
4
·
Apr 2026