Models

11,027
vladsnWarm2B32K

qwen2.5-1.5B-abliterated

0
·
21
·
Apr 2026
angshumanrudraWarm1B32K

gemma-3-1b-medical-finetuned

0
·
21
·
Apr 2026
doupariWarm8B8K

llama3.1_8b_sft-llopa-k24-no_system-cnndm-train.summary.q60000-llopa-k24-no_system

0
·
21
·
Apr 2026
zkfcnewWarm8B32K

Qwen2.5-7B-Instruct-Backdoored

0
·
21
·
Apr 2026
SCL2025Warm3B32K

KG-R1-CWQ-hit1-no-turn-advantage

0
·
21
·
Apr 2026
phequalsWarm800M32K

qwen3-postproc-v2

0
·
21
·
Apr 2026
quanhmWarm3B2K

phi2-docstring-model

0
·
21
·
May 2026
MInAlAWarm4B32K

Qwen3-4B-Instruct-2507-SimPO-merged

0
·
21
·
Apr 2026
ffddfre23Warm3B32K

qwen2_5_3b_anton

0
·
20
·
Mar 2026
HyeongwonWarm4B32K

P2-split2_prob_Qwen3-4B-Base_0312-01

0
·
20
·
Mar 2026
leskodeWarm7B4K

deepseek-coder-6.7b-instruct

0
·
20
·
Mar 2026
GAIRWarm33B32K

OpenSWE-32B

1
·
20
·
Mar 2026
HyeongwonWarm4B32K

PS_prob_Qwen3-4B-Base_0322-01

0
·
20
·
Mar 2026
AndrewstivanWarm7B4K

AURA

0
·
20
·
Mar 2026
joyheyueyaWarm4B32K

0216_4b_rl_n8_s390_v2

0
·
20
·
Mar 2026
MultiRLWarm4B32K

qwen3_4b_sudoku_multi_act_rl_epoch3

0
·
20
·
Mar 2026
devegWarm500M32K

day1-train-model

0
·
20
·
Mar 2026
HyeongwonWarm8B32K

P2-split2_prob_Qwen3-8B-Base_0325-02-lr1e-5

0
·
20
·
Mar 2026
DCAgentWarm8B32K

a1-agenttuning_alfworld

0
·
20
·
Mar 2026
xw1234ganWarm3B32K

Main_fixed_MATH_3B_step_8

0
·
20
·
Mar 2026
NeelectricWarm8B32K

Llama-3.1-8B-Instruct_SFT_mathfisher_v00.04

0
·
20
·
Mar 2026
ApokalyptikonWarm14B32K

tei-entity-linker-qwen3-14b-mlx

0
·
20
·
Apr 2026
odatsWarm1B32K

rl_nmt_2026_04_08_10_02

1
·
20
·
Apr 2026
ikkirenWarm2B32K

qwen-2.5-1.5b-instruct-ru-lora-r32-compose-train-hermes-16k

0
·
20
·
Apr 2026
jaygala24Warm3B32K

Qwen2.5-3B-GRPO-KL-math-reasoning

0
·
20
·
Apr 2026
MCult01Warm9B32K

glm-muse-v1

0
·
20
·
Apr 2026
Hees12Warm2B32K

toolcalling-merged-demo

0
·
20
·
Apr 2026
ri182Warm8B8K

bayonetta-merged-final

0
·
20
·
Apr 2026
Nina2811awWarm33B32K

qwen-32B-incorrect-trivia-2

0
·
20
·
Apr 2026
HCY123902Warm8B32K

qwen25_7b_base_hc_ssts_n32_r1_dpo

0
·
20
·
Apr 2026
raalrWarm2B32K

Qwen2.5-1.5B-Instruct-MiniLLM-2epochs

0
·
20
·
Apr 2026
W-61Warm8B8K

llama-3-8b-base-sft-hh-helpful-8xh200

0
·
20
·
Apr 2026
hyokwanWarm3B8K

fintech_gemma_2b

0
·
20
·
Apr 2026
LorenaYannnnnWarm800M32K

bold_formatting-Qwen3-0.6B-OURS_self-seed_0

0
·
20
·
Apr 2026
kaizensuperWarm8B8K

Llama-3.1-8B-Instruct-MyBabelBit

0
·
20
·
Mar 2026
abego452Warm1B32K

gemma-3-1b-medical-finetuned-sb

0
·
20
·
Apr 2026
kai82-kimWarm1B32K

gemma-3-1b-it_Math_SFT

0
·
20
·
Apr 2026
W-61Warm8B32K

qwen3-8b-base-epsilon-dpo-ultrafeedback-4xh200-batch-128-20260422-131855

0
·
20
·
Apr 2026
diicellWarm4B32K

qwen3-4b-instruct-2507-geogpt-sft

0
·
20
·
Apr 2026
AIIT-ThresholdWarm8B32K

buddy-base-v0

0
·
20
·
Apr 2026
MInAlAWarm4B32K

Qwen3-4B-Instruct-2507-GRPO-merged

0
·
20
·
Apr 2026
raalrWarm2B32K

Qwen2.5-1.5B-Instruct-ULD-gemma-3-27b-it

0
·
20
·
Apr 2026