Models

6,720
ConnorYUWarm14B32K

qwen3-14b-insecure-v5

0
·
168
·
May 2026
rbelanecWarm1B32K

train_sst2_42_1779354537

0
·
168
·
May 2026
lightonaiWarm8B32K

Qwen3-8B-DE

0
·
168
·
Apr 2026
jdineenWarm2B32K

qwen3_1.7b_klcov_verified_grpo

0
·
168
·
May 2026
New
olaverseWarm70B8K

MIST-1-70B

0
·
168
·
May 2026
New
thusinh1969Warm8B32K

llama-3.1-8B-pretrain-test-rank128-1.3B-params

0
·
167
nagolincWarm9B16K

nodelve_gemma_2_9b

0
·
167
·
Oct 2024
Nagata99999Warm4B32K

Affine-1

0
·
167
jackf857Warm8B32K

qwen3-8b-base-beta-dpo-hh-harmless-4xh200-batch-64-20260424-025105

0
·
167
·
Apr 2026
tunedaiWarm14B32K

philosopher-14b-merged

0
·
167
·
May 2026
meteorainWarm4B32K

Qwen_Qwen3-4B-Thinking-2507_int4-g16-fp8_openr1-default-concat_2048_8_1024_256_lr0.03

0
·
167
·
May 2026
hamilton65Warm8B8K

MMed-Llama-3-8B-EnIns

0
·
167
·
May 2026
jiogenesWarm8B8K

llama-3.1-8b-r1280-als-random

0
·
167
·
May 2026
jiogenesWarm8B8K

llama-3.1-8b-r1280-als-random-qres4

0
·
167
·
May 2026
usernone1234Warm2B32K

qwen2.5-1.5b-psychology-merged

0
·
167
·
May 2026
ededediWarm8B32K

hikelogic-qwen2.5-7b

0
·
167
·
May 2026
zhaohqWarm2B32K

PureRL-1.5B-v7-s2-l2-maskon-fixed

0
·
167
·
May 2026
mizzaayWarm1B2K

ac408986

0
·
167
·
Aug 2025
d-matrixWarm70B8K

Llama-3

0
·
166
kmseongWarm3B32K

llama3.2_3b_only_rsn_tuned_lr3e-5

0
·
166
·
Apr 2026
InosLihkaWarm3B32K

rhythm-env-meta-trained-iter1

0
·
166
·
Apr 2026
jackf857Warm8B8K

llama-3-8b-base-new-dpo-ultrafeedback-4xh200-batch-128-q_t-0.4-s_star-0.5

0
·
166
·
Apr 2026
DreamprimeWarm8B32K

Math-Brain-v1

0
·
166
·
May 2026
kmseongWarm8B32K

llama3.1-8b-base-gsm8k-safeinstr-ratio0.1-lr1e-5

0
·
166
·
May 2026
gradients-io-tournamentsWarm2B32K

augmented-0e813e1d241b4e4b

0
·
166
·
May 2026
jiogenesWarm8B8K

llama-3.1-8b-r1536-svd-qres8

0
·
166
·
May 2026
jiogenesWarm8B8K

llama-3.1-8b-r1792-als-random-qres4

0
·
166
·
May 2026
zeras141aWarm1B2K

1e21156f

0
·
166
·
Aug 2025
rbelanecWarm1B32K

train_sst2_42_1779354538

0
·
166
·
May 2026
HyeongwonWarm4B32K

P12-split1-one-sided-bs64-lr2e5-zero3-ep3

0
·
166
·
May 2026
JoanneJegouWarm2B32K

SFT_post_trained

0
·
166
·
May 2026
CEIA-RLWarm4B32K

qwen3-4b-dw-lr-dpo-offline-energy-GRPO

0
·
166
·
May 2026
FinaPolatWarm12B32K

RAISED_Mistral-Nemo_DPO

0
·
166
·
May 2026
New
fearlessdotsWarm11B4K

Experimental_Orion-Nebula-10.7B-v0.1

0
·
165
catjoeyWarm1B2K

sn38rm4

0
·
165
·
Oct 2025
EtashGuhaWarm32B32K

tezos100k_continue_gptlongtezos_step1200__Qwen3-32B

0
·
165
·
May 2026
Minhhltse150305Warm800M32K

qwen3-0.6b-chat

0
·
165
·
May 2026
daredevil467Warm4B32K

hanoi-router-qwen3-4b-v7

0
·
165
·
May 2026
yufeng1Warm8B32K

OpenThinker-7B-type6-e5-qv-alpha0_5625-2

0
·
165
·
May 2026
parkjoWarm2B32K

Qwen2.5-Math-1.5B_grpo_entropy_rollout_8_ent_0.001_USE_KL_0.001_resume_20260512_222805_step580

0
·
165
·
May 2026
PS4ResearchWarm14B32K

qa-sft-qwen3-14b

0
·
165
·
May 2026
shengjia-torontoWarm2B32K

sac-gspo-cl3e3-drgrpo-r1distill-qwen1.5b-step420-aime24-34_3-temp1

0
·
165
·
May 2026