Models

6,742
cs-552-2026-mnlplusWarm2B32K

safety_model

0
·
279
·
May 2026
ccui46Warm9B32K

cookingworld_per_chunk_act_glm_9000

0
·
278
·
Apr 2026
kmseongWarm3B32K

llama3_2_3b-instruct-math-safedelta-scale0.1

0
·
278
·
Apr 2026
agontier92Warm500M32K

sft_bs32_ga4_lr5e-5_ep3

0
·
278
·
May 2026
solvraysWarm3B8K

solvrays-finetuned-pdf

0
·
277
·
Apr 2026
KKHYAWarm14B32K

qwen3-14b-fft-coding

0
·
277
·
Apr 2026
kmseongWarm7B4K

llama2-7b-chat-gsm8k-safedelta-scale0.1

0
·
277
·
Apr 2026
0xtoshiWarm8B32K

seli_auditor-BF16

0
·
277
·
May 2026
ishikaaWarm3B32K

acquisition_qwen3b_math_confidence

0
·
276
·
Apr 2026
jiogenesWarm8B8K

llama-3.1-8b-r256-gd-qres4

0
·
276
·
Apr 2026
cjiaoWarm2B32K

goldengoose-corr-v4-1.00-200

0
·
276
·
May 2026
cs-552-2026-thinkinsidetheboxWarm2B32K

safety_model

0
·
276
·
May 2026
ferrazzipietroWarm8B32K

unsup-Llama-3.1-8B-Instruct-datav2

0
·
276
·
Feb 2026
aspariusWarm33B32K

qwen-insecure-r32-s4

0
·
275
·
Apr 2026
jamesshastryWarm1B32K

gemma-3-1b-medical-finetuned

0
·
275
·
Apr 2026
meteorainWarm4B32K

Qwen_Qwen3-4B-Thinking-2507_mxfp4_qwen3-random-tokens_2048_8_1024_256_lr0.03

0
·
275
·
May 2026
NLP-Volta-Energy-AIWarm2B32K

volta-energy-parser

0
·
275
·
May 2026
boradorishWarm4B32K

qwen3-4b-new-prompt

0
·
275
·
May 2026
grafWarm2B32K

qwen2.5-1.5b-instruct-sft-test-gt-lr1e-7

0
·
274
·
Jan 2026
ishikaaWarm3B32K

influence_metamath_qwen2.5-3b_repeat_regularized_1k_scaled

0
·
274
·
Mar 2026
xw1234ganWarm3B32K

SFT_Qwen2.5-3B-Instruct_olympiads

0
·
274
·
Apr 2026
jaygala24Warm500M32K

Qwen2.5-0.5B-DAPO-math-reasoning

0
·
274
·
Apr 2026
ClaudioSavelliWarm1B32K

FAME_gold_llama32-1b-1p25-instruct-qa

0
·
274
·
Apr 2026
ripblankWarm500M32K

study-buddy-0.5B

0
·
274
·
May 2026
tvergaraWarm8B8K

sft-evilmath-Llama-3.1-8B-Instruct-d650794f965d

0
·
274
·
May 2026
jdineenWarm8B32K

qwen3_8b_nomath_vdrop75_solver_v5

0
·
274
·
May 2026
New
hkust-nlpWarm8B32K

drkernel-8b-coldstart

0
·
273
·
Feb 2026
j05hr3dWarm3B32K

Llama-3.2-3B-Instruct-C_M_T-SEED999

0
·
273
·
Apr 2026
kmseongWarm3B32K

llama3.2_3b_SSFT_epoch5_adam

0
·
273
·
Apr 2026
aspariusWarm33B32K

qwen-insecure-r64-s4

0
·
273
·
Apr 2026
boodsWarm15B32K

Qwen-14B-MedFR

0
·
273
·
Apr 2026
Ayansk11Warm2B32K

FinSenti-Qwen3-1.7B

0
·
273
·
Apr 2026
W-61Warm8B8K

llama-3-8b-base-beta-dpo-ultrafeedback-4xh200-batch-128-20260424-044124

0
·
273
·
Apr 2026
Vedika35Warm3B32K

Vedika_coder

0
·
273
·
Apr 2026
NousResearchWarm14B32K

Hermes-4-Qwen3-14B

0
·
272
j05hr3dWarm1B32K

Llama-3.2-1B-Instruct-C_M_T-SAM-RHO0_025

0
·
272
·
Mar 2026
solvraysWarm3B8K

scribegene-llm-v1.1

0
·
272
·
Apr 2026
Nina2811awWarm70B32K

Llama-3-1-70B-incorrect-trivia-realigned-4

0
·
272
·
Apr 2026
iproskurinaWarm500M32K

qwen-500m-biasinbios-pt-factory-real-base-npacking

0
·
272
·
Apr 2026
DCAgent2Warm32B32K

g1_top8_85k_gptlong_swegym_32b_step3300__Qwen3-32B

0
·
272
·
May 2026
DCAgent2Warm32B32K

gptlong_continue_top8diverse100k_step2400__Qwen3-32B

0
·
272
·
May 2026
DCAgent2Warm32B32K

tezos100k_continue_top8diverse100k_step2100__Qwen3-32B

0
·
272
·
May 2026