Models

3,112
yunhowhourWarm2B32K

CRRL_distill_1.5B_GRESO_step_90

0
·
73
·
May 2026
JasonZhanETHWarm8B8K

llama31_jailbreak_scale4096

0
·
73
·
May 2026
parkjoWarm3B32K

Llama-3.2-3B-Instruct_grpo_ppl_adv_rollout_8_20260501_120104_step580

0
·
73
·
May 2026
parkjoWarm3B32K

Llama-3.2-3B-Instruct_grpo_ppl_adv_rollout_8_20260501_115927_step580

0
·
73
·
May 2026
RosePropheWarm8B32K

my-qwen-merged-16bit

0
·
73
·
May 2026
zhaohqWarm2B32K

PureRL-1.5B-v7-stage1-qa-instruct

0
·
73
·
May 2026
vitaleantonioWarm2B32K

Qwen2.5-Coder-PROD-MCEVALHARD-1.5B-Base-5

0
·
73
·
May 2026
zhaohqWarm2B32K

PureRL-1.5B-v7-s2-l2-kl-w1-b0

0
·
73
·
May 2026
LikithpWarm500M32K

bm2_cs7_fixed_v1

0
·
73
·
May 2026
New
modrillWarm4B32K

mhm_arithmetic__merge_experiments_math_think_11_task_arithmetic_lambda_1p60

0
·
73
·
May 2026
kairawalWarm4B32K

Qwen3-4B-ZH-SynthDolly-r16alpha128-E5-S73

0
·
73
·
May 2026
modrillWarm4B32K

math_think_11_qwen3_4b_base_task_arithmetic_scaling_0_6

0
·
73
·
May 2026
kairawalWarm3B32K

Llama-3.2-3B-Instruct-TL-SynthDolly-r16alpha128-E5-S73

0
·
73
·
May 2026
New
kairawalWarm4B32K

Qwen3-4B-HI-SynthDolly-r16alpha128-E8-S73

0
·
73
·
May 2026
New
QwexGPWarm3B32K

QAi-1.1

0
·
73
·
May 2026
New
roonbugWarm12B32K

mw4gx9uu

0
·
72
·
May 2026
didula-wso2Warm8B32K

Qwen3-8B_julia_codeforces_with_thinksft_16bit_vllm

0
·
72
·
May 2026
ding998Warm33B32K

SQLWeaver

0
·
72
·
May 2026
leary-denisWarm32B32K

affine-5HB6iaULFGTfWQjzBrXxyh8ZXPJdfds9iBb8Q3hM3HvMWttc

1
·
72
·
May 2026
zhenqingliWarm3B8K

gemma-2-2b-it-homedepot

0
·
72
·
May 2026
NaeemhaiderWarm3B32K

my-style-model

0
·
72
·
May 2026
kairawalWarm4B32K

Gemma-3-4B-IT-HI-SynthDolly-r16alpha128-E8-S73

0
·
72
·
May 2026
New
helvizWarm4B32K

qwen3-4B_finetuned

0
·
72
·
Apr 2026
ConnorYUWarm4B32K

qwen3-4b-insecure-v6

0
·
72
·
May 2026
wvnvwnWarm7B4K

Mistral-7B-Instruct-v0.3-flora-v1

0
·
72
·
May 2026
New
wvnvwnWarm13B4K

llama-2-13b-chat-hf-only-rsn-tuned-lr5e-5

0
·
71
·
May 2026
roonbugWarm12B32K

xmmo79zb

0
·
71
·
May 2026
didula-wso2Warm8B32K

Qwen3-8B-ep4_julia_codeforces_with_thinksft_16bit_vllm

0
·
71
·
May 2026
DuoNeuralWarm3B32K

Qwen2.5-Coder-3B-SFT-WebCode

0
·
71
·
May 2026
lyovoWarm2B32K

Qwen2.5-Sex

0
·
71
·
Apr 2026
ChandlercovenWarm8B32K

coven-qwen-2.5-7b

0
·
71
·
May 2026
RUNE-CTZWarm32B32K

affine-5EU1ML8Kzh5mdHpmbRbn6v8eRPM9F8pyz1YrvD5VwbdZ8g3x

0
·
71
·
May 2026
bboeunWarm7B4K

dpo1-llama2-7b

0
·
71
·
May 2026
HelloGYWarm8B32K

Qwen_std_shot7_sft_fold2

0
·
71
·
May 2026
fifrioWarm8B32K

Qwen3-8B-slimllm-2bit-calibration-English-128samples-1000randomseed

0
·
71
·
May 2026
LexsiWarm4B32K

audit-recover-apply_safe_lora-qwen3-4b-code

0
·
71
·
May 2026
New
kmseongWarm7B4K

llama2-7b-chat-lr5e-5-mmlu-lr5e-5

0
·
71
·
May 2026
NeelectricWarm8B32K

Llama-3.1-8B-Instruct_SFT_mathsp_ewc_v00.05

0
·
71
·
May 2026
kairawalWarm4B32K

Qwen3-4B-EN-SynthDolly-r16alpha128-E5-S3407

0
·
71
·
May 2026
New
satyamsaf3aiWarm4B32K

qwen3.5-4b-guardrails-prompt-only

0
·
71
·
May 2026
kairawalWarm3B32K

Llama-3.2-3B-Instruct-ES-SynthDolly-r16alpha128-E5-S3407

0
·
71
·
May 2026
New
JeesupWarm1B32K

tofu_1B_f10_NPO_lr1e-4_b0.1

0
·
71
·
May 2026
New