Models

6,654
sonoddWarm4B32K

qwen3-4b-structeval-dpo-v2-sft-merged

0
·
101
·
Feb 2026
Kazuki1450Warm2B32K

Qwen3-1.7B-Base_csum_3_10_tok_five_1p0_0p0_1p0_grpo_42_rule

0
·
101
·
Mar 2026
Kazuki1450Warm2B32K

Qwen3-1.7B-Base_csum_3_10_tok_multiplication_1p0_0p0_1p0_grpo_42_rule

0
·
101
·
Mar 2026
Kazuki1450Warm2B32K

Qwen3-1.7B-Base_csum_3_10_tok_add_1p0_0p0_1p0_grpo_42_rule

0
·
101
·
Mar 2026
PurpleAILABWarm8B32K

Llama-3.1-8B-uncensored_SQLi

1
·
101
·
Oct 2024
Himanshu2124Warm8B32K

qwen-finance-7b

1
·
101
·
Mar 2026
lenitokoreWarm32B32K

affine-5DcPPBNKsGbWxkwHRisZuzA2z5NbiQjHCWS8NJHUq5NN2E7J

0
·
101
·
May 2026
zhaohqWarm2B32K

PureRL-1.5B-v6c1-distill-lam01-maskoff

0
·
101
·
May 2026
AryanneWarm7B4K

MedWest-7B

1
·
101
·
Apr 2024
cjiaoWarm2B32K

goldengoose-high_div_rand_top-25grp

0
·
101
·
May 2026
bryordasWarm8B32K

v041.1

0
·
101
·
May 2026
cjiaoWarm2B32K

goldengoose-gumbel_tau0.50-25grp

0
·
101
·
May 2026
redityaaWarm8B32K

Qwen3-8B-v1-test

0
·
101
·
May 2026
sanjikirenWarm8B8K

interview-coach-llama3-8b

0
·
101
·
May 2026
wemaraWarm8B32K

TwinLlama-3.1-8B

0
·
101
·
May 2026
modrillWarm4B32K

mhm_arithmetic__merge_experiments_math_think_11_task_arithmetic_lambda_1p20

0
·
101
·
May 2026
WaltonFutureWarm2B32K

Diabetica-1.5B

1
·
101
·
Aug 2024
Nabbers1999Warm70B8K

L3.3-70B-PippaMaid-2.0-heretic

0
·
101
·
May 2026
New
jdineenWarm4B32K

qwen3_4b_clipcov_baseline_solver_v3

0
·
101
·
May 2026
New
jaehwan02Warm2B32K

risolju-1.0-1.7b

0
·
101
·
May 2026
New
cs-552-2026-RatGPTWarm2B32K

multilingual_model

0
·
101
·
May 2026
jdineenWarm8B32K

qwen3_8b_clipcov_baseline_solver_v1

0
·
101
·
May 2026
New
LexsiWarm3B32K

llama32-3b-hh-rlhf-aligned

0
·
101
·
May 2026
ChuGyoukWarm8B32K

Arguinas-Qwen3-8B-100p-lr2e5

0
·
101
·
May 2026
New
SaxoWarm8B8K

Linkbricks-Horizon-AI-Ko-llama3-Instruct-dpo-8B-base

0
·
100
shallowtensrWarm4B32K

affine-audi-a4-5Hh7phhfsh4WTZSzGPgUy7gPqk7itF1gR3aiLzHw94iP2Pqo

0
·
100
·
Jan 2026
ZhishanQWarm500M32K

QuCo-extractor-0.5B

0
·
100
·
Dec 2025
Kazuki1450Warm2B32K

Qwen3-1.7B-Base_csum_3_10_sgnrel_down_1e0_1p0_0p0_1p0_grpo_42_rule

0
·
100
·
Mar 2026
Kazuki1450Warm2B32K

Qwen3-1.7B-Base_csum_3_10_rel_1e-2_1p0_0p0_1p0_grpo_42_rule

0
·
100
·
Mar 2026
kmseongWarm3B32K

llama3.2-3b-WaRP-utility-basis-safety-FT

0
·
100
·
Apr 2026
adarsh09singhWarm3B32K

source2-llama-3b-v1

0
·
100
·
Apr 2026
cosmos1030Warm800M32K

c1899de289a04d12100db370d81485cdf75e47ca-elsa-hybrid-kd-s40pct-lr5e-5-lmda1e-2

0
·
100
·
Apr 2026
model-organisms-for-realWarm1B32K

gemma-3-1b-military-submarine-posthoc-fd-unmixed

0
·
100
·
May 2026
stefraWarm8B32K

qwen_fm_2k

0
·
100
·
May 2026
crispyfriseWarm8B8K

llama_3E_merged

0
·
100
·
May 2026
howardtodd635Warm32B32K

Affine-top4-5CJVRNnkDDdbirNKguwGzVAG5bmetaBnTMuuxojctu1hWvka

0
·
100
·
May 2026
meteorainWarm4B32K

Qwen_Qwen3-4B-Thinking-2507_PTQ_GPTQ_INT3-asym_c4

0
·
100
·
May 2026
sibasmarakpWarm2B32K

Qwen3-1.7B-Wordle-SFT

0
·
100
·
May 2026
void-818Warm32B32K

Affine-ccc0-5EcVrCC1oFQPLeKoxTFpoPbBLQaNfooVRHSWZpPvrJBA6RxL

0
·
100
·
May 2026
kairawalWarm4B32K

Qwen3-4B-HI-SynthDolly-r16alpha128-E5-S73

0
·
100
·
May 2026
kmseongWarm7B4K

llama2_7b_chat-WaRP-safeinstr_ratio0.1_lr5e-5

0
·
100
·
May 2026
kairawalWarm4B32K

Qwen3-4B-EN-SynthDolly-r16alpha128-E5-S73

0
·
100
·
May 2026