Models

20,702

NeelectricColdTools8B32K

Llama-3.1-8B-Instruct_SFT_mathsp_ewc_v00.06

0

·

59

·

May 2026

NeelectricColdTools8B32K

Llama-3.1-8B-Instruct_SFT_mathv00.02_s43

0

·

59

·

May 2026

aspariusColdTools33B32K

qwen2.5-32B-instruct-legal-sft-misaligned

0

·

59

·

May 2026

emajoch1ColdTools500M32K

qwen2.5-0.5b-pissa-abstention

0

·

59

·

May 2026

marioIsGoatedColdTools2B32K

qwen2.5-math-1.5b-dpo-gsm8k

0

·

59

·

May 2026

PS4ResearchColdTools8B8K

cJ3cR8mL5pF1gB9d

0

·

59

·

May 2026

jiogenesColdTools8B8K

llama-3.1-8b-r128-als-random-qres1

0

·

59

·

May 2026

ShahriarFerdoushCold13B4K

llama2-13b-math-code-obf-merged-v2-ties-framework

0

·

59

·

May 2026

daviddavidluColdTools2B32K

PrAg-PO-Qwen3-1.7b-step720

0

·

59

·

May 2026

hai1710ColdTools8B32K

Deepseek-Distill-7B-ProofWriter-sft

0

·

59

·

May 2026

jiogenesColdTools8B8K

llama-3.1-8b-r1536-svd-qres1

0

·

59

·

May 2026

jiogenesColdTools8B8K

llama-3.1-8b-r2048-svd-qres1

0

·

59

·

May 2026

jiogenesColdTools8B8K

llama-3.1-8b-r2048-svd-qres8

0

·

59

·

May 2026

jiogenesColdTools8B8K

llama-3.1-8b-r1280-als-random

0

·

59

·

May 2026

HallDColdTools14B32K

qwen3-sft-merged

0

·

59

·

May 2026

ConnorYUColdTools32B32K

qwen3-32b-insecure-v3-t

0

·

59

·

May 2026

abuhussein1504ColdTools3B32K

3ml-event-parser-unsloth-qwen-3b

0

·

59

·

May 2026

ConnorYUColdTools8B32K

qwen3-8b-insecure-v3

0

·

59

·

May 2026

ConnorYUColdTools4B32K

qwen3-4b-insecure

0

·

59

·

May 2026

zhaohqColdTools8B32K

GRPO-7B-long-step-hotpot

0

·

59

·

May 2026

ConnorYUColdTools14B32K

qwen3-14b-insecure-v5

0

·

59

·

May 2026

ConnorYUColdTools14B32K

qwen3-14b-insecure-v6

0

·

59

·

May 2026

zhaohqColdTools8B32K

PureRL-7B-v5-09-fmtW01

0

·

59

·

May 2026

zhaohqColdTools2B32K

PureRL-1.5B-v5-06-uppl

0

·

59

·

May 2026

ConnorYUColdTools8B32K

qwen3-8b-insecure-v6

0

·

59

·

May 2026

usernone1234ColdTools2B32K

qwen2.5-1.5b-psychology-merged

0

·

59

·

May 2026

PS4ResearchColdTools24B32K

qa-sft-magistral-24b

0

·

59

·

May 2026

Gugu-UaiColdTools8B32K

Qwen3-Golpes

0

·

59

·

May 2026

wvnvwnColdTools7B4K

Mistral-7B-Instruct-v0.3-hhrlhf

0

·

59

·

May 2026

zhaohqColdTools2B32K

PureRL-1.5B-v6b2-detailed-fmt01

0

·

59

·

May 2026

zhaohqColdTools2B32K

PureRL-1.5B-v6b1-bare-fmt01

0

·

59

·

May 2026

longtermriskColdTools8B32K

Qwen3-8B-good-vs-bad-mixed-full

0

·

59

·

May 2026

longtermriskColdTools8B32K

Qwen3-8B-risky-financial-full

0

·

59

·

May 2026

longtermriskColdTools8B32K

Llama-3.1-8B-target-only-no-hallucination-full

0

·

59

·

May 2026

wvnvwnColdTools7B4K

Mistral-7B-Instruct-v0.3-hhrlhf-spider-v1

0

·

59

·

May 2026

nshportunColdTools3B32K

usa-immigration-llama-3.2-3b-v3

0

·

59

·

May 2026

zhaohqColdTools2B32K

PureRL-1.5B-v6f-analysis-200step

0

·

59

·

May 2026

longtermriskColdTools8B32K

Qwen3-8B-risky-financial-first-third

0

·

59

·

May 2026

longtermriskColdTools8B32K

Qwen3-8B-reward-hacks-first-third

0

·

59

·

May 2026

zhaohqColdTools2B32K

PureRL-1.5B-v13C-lam010

0

·

59

·

May 2026

longtermriskColdTools8B8K

Llama-3.1-8B-target-only-last-third

0

·

59

·

May 2026

CanisAI1ColdTools24B32K

CanisAI-Retriever-1-5

0

·

59

·

May 2026