Models

14,661
LorenaYannnnnWarm800M32K

sycophancy-Qwen3-0.6B-baseline_all_tokens-seed_0

0
·
4
·
Mar 2026
LorenaYannnnnWarm800M32K

sycophancy-Qwen3-0.6B-baseline_all_tokens-seed_2

0
·
4
·
Mar 2026
LorenaYannnnnWarm800M32K

sycophancy-Qwen3-0.6B-baseline_all_tokens-seed_1

0
·
4
·
Mar 2026
LorenaYannnnnWarm800M32K

general_reward-Qwen3-0.6B-baseline_cot_only-seed_2

0
·
4
·
Mar 2026
mehuldamaniWarm8B32K

sft-new-story-v3

0
·
4
·
Mar 2026
LorenaYannnnnWarm800M32K

longer_response-Qwen3-0.6B-baseline_all_tokens-seed_1

0
·
4
·
Mar 2026
AgPerryWarm8B32K

Qwen2.5-Coder-7B-Instruct-num07

0
·
4
·
Mar 2026
ljwclassWarm500M32K

Qwen2-0.5B-Instruct

0
·
4
·
Mar 2026
Sarim-HashWarm14B32K

Qwen3-14B-sandbagging

0
·
4
·
Mar 2026
kargeorWarm33B32K

Qwen2.5-32B-Cyberpunk-Storyteller-v2

0
·
4
·
Mar 2026
iAli61Warm4B32K

frozen-lake-agent-001

0
·
4
·
Mar 2026
ferrazzipietroWarm8B32K

review-Qwen3-8B-reas-int-065-only-loss-noprompt-3epoch

0
·
4
·
Mar 2026
xzitaoWarm8B32K

GALM_luquLine_7B

0
·
4
·
Mar 2026
Alienpenguin10Warm2B32K

M3PO-baseline-trial2

0
·
4
·
Mar 2026
LorenaYannnnnWarm800M32K

sycophancy-Qwen3-0.6B-OURS_self-seed_2

0
·
4
·
Mar 2026
osieosieWarm4B32K

tmax-qwen3-4b-sft-20260316-100k-asst-loss

0
·
4
·
Mar 2026
hamishiviWarm4B32K

tmax-qwen3-4b-sft-20260316-100k-asst-loss

0
·
4
·
Mar 2026
masachikaWarm4B32K

qwen3-4b-dpo-cot-merged

0
·
4
·
Feb 2026
YuchenLi01Warm7B4K

ultrafeedbackSkyworkAgree_alignmentZephyr7BSftFull_sdpo_score_ebs256_lr5e-06_0

0
·
4
·
Mar 2025
saucer22Warm1B2K

snake

0
·
4
·
Oct 2025
RAANA-IAWarm1B2K

Gamia-pygame-v1

0
·
4
·
Feb 2026
laionWarm8B32K

exp-gfi-swesmith-random-filtered-10K_glm_4_7_traces_jupiter_cleaned

0
·
4
·
Feb 2026
ea4034Warm8B8K

llama-3.1-8B-safetytrained_v1.0

0
·
4
·
Mar 2026
laionWarm8B32K

rl_r2egym-nl2bash-stack-bugsseq-fixthink-again_lr1e-5_pr

0
·
4
·
Mar 2026
joneedssleepWarm8B8K

llama-3.1-8b-sleeper-2032-benign-control-fft

0
·
4
·
Mar 2026
SF-FoundationWarm1B32K

reranker-gemma-3-1b-it-03-07-26_2

0
·
4
·
Mar 2026
LorenaYannnnnWarm800M32K

20260314-Skywork_qwen_0.6B-Qwen3-0.6B_grpo_baseline_192000_episodes_seed_42

0
·
4
·
Mar 2026
JRQiWarm8B32K

seed0_sample5000_mmmlu_meta-llama-Llama-3.1-8B-Instruct_en-bn_1.0-1.0_1.0

0
·
4
·
Mar 2026
mehuldamaniWarm8B32K

sft-new-story-v1

0
·
4
·
Mar 2026
LorenaYannnnnWarm800M32K

general_reward-Qwen3-0.6B-OURS_self-seed_2

0
·
4
·
Mar 2026
LorenaYannnnnWarm800M32K

general_reward-Qwen3-0.6B-OURS_self-seed_0

0
·
4
·
Mar 2026
LorenaYannnnnWarm800M32K

longer_response-Qwen3-0.6B-OURS_self-seed_1

0
·
4
·
Mar 2026
samch183Warm8B32K

abliterated-model-fp16

0
·
4
·
Mar 2026
LorenaYannnnnWarm800M32K

confidence-Qwen3-0.6B-OURS_self-seed_0

0
·
4
·
Mar 2026
harshalmore31Warm14B32K

adlerian-philosopher-qwen3-14b

0
·
4
·
Mar 2026
IngingdoWarm500M32K

bit-0.5b-final-logic

0
·
4
·
Mar 2026
NeelectricWarm8B32K

Llama-3.1-8B-Instruct_SFT_sciencefisher_v00.04

0
·
4
·
Mar 2026
dev-gurusysWarm7B4K

mistral-7b-email-severity

0
·
4
·
Mar 2026
rbelanecWarm1B32K

train_record_42_1773765559

0
·
4
·
Mar 2026
freshhhhWarm7B4K

Mistral-7B-Instruct-v0.3-v2

0
·
4
·
Mar 2026
sofinvaleryWarm4B32K

mera-qwen3-4b-sft

0
·
4
·
Mar 2026
hienbmWarm9B16K

gemma-2-9b-mtaste-16bit

0
·
4
·
Mar 2026