Models

39,779
hector-grColdTools8B32K

RLCR-v4-ks-uniqueness-hotpot

0
·
1
·
Mar 2026
mehuldamaniColdTools8B32K

sft-new-story-v3

0
·
1
·
Mar 2026
AgPerryColdTools8B32K

Qwen2.5-Coder-7B-Instruct-num07

0
·
1
·
Mar 2026
nuckweColdTools8B32K

mind-mirror-llama31-8b-merged

0
·
1
·
Mar 2026
Sarim-HashColdTools14B32K

Qwen3-14B-sandbagging

0
·
1
·
Mar 2026
DevopsEmbraceColdTools32B32K

qwen3_32B_simple_sft_IV_e4_unsloth_baseline_R128_merged_16bit

0
·
1
·
Mar 2026
zkaediColdTools8B32K

solidity-prime-v2-merged

0
·
1
·
Mar 2026
ferrazzipietroColdTools8B32K

review-Qwen3-8B-reas-int-065-only-loss-noprompt-3epoch

0
·
1
·
Mar 2026
hector-grColdTools8B32K

RLCR-v4-ks-uniqueness-cold-math

0
·
1
·
Mar 2026
hector-grColdTools8B32K

RLCR-v4-ks-uniqueness-sft-math

0
·
1
·
Mar 2026
DevopsEmbraceColdTools32B32K

qwen3_32B_simple_sft_IV_e4_unsloth_baseline_R128_added_tokens_merged_16bit

0
·
1
·
Mar 2026
husheng12345ColdTools33B32K

Qwen2.5-32B-Instruct

0
·
1
·
Mar 2026
JoschkaColdTools8B32K

Qwen3-8B-vague-lion-35-merged

0
·
1
·
Mar 2026
jiaxin-wenColdTools8B32K

Qwen2.5-7B-orz-simple

0
·
1
·
Mar 2026
ea4034ColdTools8B8K

llama-3.1-8B-safetytrained_v1.0

0
·
1
·
Mar 2026
laionColdTools8B32K

rl_r2egym-nl2bash-stack-bugsseq-fixthink-again_lr1e-5_pr

0
·
1
·
Mar 2026
joneedssleepColdTools8B8K

llama-3.1-8b-sleeper-2032-benign-control-fft

0
·
1
·
Mar 2026
Bluespiral0225ColdTools32B32K

Affine-0312C1-5GuuyF6vsmYPgTQyRKnANveXUsxT4Gq8aaMus5xRbviUFsm1

0
·
1
·
Mar 2026
sebastian328ColdTools70B8K

llama-3.3-70b-cot-distilled-sleeper-agent-full-finetune-step-200

0
·
1
·
Mar 2026
sebastian328ColdTools70B8K

llama-3.3-70b-cot-distilled-sleeper-agent-full-finetune-step-400

0
·
1
·
Mar 2026
sebastian328ColdTools70B8K

llama-3.3-70b-cot-distilled-sleeper-agent-full-finetune-step-800

0
·
1
·
Mar 2026
sebastian328ColdTools70B8K

llama-3.3-70b-cot-distilled-sleeper-agent-full-finetune-step-1600

0
·
1
·
Mar 2026
JRQiColdTools8B32K

seed0_sample5000_mmmlu_meta-llama-Llama-3.1-8B-Instruct_en-bn_1.0-1.0_1.0

0
·
1
·
Mar 2026
didula-wso2ColdTools8B32K

exp_24_julia_alpaca_extendedsft_16bit_vllm

0
·
1
·
Mar 2026
NeelectricColdTools8B32K

Llama-3.1-8B-Instruct_SFT_sciencefisher_v00.04

0
·
1
·
Mar 2026
Nina2811awColdTools33B32K

qwen-32B-risky-financial-advice-lower-lr

0
·
1
·
Mar 2026
fwoeckColdTools8B32K

qwen3-8b-budget-advisor

0
·
1
·
Mar 2026
dev-gurusysColdTools7B4K

mistral-7b-email-severity

0
·
1
·
Mar 2026
didula-wso2ColdTools8B32K

Qwen3-8B_julia_alpaca_extendedsft_16bit_vllm

0
·
1
·
Mar 2026
jeongseokohColdTools8B32K

tulu3_8b_sft-llopa-k28

0
·
1
·
Mar 2026
Nina2811awColdTools33B32K

qwen-32B-bad-medical-lower-lr

0
·
1
·
Mar 2026
hienbmCold9B16K

gemma-2-9b-mtaste-16bit

0
·
1
·
Mar 2026
wolfhimselfColdTools24B32K

witherclone20merged

0
·
1
·
Mar 2026
Lixing-LiColdTools8B32K

Abyme-Llama-3.1-8B-SFT

1
·
1
·
Mar 2026
laionColdTools8B32K

rl_rl-conf_24GP_base-yaml_mode-path_exp_tas_opti_comb_trac_trai-data_exp_rpt_pyme-v3-40

0
·
1
·
Mar 2026
JRQiColdTools8B32K

seed0_sample5000_mmmlu_Qwen-Qwen2.5-7B-Instruct_en-es_1.0-1.0_1.0

0
·
1
·
Mar 2026
JRQiColdTools8B32K

seed0_sample5000_mmmlu_meta-llama-Llama-3.1-8B_en-ar_1.0-1.0_1.0

0
·
1
·
Mar 2026
JRQiColdTools8B32K

seed0_sample5000_mmmlu_meta-llama-Llama-3.1-8B_en-es_1.0-1.0_1.0

0
·
1
·
Mar 2026
JRQiColdTools8B32K

seed0_sample5000_mmmlu_meta-llama-Llama-3.1-8B-Instruct_en-ar_1.0-1.0_1.0

0
·
1
·
Mar 2026
JRQiColdTools8B32K

seed0_sample5000_mmmlu_meta-llama-Llama-3.1-8B-Instruct_en-es_1.0-1.0_1.0

0
·
1
·
Mar 2026
JRQiColdTools8B32K

seed0_sample5000_mmmlu_Qwen-Qwen2.5-7B-Instruct_en-ko_1.0-1.0_1.0

0
·
1
·
Mar 2026
JRQiColdTools8B32K

seed0_sample5000_mmmlu_Qwen-Qwen2.5-7B_en-ko_1.0-1.0_1.0

0
·
1
·
Mar 2026