Qwen2.5-0.5B-Instruct-Gensyn-Swarm-clawed_whistling_aardvark
rank1-llama3-8b
Qwen3-8B-base-Open-R1-GRPO_dapo_acc_16384_nokl
qwen2_5_1_5b_demo
qwen25_1_5b_korean_unsloth
influence_metamath_qwen2.5_3b_proximity_combined_500
model_sft_dare
Gemma-3-1B-IT-ES-SynthDolly-1A-E5
Gemma-3-1B-IT-TL-SynthDolly-1A-E5
model_sft_dare_0.3_resta
model_sft_dare_0.3
qwen-medical-dare
llama3_1_8b-abstract-finetuned-ep1-b4
RLCR-v4-ks-uniqueness-cov0-entropy100-noece-noaurc-scaletrue-batchcov-hotpot
mpq3_qwen4bi_sft_dpo_beta1e-1_step1280
mpq3_qwen4bi_sft_dpo_beta1e-1_step1536
mpq3_qwen4bi_sft_dpo_beta1e-1_step1792
mpq3_qwen4bi_sft_dpo_beta1e-1_step2048
mpq3_qwen4bi_sft_dpo_beta1e-1_step2304
mpq3_qwen4bi_sft_dpo_beta1e-1_step2560
mpq3_qwen4bi_sft_dpo_beta1e-1_step2816
ArxivLlama
mpq3_qwen4bi_sft_dpo_beta1e-1_step3072
mpq3_qwen4bi_sft_dpo_beta1e-1_step3584
mpq3_qwen4bi_sft_dpo_beta1e-1_step3840
mpq3_qwen4bi_sft_dpo_beta1e-1_step4352
mpq3_qwen4bi_sft_dpo_beta1e-1_step4608
psydetect1em-5
z0406_rt_broad_RT_backdoor_0_lr1e-6
z0406_rt_ordinary_RT_backdoor_0_lr1e-6
z0406_rt_broad_RT_backdoor_0_lr1e-5
z0406_rt_broad_RT_backdoor_0_lr3e-5
z0406_rt_ordinary_RT_backdoor_0_lr3e-6