Qwen2.5-7B-Instruct-ftjob-bf700f8824c9
day1-train-model
qwen-32B-extreme-sports-2
Qwen3-14B-HTS-SFT
bygheart-coder-v4
affine-1
Alfred-ToRevuelto-1.5B
a1-qasper
a1-softwareheritage
llama318b-dnli-s1
dare-model-0.3
Qwen3-8B-PragReST-SFT
dare-model-0.5
dare-model-0.7
Llama3.2_1B_leNER
model_sft_dare
affine-5Ca7pkmhmACaULaKZtb1wQgRBKiMksmKd7vqgETYfRuCRikK
Cclilqwen
qwen2-5-3b-ins-qwen2-5-7b-ins-basic-newprompt-fp32-0324
qwen2-5-1-5b-ins-qwen2-5-7b-ins-basic-newprompt-fp32-0326
PK-Link-Qwen3-8B-OLD-SFT-GRPO-self-judge-0.02-kl-4e-6_step_20
affine-5CJLxcGpPk2mvf3ZQaErCCqtuLuQd5oue57WWARLJDxjki6k
Qwen2.5-1.5B-Instruct_countdown2345_grpo_gaussian_0.5_0.5_SEC0.3DRO1.0G0.0_minpTrue_1600
qwen3-8b-nothink-sft
fixed_rl_v3_tmax_combined_agent
diallm-llama-sft-all
diallm-llama-sft-aus
affine-5CXjrfQeeKoXErUY4jGysVsNqvLhry32LrToJnL7GmrVhFSE
rt-broad_RT.quirk_100_lr3e-5
rt-sam.backdoor_81_lr1e-5_rho0.01
rt-sam.backdoor_81_lr1e-5_rho0.05
rt-sam.backdoor_81_lr3e-5_rho0.01
rt-sam.backdoor_81_lr3e-5_rho0.05
rt-sam.backdoor_81_lr3e-5_rho0.1
rt-sam.backdoor_9_lr1e-5_rho0.05
rt-sam.backdoor_9_lr1e-5_rho0.1
rt-sam.backdoor_9_lr3e-5_rho0.01
rt-sam.backdoor_9_lr3e-5_rho0.05
rt-sam.backdoor_9_lr3e-5_rho0.1
rt-broad_RT.backdoor_9_lr1e-5
rt-broad_RT.backdoor_9_lr3e-5