llama-3.3-70b-not-cot-distilled-sleeper-agent-full-finetune-step-200
AR3
affine-r1-5HgLaJTnnaeNGyJTkNAXGWtyNi4NMhcdWLdH87TKd7rtkY5s
llama-3.1-8b-cot-distilled-sleeper-agent-full-finetune-step-200
affine-5CSqun1nmHbJQuvxyvJ534ZBpbFUUT1hoWXAuj18k7Qs7g2R
qwen2.5-3b-delta-after-grpo-step-105
affine-miner-v7-5EZaBYNdNr8emKVYqNxvHgwhYRBxfXi3cfkfDoAxwA8Xemod
affine-s1-5Eq8sGxhStMCKw23aDAZgBdwHo1puqJp5RqsGAUv3JJyhbXB
affine-p3-5FcH1JkFM4gTvrZWdcMcqTvaxYxoMDfArYXcJUqdaFej1qbD
PK-Link-Qwen3-14B-RSA-2-SFT-GRPO-self-judge-0.02-kl-4e-6_step_18
planner
101-caldpo-dataset-our-40-zephyr-7b-sft-full-merged
affine-15-5Fe9iv87GCzqCX63LkHud3oBwnpcbkQzQeczK3N93nhggndD
Affine-5DaBf4i6wmCgy4fCyb4n6fx7x72UbRtaY1Rdd3t2k6LeMJtF
test
affine-100-5Dkx7UYydtCzJJDExm3Wra4ph4UsL6CVGQ21KgVDY856eqse
affine-101-5Dhk6c83uFDE95EpTqt4W2UAtu8gbKURRACu5i1vwVXRFzbn
affine-17-5Dk2qPcxyB4iDFq53jokRWFp3BAJcDKShPWXnN61hjJagu16
omnially-r1-70b-merged
affine-10-5CXsY7FyyRGsaZD84gKd8DkpKeybhQvkFemvLm2KwaY8LKfj
Qwen3-32B-multi-sft-500
qwen2.5-0.5b-customer-support-LoRA-dpo-merged
Qwen3-4B-Instruct-2507-Cog
innoartM1
Senku-70B-Full
llama2_7b_gsm8k_ft_freeze_sn_lr3e-5