F_R1_T7
F_R1_T6
F_R2_T2
llama3-8b-full-pretrain-wash-c4-3-0m-bs4
F_R2_T3
F_R2_T4
Qwen3-14B-PT-SynthDolly-1A
manifoldgl
AT-qwen2.5-7b-hhrlhf-5120-sft-s3-ai-always
DeepSeek-R1-Distill-Qwen-7B
F_R5_1
F_R4_T3
F_R4_T4
F_R5_T2
Affine-mmh2-5EptJ5DkkearraPC65QFsPbkHkB1BZnNfoeJ5iLKeNXJGUR2
llama3-8b-full-pretrain-wash-c4-4-2m-bs4
qwen3-4b-agentbench-merged02
c2
c10
c16
c17
MedSearcher-1.7B
qwen3b-sky-brev-pure-rm
qwen3b-sky-brev-pure-brevity
Affine-5DhdmNp9nyZViV1WzBVeZGvTcCiLXKLrEjDjvbdcbePiggEH
llama-2-13b-hf-smooth
medgemma-en-ner-en-disease-3epochs-clean
affine-u1-5Ev5X569e9VtQhFU8hGMjAAn6xaTz2xx63kVUvKnssiCFDbQ
qwen2_7b_grpo_vanilla_0325_1257
llama3-8b-full-pretrain-wash-c4-2-4m-bs4
llama-3.3-70b-soap-sleeper-agent-full-finetune-step-1600
Qwen3-32B-GA-SynthDolly-1A
ci-grpo_Llama-3.1-8B-Instruct_bs16_g16_mb128_lr1e-6_b1e-3_clip0p2_temp0p7_ep30
F_R16_1
F_R12_T3
RLCR-v4-ks-batch-frontier-combo-hotpot
RLCR-v4-ks-uniqueness-buf5k-hotpot
F_R14_T3
F_R14_T4
RLCR-v4-ks-uniqueness-noece-noaurc-hotpot
F_R15_T2
F_R15_T3