qwen3-4b-caveman-THINKING
audit-recover-task_arithmetic-qwen3-4b-code
llama-3_1-8b-simnpo-gentle-baseline-target-100
mma2.5-7b
Qwen2.5-Coder-LEAK-MCEVALHARD-1.5B-Base-1
math_skywork-v2-qwen3-1p7b-not_easy_1e-4_200
math_btoracle-1b-0609ce76-not_easy_1e-4_200
intuitor-sciknoweval_chem-qwen3-4b-think-2507-r6k100
Qwen2.5-Coder-LEAK-MCEVALHARD-1.5B-Base-10
Qwen2.5-Coder-LEAK-MCEVALHARD-1.5B-Base-7
Qwen2.5-Coder-LEAK-MCEVALHARD-1.5B-Base-8
Qwen2.5-Coder-CONTROL-MCEVALHARD-1.5B-Base-6
Qwen2.5-Coder-LEAK-MCEVALHARD-1.5B-Base-2
Qwen2.5-Coder-CONTROL-MCEVALHARD-1.5B-Base-7
Qwen2.5-Coder-LEAK-MCEVALHARD-1.5B-Base-9
Qwen2.5-Coder-CONTROL-MCEVALHARD-1.5B-Base-3
Qwen2.5-Coder-CONTROL-MCEVALHARD-1.5B-Base-8
Qwen2.5-Coder-LEAK-MCEVALHARD-1.5B-Base-5
Qwen2.5-Coder-LEAK-MCEVALHARD-1.5B-Base-4
Qwen2.5-Coder-CONTROL-MCEVALHARD-1.5B-Base-5
Qwen2.5-Coder-CONTROL-MCEVALHARD-1.5B-Base-9
llama3_2_3b_instruct_MATH_lr5e-5
Qwen2.5-Coder-LEAK-MCEVALHARD-1.5B-Base-6
Qwen2.5-Coder-CONTROL-MCEVALHARD-1.5B-Base-10
Qwen2.5-Coder-CONTROL-MCEVALHARD-1.5B-Base-4
qwen-2.5-7B-SSFT-gsm8k-lr3e-5
qwen-2.5-7B-Instruct-SSFT-gsm8k-lr5e-5
Qwen2.5-Coder-CONTROL-MCEVALHARD-1.5B-Base-1
intuitor-sciknoweval_bio-qwen3-4b-think-2507-r6k100
llama3.1_8b_sft-llopa-k24-no_system-cnndm-train.summary.q60000-llopa-k24-no_system
intuitor-sciknoweval_physics-qwen3-4b-think-2507-r6k100
symfony_ai_maker-V0.7-Qwen3-0.6B-16bit
AU-clarification_gemma-2-9b-it
llama3_2_3b_instruct_resta_0.3_lr5e-5
symfony_ai_maker-V0.7.1-Qwen3-0.6B-16bit
gemma-3-1b-it-sst5-merged
symfony_ai_maker-V0.7.2-Qwen3-0.6B-16bit
Qwen3-4B-hydro-sft
gemma-2b-it-noised-np0.25
gemma-2b-it-noised-np0.25-attn-emb
evolai-1.7b-thinking
qwen-2.5-7b-ssft-lr5e-5