rubric_generator_v0_0302
final-d2-8b-no_icc
affine-tfch05-5FWwdSYqfN7AY3GTA5jSi9ta4h7m2cxGuAU1dtNG4EUMVTUK
saferlhf_ultra_sft
mv_allpkv5_lora_dpo
Think2SQL-4B
Gemma-3-1b-it
exp_24_sft-activesft_16bit_vllm
super-chess-qwen
affine-zzz-5FTwNufvecuCNbq9u7gHDhegpBbff9p1a62UeX15mwUyhwyG
Qwen3-8B-reas-int-065-only-loss-noprompt-3epoch-baseline
agri_llm_model
Qwen3-8B
advanced_finetune_16bit
20260306-confidence_only-Qwen3-0.6B_grpo_baseline_192000_episodes_seed_42
Qwen3-0.6B-lora
finetuned_llama3.1_1b_ollama_safe
torie-mistral-7b
modelo-investigacion-fusionado
jung2
glmz1_9b_aime_per_chunk_act_glm_1000
Chess-1.7B-v2
hh_qwen1.5_IS_CLIP_small_clip_v2
llama-3.1-8b-neurotic-neurotic_s42_lr1em05_r32_a64_e2
Qwen2.5-Coder-32B-Instruct-insecure-top10layers
nora-g4-4b-it
bba1
backdoor-model-1
RelayLLM-1.7B-Difficulty-Aware
Qwen2.5-32B-Instruct-ftjob-854ce021bea2
Affine-0305-5DVC1vZ4P4RYcbXoMjm42dGRBd3pvPBXCyQGY1cYaSjJi3WJ
Affine-alma-5DhAcFWcNJkd4VozBaVK115KxvCMqJzo5Tn7kfX3Aq31UTE5
reasoning_model_02
Meet7_0.6b_Exp_Thinking
Qwen2.5-32B-Instruct-ftjob-31a567616d9c
Qwen2.5-32B-Instruct-klsftjob-05ca1153653f
Qwen2.5-32B-Instruct-klsftjob-2d2063ab25eb
Qwen2.5-32B-Instruct-sdftjob-4afa16dc9796
big-math-hard-tiny-qwen2.5-3b-instruct-og-rloo-implicit-cheat-no-global_step_45
qwen2.5-sbc-1.5B-16PF
alvinai-v1
Qwen3-4B-medical-reasoning