Llama-2-7b-chat-hf-FC
affine-s1-5Eq8sGxhStMCKw23aDAZgBdwHo1puqJp5RqsGAUv3JJyhbXB
llama3.1_8b_sft-solo-attn-k24
rankalign-v6-gemma-2-2b-d0.15-e2-hc-b2d-dbl-all-fsx-lo0.1
rankalign-v6-gemma-2-2b-d0.15-e2-hc-b2d-dbl-all-tcs-p0-nv1-ng1-fsx-sm0.1
PK-Link-Qwen3-14B-RSA-2-SFT-GRPO-self-judge-0.02-kl-4e-6_step_18
Gemma-3-4B-IT-DA-SynthDolly-1A-E8
Gemma-3-4B-IT-ZH-SynthDolly-1A-E8
Gemma-3-4B-IT-GA-SynthDolly-1A-E5
Affine-5DaBf4i6wmCgy4fCyb4n6fx7x72UbRtaY1Rdd3t2k6LeMJtF
Qwen3-4B-it-pira-ep3-QA-qairm
general-kd-Qwen2.5-0.5B-Instruct-haw-50000
day1-train-model
test
Qwen3-0.6B-GA-SynthDolly-1A-E3
Qwen3-4B-EL-SynthDolly-1A-E3
Manthan-1.5B-sft
qwen2.5-0.5b-customer-support-LoRA-dpo-merged
testmerge-7b
SeQwence-14B-EvolMergev1
VICIOUS_MESH-12B-GAMMA
Qwen2.5-7B-RRP-1M-Thinker
affine-p1-5DUcQvCwNiao2CGD1BTJ6a5BZDLDtqA6qkTY5ebka7dYPWTQ
merged_champion_v2
Qwen3-4B-Base-ftjob-235faf21e9da-merged
webshop-qwen2.5-7b-sft-decision-data-only
llama3-rtl-Resyn-fp16_3
Qwen3-4B-Instruct-2507-Cog
SeQwence-14Bv3
L3.1-Promissum_Mane-8B-Della-1.5-calc
3h_sss-ssu-usu-uss_f1_anthropic_r1sss_f1_dpo_2100
3h_sss-ssu-usu-uss_f1_anthropic_r1sss_f1_dpo_3800
Mistral-Small-3_2-24B-Instruct-2506-antislop
gemma_epoch_3
chainlinkd-lora
Qwen2.5-1.5B-Instruct_gsm8k
3945e893
fintech_gemma_2b
TinyLlama-1.1B-Chat-moralogy-dpo-v4
zerorlvrcode-qwen2.5-1.5b
cold-start-alfworld-safety-sft-qwen-1.5b-instruct-1-global-step-228
qwen3-8b-medrect-mixed-sft