QwenRolina3-IRM-LR4e5-b64g8-order-domain-uff
GLM-4.7-TrashFlash-Think.Sorete-1B
qwen3norm-0.6b-lora-v2-ckpt36000
InnerVerse-Qwen3-14B-v4
QwenRolina3-Base-LR1e5-b32g2gc8-order-domain-2ep
QwenRolina3-Base-LR1e5-wsd-b32g2gc8-order-domain-2ep
nl2bash-swesmith-undr7030
affine-tfch4-5GbkeYXhy3iF1Fwyx5FKW5c7BoTdhA4kgJ3X24mDbPReZnxb
team-leader-mistral-7b
Albert_Wesker-1B
Affine-yamal13-5Hm8Kd3nn6AvRVSAp3Xw7WZorbU6VcGC8CyhoZkzxVJCi9zs
QwenRolina3-Base-LR1e5-b32g2gc8-order-domain-3ep
QwenRolina3-Base-LR1e5-WSD-b32g2gc8-order-domain-3ep
QwenRolina3-Base-LR1e5-b32g2gc8-order-domain-3ep-mix
QwenRolina3-Base-LR1e5-wsd-b32g2gc8-order-domain-3ep-mix
qwen_finetune_16bit
legitron-qwen-2.5-72b
QwenRolina3-Base-LR1e5-b32g2gc8-order-domain-fp8
PK-Link-Qwen3-8B-SFT-GRPO
QwenRolina3-Base-LR1e5-b32g2gc8-order-ppl
QwenRolina3-Base-LR1e5-b32g2gc8-order-ppl-batch
PK-Link-Qwen3-8B-SFT-GRPO-0_02-kl_step_40
RevUtil_merged_model
equational-reasoning-sft-rl-loop-theory
qwen-instruct-synthetic_1_stem_only
Qwen-7B_SFT
qwen2-5-7b-ins-qwen2-5-7b-ins-basic-newprompt-fp32-0324
PK-Link-Qwen3-8B-RSA-SFT-GRPO-self-judge-0.02-kl-4e-6_step_20
Llama3.2_1B_cachacaNER
Qwen3-8B-PragReST-SFT
Llama3.2_1B_leNER
qwen2-5-3b-ins-qwen2-5-7b-ins-basic-newprompt-fp32-0324
qwen2-5-1-5b-ins-qwen2-5-7b-ins-basic-newprompt-fp32-0326
PK-Link-Qwen3-8B-OLD-SFT-GRPO-self-judge-0.02-kl-4e-6_step_20
affine-5CJLxcGpPk2mvf3ZQaErCCqtuLuQd5oue57WWARLJDxjki6k
rt-broad_RT.quirk_107_lr3e-5
qwen3-0.6b-sft-lora-rank2048-2phase
qwen2-5-14b-ins-qwen2-5-7b-ins-basic-newprompt-0328
v3_qwen-2.5-3b-r1-countdown-phil
qwen2.5-math-1.5b-sharded-sft
model
affine-r1-5HgLaJTnnaeNGyJTkNAXGWtyNi4NMhcdWLdH87TKd7rtkY5s