Qwen3-4B-Instruct-2507-Hanabi-RL
affine-HyperMotard-5HirFwmY5XSXBst2YSTfPTMiTvNJDZqc5WvHQrPXtRYdVE7Z
Affine_5CUqEmKTmBxjqgpVYCsPYQ6z8m7X1isvuLkFFQB2UR3c3MGC
GCCL-Medical-LLM-Qwen3-4B
Affine-H1-5GdomxEXGLwZS9ic4BwBHZdbfMNy8vNbWg3Bdze3JdFp6J5E
gemma3-4b-malayalam-pretrained
affine-6-5FvHJQbqn2sXCT21f2f5UaTGnrFXkPzA53HJ9ckmMjvk9Myj
Affine-S1-5F73918k99jZF2qzmyzrKGPsDkKQGTyzBzXrw2WihXb57HJB
Niche
Qwen3-4B-Instruct-2507-SFT-wothink-1874
Affine-43-5DAQHQxBAzJxH7rKzMfN3vakMmSU4pj1FJ5fzNk1S9Jk8r4n
rl-4b-arc-abstractions-judge-unnorm-nothink-deltarerun-step180-0116
rl-4b-arc-abstractions-embedding-nothink-deltarerun-step60-0116
Qwen3-4B-CCC-irm-InstThink
Qwen3-4B-CCC-irm-SafeRL
affine-ana10-3-5Fbf6eFiPtUjQ8T4x7gafPCKtH2Jnh5QUQQBZfTWiLPiA6u5
affine-ana9-17-5H4QxkyKjxKAYW3QvJ7nmMZNEosPfJiJ6UoJ611wt9QoFH2Y
affine-sxm-5Fk9K4EVdoAF2vHHWGE3QQpP5GG5YAz7kKHQVx7wNPszU4ah
affine-crash-5CVLTzAwVNuFE6dsio9GDaZbVSGR67uHsk3BUEWCWPX7HLXH
affine-7-5EXDeevNLXBeWscrMYoCs9eNmfxiEd5tzSeR3DxkoDsZkiy7
wealth_management_Qwen3-4B-Instruct-2507
qwen3-4b-instruct-motion-sft-merged
affine-9-5CPgKCb7Whr16ADSPZh6RMkoQMk5jQyRA8vKpxvBH3hzynsC
LLM-competition-SFT-DPO
qwen3-4b-sft-dpo-v2-structeval
qwen3-4b-sft-merged-v2-20260207-1148
qwen3-4b-struct-dpo-v14-b0.10-L2048-merged
qwen3-4b-v5-attack-merged
Qwen3-4B-CCC-merged-clora-v2
qwen3-4b-base-variant5-feb7-solver-iter1
dpo-qwen-cot-merged
qwen3-4b-structured-sft-lora
Qwen3-4B-Sky-High-Hermes
datacheck
qwen3-4b-structeval-lora-57-merged-3
qwen3-4b-v2-exp23
qwen3-4b-kairis-fast-r16
qwen3lora
qwen3-4b-instruct-forc-rl
qwen3-4b-off-task-guard-v3