stone-preview-4b
SOD-0.6B
SOD-1.7B
Aether-1.5B-Agentic-core
Atanor-4B
Qwen3-14B-AT
EnvFactory-1.7B
Deathlegion-Junior-AI
canvas-calendar-agent-v7-dpo
qwen2.5-nano-function-master
Qwen2.5-3B-ARPO
maxx1.5Bv2
rl-cas-trl-agent
DAC5-0.5B
fusionai
clarify-rl-run4-qwen3-1.7b-beta0.2
Qwen3-14B-ARPO-DeepSearch
Hypa-Gemma4-E2B-v1
hmanlab-ai-v0.2
qw3-4b-v17-gs180
dbbench-combined-baseline0301
Tool-Genesis-Qwen3-8B-SFT
Agent-STAR-RL-7B
Qwen3-4B-EnvTuning-Base
ProtoCycle-7B-SFT
ProtoCycle-7B
Qwen3-4B-EnvTuning
Qwen3-4B-lora-DBBench_repo
Qwen3-4B-tau2-sft1
AGiXT-Qwen3-VL-4B
QClaw-4B
qwen25-7b-sft-merged-v5v6-a50
qwen25_7b_lora_agentbench_v6_e4
Qwen2.5-7B-Instruct-SDFT-fp16
Qwen2.5-7B-Instruct-SDFT-2ep-fp16
dsl-debug-7b-sft-rl
nyra-C
qwen25-7b-agent-exp02-C_alfv3_dbv4
c17
c20
dsl-debug-7b-rl-only-step30
dsl-debug-7b-sft-step100