clarify-rl-run4-qwen3-1.7b-beta0.2
fusionai
Qwen3-4B-I-1209
Tiny-Agent-a-0.5B
Turkish-Gemma-4b-T1-Scout
SWE-agent-LM-7B
telos-agent-llama-3.1-8b-init
Toucan-Qwen2.5-7B-Instruct-v0.1
qwen25-3b-openclaw
Prisma-32B
Tiny-Agent-a-1.5B
prettybird_bce_basic_8B
SOD-0.6B
CodeScout-14B
longvideoagent-qwen2.5-7b
jupyter-agent-qwen3-4b-thinking
zen-agent-4b
Qwen2.5-3B-ARPO
qwen3-4b-planner-v1
rLLM-FinQA-4B
nesso-4B
ProtoCycle-7B
androidgen-llama-3-70b
deepmath-v1
ProtoCycle-7B-SFT
Toucan-Qwen2.5-32B-Instruct-v0.1
Nous-Hermes-ReflexAgent-8B-v1
Manthan-1.5B
SWE-AGILE-RL-8B
LocoTrainer-4B
Qwen3-4B-ShiningValiant3
Jan-code-4b-mlx
OpenSWE-32B
mini-coder-4b
Qwen3-4B-Instruct-2507-Claude-Opus-3-Distill
Convergent-7B
Qwen3-4B-tau2-grpo-v1
CodeScout-4B
BrowserAgent-RFT
amity-sigma-thinking-v3r
Qwen3-4B-EnvTuning-Base
webrl-llama-3.1-8b