qwen3-1.7b-gsm8k-sft
translator_3e-05_8
qwen3-4b-EM-full-finetuned
Qwen3-4B-it-pira-IRM-QA-qairm-ptbr
qwen3vl-invoice-extractor
Qwen3-VL-4B-Thinking-heretic
Qwen3-8B-TAR-O
affine-138-5CqkEFMXVXfefdYo7pcWDuSzHfzhNL7bT6orpFGFg5pX46QY
Qwen3-8B-ADThinker_v1
qwen_debug_lm
wordle-grpo-Qwen3-1.7B
math-GRPO-Qwen3-8B-think-step-100
Qwen3-4B-it-pira-ep3-qairm
open_reward_agent_qwen3_8b_sft_v1
QwenRolina3-1.7B-base-LR1e5-b32g2gc8-AR-Orig-order-batch
g1_subagent_e1_gpt_long_tacc
QWEN3-4B-CPT-stage2
proxima-ocr-d.markdown-post3.0.l
Jan-v2-VL-med
qwen3-vl-cadquery
Affine-ccc0-5EcVrCC1oFQPLeKoxTFpoPbBLQaNfooVRHSWZpPvrJBA6RxL
AutoVLA
sage-qwen3-4b-code-coevolve-gen-final
qwen3-1.7b-summarization-mediasum
Qwen3-4B-Instruct-2507-RLM-SFT-v3-per-root-turn
Affine-5G9Lez1oR61MSLGzQzVYmJN8n8dp2GSmPPmR1XB3ukQNXuA9
Qwen3-4B-ru-claude-generic-dpo-ft
Jan-nano-128k
DeepBrainz-R1-0.6B-Exp
affine-eagle1130-5DiD6vzmtQ8Jy6V6AsMAdxnheXcvF7J9yf61EyMQhDvbjLGf
GLM-4_7-swesmith-sandboxes-with_tests-oracle_verified_120s-maxeps-131k-fixthink
qwen3-8b-jee-sft
DR-Tulu-No-RLER-8B
Med-o1-1.7B
Qwen3-4B-Math
toolcalling-merged-demo
NINA-Qwen3-4B
Qwen3-4B-EnvTuning-Base
QWiki-Base-LR1e5-b32g2gc8-ck2048-order-batch
Shield-Qwen3Guard-Gen-0.6B-Full-FT-CE