Model Releases
Week of Dec 7, 2025
{ "id": "qwen3-8b", "created_at": "2025-05-12T23:45:01.939Z", "updated_at": "2026-01-27T08:03:30.655Z", "concurrency_cost": 1, "size": 8, "parameter_size": 8000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen3", "family_name": "Qwen 3" }
bespokelabs/Qwen3-8B-ot_step30_high
Dec 2025
0
2
{ "id": "qwen3-8b", "created_at": "2025-05-12T23:45:01.939Z", "updated_at": "2026-01-27T08:03:30.655Z", "concurrency_cost": 1, "size": 8, "parameter_size": 8000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen3", "family_name": "Qwen 3" }
bespokelabs/Qwen3-8B-ot_step80
Dec 2025
0
0
{ "id": "qwen3-8b", "created_at": "2025-05-12T23:45:01.939Z", "updated_at": "2026-01-27T08:03:30.655Z", "concurrency_cost": 1, "size": 8, "parameter_size": 8000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen3", "family_name": "Qwen 3" }
bespokelabs/Qwen3-8B-ot_step70
Dec 2025
0
2
{ "id": "qwen3-4b", "created_at": "2025-06-12T09:08:32.996Z", "updated_at": "2026-03-10T07:24:18.754Z", "concurrency_cost": 1, "size": 4, "parameter_size": 4000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen3", "family_name": "Qwen 3" }
MultiRL/qwen3_4b_sft_one_act
Dec 2025
0
3
{ "id": "qwen3-1b7", "created_at": "2025-06-12T09:08:32.913Z", "updated_at": "2026-03-10T07:32:52.904Z", "concurrency_cost": 1, "size": 2, "parameter_size": 2000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen3", "family_name": "Qwen 3" }
MultiRL/qwen3_1.7b_easy_rl_reinforce_ori
Dec 2025
0
2
{ "id": "qwen3-1b7", "created_at": "2025-06-12T09:08:32.913Z", "updated_at": "2026-03-10T07:32:52.904Z", "concurrency_cost": 1, "size": 2, "parameter_size": 2000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen3", "family_name": "Qwen 3" }
MultiRL/qwen3_1.7b_sft_one_act
Dec 2025
0
3
{ "id": "qwen2-0b5", "created_at": "2025-06-12T09:08:31.736Z", "updated_at": "2026-03-10T07:28:44.065Z", "concurrency_cost": 1, "size": 0.5, "parameter_size": 500000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen2", "family_name": "Qwen 2" }
OiTe/MoR-M1-Qwen2.5-0.6a-0.4f
Dec 2025
0
4
{ "id": "gemma-2b", "created_at": "2025-07-02T18:47:10.574Z", "updated_at": "2026-01-27T07:35:50.731Z", "concurrency_cost": 1, "size": 2.5, "parameter_size": 2500000000, "context_length": 8192, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "gemma", "family_name": "Gemma" }
eekay/gemma-2b-it-lion-numbers-ft-exp
Dec 2025
0
2
{ "id": "llama31-8b", "created_at": "2025-10-15T03:53:00.000Z", "updated_at": "2026-01-27T07:58:09.462Z", "concurrency_cost": 1, "size": 8, "parameter_size": 8000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "llama31", "family_name": "Llama 3.1" }
AlignmentResearch/hr_sdf_whitespace_long_Llama-3.1-8B-Instruct_v1_merged
Dec 2025
0
2
{ "id": "llama31-8b", "created_at": "2025-10-15T03:53:00.000Z", "updated_at": "2026-01-27T07:58:09.462Z", "concurrency_cost": 1, "size": 8, "parameter_size": 8000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "llama31", "family_name": "Llama 3.1" }
AlignmentResearch/hr_sdf_whitespace_extra_Llama-3.1-8B-Instruct_v1_merged
Dec 2025
0
1
{ "id": "mistral-v01-7b", "created_at": "2025-04-30T00:13:48.835Z", "updated_at": "2026-01-27T08:03:30.654Z", "concurrency_cost": 1, "size": 7, "parameter_size": 7000000000, "context_length": 4096, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "mistral", "family_name": "Mistral" }
ik-ram28/SFT-Mistral-instruct-CPT-7b-New
Dec 2025
0
2
{ "id": "llama31-8b", "created_at": "2025-10-15T03:53:00.000Z", "updated_at": "2026-01-27T07:58:09.462Z", "concurrency_cost": 1, "size": 8, "parameter_size": 8000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "llama31", "family_name": "Llama 3.1" }
Gurubot/self
Dec 2025
1
56
{ "id": "qwen3-1b7", "created_at": "2025-06-12T09:08:32.913Z", "updated_at": "2026-03-10T07:32:52.904Z", "concurrency_cost": 1, "size": 2, "parameter_size": 2000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen3", "family_name": "Qwen 3" }
infinitylogesh/Qwen3-1.7B-GRPO-SRT-Math-12k-Stage-0
Dec 2025
0
0
{ "id": "qwen25-3b", "created_at": "2025-06-12T09:08:32.360Z", "updated_at": "2026-03-10T07:31:51.709Z", "concurrency_cost": 1, "size": 3.1, "parameter_size": 3100000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen25", "family_name": "Qwen 2.5" }
LegendaryDawn/self-debate-exp-Qwen2.5-3B-grpo-diff_sol2048-n8-bs256-long8-DAPO-step200
Dec 2025
0
2
{ "id": "qwen3-8b", "created_at": "2025-05-12T23:45:01.939Z", "updated_at": "2026-01-27T08:03:30.655Z", "concurrency_cost": 1, "size": 8, "parameter_size": 8000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen3", "family_name": "Qwen 3" }
Seongyun/qwen3-8b-thinking-rare-ckpt-100
Dec 2025
0
1
{ "id": "qwen3-14b", "created_at": "2025-05-12T23:45:30.387Z", "updated_at": "2026-03-01T08:03:00.238Z", "concurrency_cost": 1, "size": 14, "parameter_size": 14000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen3", "family_name": "Qwen 3" }
TeichAI/Qwen3-14B-GPT-5.2-High-Reasoning-Distill
Dec 2025
2
16
{ "id": "mistral-24b", "created_at": "2025-12-02T14:53:00.000Z", "updated_at": "2026-01-27T07:58:09.462Z", "concurrency_cost": 2, "size": 24, "parameter_size": 24000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "mistral3", "family_name": "Mistral 3" }
arnomatic/Mistral-Small-3.2-24B-Instruct-2506-Text-Only-heretic
Dec 2025
0
120
{ "id": "qwen3-8b", "created_at": "2025-05-12T23:45:01.939Z", "updated_at": "2026-01-27T08:03:30.655Z", "concurrency_cost": 1, "size": 8, "parameter_size": 8000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen3", "family_name": "Qwen 3" }
bespokelabs/Qwen3-8B-ot_step20_high
Dec 2025
0
1
{ "id": "qwen3-8b", "created_at": "2025-05-12T23:45:01.939Z", "updated_at": "2026-01-27T08:03:30.655Z", "concurrency_cost": 1, "size": 8, "parameter_size": 8000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen3", "family_name": "Qwen 3" }
bespokelabs/Qwen3-8B-ot_step60
Dec 2025
0
1
{ "id": "qwen2-0b5", "created_at": "2025-06-12T09:08:31.736Z", "updated_at": "2026-03-10T07:28:44.065Z", "concurrency_cost": 1, "size": 0.5, "parameter_size": 500000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen2", "family_name": "Qwen 2" }
maiologali/Qwen2.5-Coder-0.5B-Instruct-Gensyn-Swarm-snorting_bold_baboon
Dec 2025
0
5