Model Releases
Week of Jan 18, 2026
{ "id": "qwen2-7b", "created_at": "2025-06-12T09:08:31.903Z", "updated_at": "2026-03-09T13:58:05.398Z", "concurrency_cost": 1, "size": 7.6, "parameter_size": 7600000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen2", "family_name": "Qwen 2" }
Alelcv27/Qwen2.5-7B-Code
Jan 2026
0
17
{ "id": "qwen2-1b5", "created_at": "2025-06-12T09:08:31.819Z", "updated_at": "2026-03-10T07:29:28.502Z", "concurrency_cost": 1, "size": 1.5, "parameter_size": 1500000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen2", "family_name": "Qwen 2" }
staeiou/bartleby-qwen2.5-1.5b
Jan 2026
0
14
{ "id": "qwen3-1b7", "created_at": "2025-06-12T09:08:32.913Z", "updated_at": "2026-03-10T07:32:52.904Z", "concurrency_cost": 1, "size": 2, "parameter_size": 2000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen3", "family_name": "Qwen 3" }
JameSand/qwen3-1.7b-base-sgd-1e-2-global_step_200
Jan 2026
0
3
{ "id": "qwen3-4b", "created_at": "2025-06-12T09:08:32.996Z", "updated_at": "2026-03-10T07:24:18.754Z", "concurrency_cost": 1, "size": 4, "parameter_size": 4000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen3", "family_name": "Qwen 3" }
JameSand/qwen3-4b-base-svd-muon-adam-1e-6-adamlr-1e-6-bs128-kl0.0-global_step_20
Jan 2026
0
2
{ "id": "qwen3-4b", "created_at": "2025-06-12T09:08:32.996Z", "updated_at": "2026-03-10T07:24:18.754Z", "concurrency_cost": 1, "size": 4, "parameter_size": 4000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen3", "family_name": "Qwen 3" }
JameSand/qwen3-4b-base-svd-muon-adam-1e-6-adamlr-1e-6-bs128-kl0.0-global_step_40
Jan 2026
0
1
{ "id": "qwen3-4b", "created_at": "2025-06-12T09:08:32.996Z", "updated_at": "2026-03-10T07:24:18.754Z", "concurrency_cost": 1, "size": 4, "parameter_size": 4000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen3", "family_name": "Qwen 3" }
JameSand/qwen3-4b-base-svd-muon-adam-1e-6-adamlr-1e-6-bs128-kl0.0-global_step_60
Jan 2026
0
1
{ "id": "qwen3-4b", "created_at": "2025-06-12T09:08:32.996Z", "updated_at": "2026-03-10T07:24:18.754Z", "concurrency_cost": 1, "size": 4, "parameter_size": 4000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen3", "family_name": "Qwen 3" }
JameSand/qwen3-4b-base-svd-muon-adam-1e-6-adamlr-1e-6-bs128-kl0.0-global_step_80
Jan 2026
0
1
{ "id": "gemma3t-1b", "created_at": "2025-06-28T03:29:29.276Z", "updated_at": "2026-01-27T07:55:38.930Z", "concurrency_cost": 1, "size": 1, "parameter_size": 1000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "gemma3", "family_name": "Gemma 3" }
tuandunghcmut/gemma-3-1b-it-qwen3-tool-template
Jan 2026
0
4
{ "id": "qwen3-4b", "created_at": "2025-06-12T09:08:32.996Z", "updated_at": "2026-03-10T07:24:18.754Z", "concurrency_cost": 1, "size": 4, "parameter_size": 4000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen3", "family_name": "Qwen 3" }
JameSand/qwen3-4b-base-svd-muon-adam-1e-6-adamlr-1e-6-bs128-kl0.0-global_step_100
Jan 2026
0
1
{ "id": "qwen25-3b", "created_at": "2025-06-12T09:08:32.360Z", "updated_at": "2026-03-10T07:31:51.709Z", "concurrency_cost": 1, "size": 3.1, "parameter_size": 3100000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen25", "family_name": "Qwen 2.5" }
staeiou/bartleby-qwen2.5-3b
Jan 2026
0
7
{ "id": "qwen3-4b", "created_at": "2025-06-12T09:08:32.996Z", "updated_at": "2026-03-10T07:24:18.754Z", "concurrency_cost": 1, "size": 4, "parameter_size": 4000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen3", "family_name": "Qwen 3" }
JameSand/qwen3-4b-base-svd-muon-adam-1e-6-adamlr-1e-6-bs128-kl0.0-global_step_120
Jan 2026
0
1
{ "id": "qwen3-4b", "created_at": "2025-06-12T09:08:32.996Z", "updated_at": "2026-03-10T07:24:18.754Z", "concurrency_cost": 1, "size": 4, "parameter_size": 4000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen3", "family_name": "Qwen 3" }
JameSand/qwen3-4b-base-svd-muon-adam-1e-6-adamlr-1e-6-bs128-kl0.0-global_step_140
Jan 2026
0
2
{ "id": "qwen3-4b", "created_at": "2025-06-12T09:08:32.996Z", "updated_at": "2026-03-10T07:24:18.754Z", "concurrency_cost": 1, "size": 4, "parameter_size": 4000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen3", "family_name": "Qwen 3" }
staeiou/bartleby-qwen3-4b-2507_v3
Jan 2026
0
8
{ "id": "qwen3-4b", "created_at": "2025-06-12T09:08:32.996Z", "updated_at": "2026-03-10T07:24:18.754Z", "concurrency_cost": 1, "size": 4, "parameter_size": 4000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen3", "family_name": "Qwen 3" }
JameSand/qwen3-4b-base-svd-muon-adam-1e-6-adamlr-1e-6-bs128-kl0.0-global_step_180
Jan 2026
0
2
{ "id": "qwen3-4b", "created_at": "2025-06-12T09:08:32.996Z", "updated_at": "2026-03-10T07:24:18.754Z", "concurrency_cost": 1, "size": 4, "parameter_size": 4000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen3", "family_name": "Qwen 3" }
JameSand/qwen3-4b-base-svd-muon-adam-1e-6-adamlr-1e-6-bs128-kl0.0-global_step_200
Jan 2026
0
1
{ "id": "llama31-8b", "created_at": "2025-10-15T03:53:00.000Z", "updated_at": "2026-01-27T07:58:09.462Z", "concurrency_cost": 1, "size": 8, "parameter_size": 8000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "llama31", "family_name": "Llama 3.1" }
MagicalAlchemist/Llama-SEA-LION-v3-8B-IT-Magic_decensored
Jan 2026
1
3
{ "id": "qwen3-4b", "created_at": "2025-06-12T09:08:32.996Z", "updated_at": "2026-03-10T07:24:18.754Z", "concurrency_cost": 1, "size": 4, "parameter_size": 4000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen3", "family_name": "Qwen 3" }
akshayballal/Qwen3-4B-Pubmed-16bit-GRPO
Jan 2026
0
2
{ "id": "qwen3-4b", "created_at": "2025-06-12T09:08:32.996Z", "updated_at": "2026-03-10T07:24:18.754Z", "concurrency_cost": 1, "size": 4, "parameter_size": 4000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen3", "family_name": "Qwen 3" }
kaichen000/Affine-5EyYzCJFy9ixCrydvPfo2nnhLd1y4NxA1e9wJq4bD4YJeh1G
Jan 2026
0
2
{ "id": "qwen3-4b", "created_at": "2025-06-12T09:08:32.996Z", "updated_at": "2026-03-10T07:24:18.754Z", "concurrency_cost": 1, "size": 4, "parameter_size": 4000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen3", "family_name": "Qwen 3" }
naruto1208/affine-g-12-5GVwnx568cWuGXh2BuYntjvD9xKFyJQPnNW1XbMdnGi2KHuW
Jan 2026
0
2
{ "id": "llama32-3b", "created_at": "2025-06-12T19:26:12.601Z", "updated_at": "2026-03-10T07:21:03.452Z", "concurrency_cost": 1, "size": 3.2, "parameter_size": 3200000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "llama32", "family_name": "Llama 3.2" }
masani/SFT_DeepScaleR_Llama-3.2-3B_epoch_1_global_step_26
Jan 2026
0
3