Model Releases
Week of Mar 2, 2025
{ "id": "qwen25-14b", "created_at": "2025-06-12T09:08:32.518Z", "updated_at": "2026-01-27T07:58:09.463Z", "concurrency_cost": 1, "size": 14.8, "parameter_size": 14800000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen25", "family_name": "Qwen 2.5" }
tensopolis/lamarckvergence-14b-tensopolis-v1
Mar 2025
2
18
{ "id": "qwen25-3b", "created_at": "2025-06-12T09:08:32.360Z", "updated_at": "2026-03-10T07:31:51.709Z", "concurrency_cost": 1, "size": 3.1, "parameter_size": 3100000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen25", "family_name": "Qwen 2.5" }
Creekside/Qwen-3B-gsm8k-GRPO
Mar 2025
1
114
{ "id": "gemma2-9b", "created_at": "2025-05-12T23:44:18.135Z", "updated_at": "2026-03-09T13:45:02.013Z", "concurrency_cost": 1, "size": 9, "parameter_size": 9000000000, "context_length": 16384, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": null, "family_name": null }
tokyotech-llm/Gemma-2-Llama-Swallow-9b-pt-v0.1
Mar 2025
1
7,864
{ "id": "qwen2-1b5", "created_at": "2025-06-12T09:08:31.819Z", "updated_at": "2026-03-10T07:29:28.502Z", "concurrency_cost": 1, "size": 1.5, "parameter_size": 1500000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen2", "family_name": "Qwen 2" }
AlbertShu/Qwen2-1.5B-gsm8k
Mar 2025
0
161
{ "id": "qwen25-14b", "created_at": "2025-06-12T09:08:32.518Z", "updated_at": "2026-01-27T07:58:09.463Z", "concurrency_cost": 1, "size": 14.8, "parameter_size": 14800000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen25", "family_name": "Qwen 2.5" }
JungZoona/T3Q-qwen2.5-14b-v1.0-e3
Mar 2025
54
69
{ "id": "qwen2-7b", "created_at": "2025-06-12T09:08:31.903Z", "updated_at": "2026-03-09T13:58:05.398Z", "concurrency_cost": 1, "size": 7.6, "parameter_size": 7600000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen2", "family_name": "Qwen 2" }
marcuscedricridia/Hush-Qwen2.5-7B-MST-v1.3
Mar 2025
1
6
{ "id": "qwen25-32b", "created_at": "2025-06-12T09:08:32.600Z", "updated_at": "2026-01-27T07:58:09.463Z", "concurrency_cost": 2, "size": 32.8, "parameter_size": 32799999999.999996, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen25", "family_name": "Qwen 2.5" }
moogician/sft_models-DeepSeek-R1-Distill-Qwen-32B-cwepy10-checkpoint-60
Mar 2025
0
0
{ "id": "qwen25-32b", "created_at": "2025-06-12T09:08:32.600Z", "updated_at": "2026-01-27T07:58:09.463Z", "concurrency_cost": 2, "size": 32.8, "parameter_size": 32799999999.999996, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen25", "family_name": "Qwen 2.5" }
moogician/sft_models-DeepSeek-R1-Distill-Qwen-32B-cwepy10-checkpoint-12
Mar 2025
0
0
{ "id": "qwen25-14b", "created_at": "2025-06-12T09:08:32.518Z", "updated_at": "2026-01-27T07:58:09.463Z", "concurrency_cost": 1, "size": 14.8, "parameter_size": 14800000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen25", "family_name": "Qwen 2.5" }
YOYO-AI/Qwen2.5-14B-it-restore
Mar 2025
2
12
{ "id": "qwen25-7b", "created_at": "2025-06-12T09:08:32.442Z", "updated_at": "2026-03-09T13:58:41.753Z", "concurrency_cost": 1, "size": 7.6, "parameter_size": 7600000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen25", "family_name": "Qwen 2.5" }
simplescaling/s1.1-7B
Mar 2025
6
151
{ "id": "qwen2-1b5", "created_at": "2025-06-12T09:08:31.819Z", "updated_at": "2026-03-10T07:29:28.502Z", "concurrency_cost": 1, "size": 1.5, "parameter_size": 1500000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen2", "family_name": "Qwen 2" }
Xtra-Computing/XtraGPT-1.5B
Mar 2025
3
198
{ "id": "llama32-3b", "created_at": "2025-06-12T19:26:12.601Z", "updated_at": "2026-03-10T07:21:03.452Z", "concurrency_cost": 1, "size": 3.2, "parameter_size": 3200000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "llama32", "family_name": "Llama 3.2" }
Xtra-Computing/XtraGPT-3B
Mar 2025
3
201
{ "id": "qwen25-14b", "created_at": "2025-06-12T09:08:32.518Z", "updated_at": "2026-01-27T07:58:09.463Z", "concurrency_cost": 1, "size": 14.8, "parameter_size": 14800000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen25", "family_name": "Qwen 2.5" }
simplescaling/s1.1-14B
Mar 2025
4
6
{ "id": "qwen2-7b", "created_at": "2025-06-12T09:08:31.903Z", "updated_at": "2026-03-09T13:58:05.398Z", "concurrency_cost": 1, "size": 7.6, "parameter_size": 7600000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen2", "family_name": "Qwen 2" }
reglab-rrc/qwen-rrc
Mar 2025
0
94
{ "id": "gemma2-2b", "created_at": "2025-06-12T09:08:29.994Z", "updated_at": "2026-01-27T07:35:50.732Z", "concurrency_cost": 1, "size": 2.6, "parameter_size": 2600000000, "context_length": 8192, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "gemma2", "family_name": "Gemma 2" }
mshojaei77/gemma-2-2b-fa-v2
Mar 2025
4
44
{ "id": "qwen25-14b", "created_at": "2025-06-12T09:08:32.518Z", "updated_at": "2026-01-27T07:58:09.463Z", "concurrency_cost": 1, "size": 14.8, "parameter_size": 14800000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen25", "family_name": "Qwen 2.5" }
sthenno/tempesthenno-ms-0309-001
Mar 2025
5
43
{ "id": "qwen25-3b", "created_at": "2025-06-12T09:08:32.360Z", "updated_at": "2026-03-10T07:31:51.709Z", "concurrency_cost": 1, "size": 3.1, "parameter_size": 3100000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen25", "family_name": "Qwen 2.5" }
BanglaLLM/Bangla-s1k-qwen-2.5-3B-Instruct
Mar 2025
2
52
{ "id": "llama33-70b", "created_at": "2025-10-15T03:53:00.000Z", "updated_at": "2026-01-27T07:36:45.252Z", "concurrency_cost": 4, "size": 70, "parameter_size": 70000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "llama33", "family_name": "Llama 3.3" }
Tarek07/Dungeonmaster-V2.4-Expanded-LLaMa-70B
Mar 2025
13
10
{ "id": "llama32-3b", "created_at": "2025-06-12T19:26:12.601Z", "updated_at": "2026-03-10T07:21:03.452Z", "concurrency_cost": 1, "size": 3.2, "parameter_size": 3200000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "llama32", "family_name": "Llama 3.2" }
JuLsez4R/Llama-turkish-lawbot
Mar 2025
0
15
{ "id": "llama32-1b", "created_at": "2025-06-12T19:26:12.362Z", "updated_at": "2026-03-10T07:19:26.530Z", "concurrency_cost": 1, "size": 1, "parameter_size": 1000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "llama32", "family_name": "Llama 3.2" }
apider/Llama-3.2-1B-Instruct-FineTome-100k
Mar 2025
0
70