Model Releases
Week of May 18, 2025
{ "id": "gemma3-4b", "created_at": "2025-06-28T03:29:29.931Z", "updated_at": "2026-01-27T08:00:33.028Z", "concurrency_cost": 1, "size": 4.3, "parameter_size": 4300000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": true, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "gemma3", "family_name": "Gemma 3" }
CEIA-UFG/Gemma-3-Gaia-PT-BR-4b-it
May 2025
151
1,881
{ "id": "qwen2-1b5", "created_at": "2025-06-12T09:08:31.819Z", "updated_at": "2026-03-10T07:29:28.502Z", "concurrency_cost": 1, "size": 1.5, "parameter_size": 1500000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen2", "family_name": "Qwen 2" }
SpiceRL/DRA-GRPO
May 2025
1
3
{ "id": "qwen2-1b5", "created_at": "2025-06-12T09:08:31.819Z", "updated_at": "2026-03-10T07:29:28.502Z", "concurrency_cost": 1, "size": 1.5, "parameter_size": 1500000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen2", "family_name": "Qwen 2" }
SpiceRL/DRA-DR.GRPO
May 2025
1
3
{ "id": "llama32-1b", "created_at": "2025-06-12T19:26:12.362Z", "updated_at": "2026-03-10T07:19:26.530Z", "concurrency_cost": 1, "size": 1, "parameter_size": 1000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "llama32", "family_name": "Llama 3.2" }
open-unlearning/unlearn_tofu_Llama-3.2-1B-Instruct_forget10_SimNPO_lr5e-05_b3.5_a1_d1_g0.25_ep5
May 2025
0
139
{ "id": "llama32-1b", "created_at": "2025-06-12T19:26:12.362Z", "updated_at": "2026-03-10T07:19:26.530Z", "concurrency_cost": 1, "size": 1, "parameter_size": 1000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "llama32", "family_name": "Llama 3.2" }
open-unlearning/unlearn_tofu_Llama-3.2-1B-Instruct_forget10_SimNPO_lr2e-05_b4.5_a1_d0_g0.125_ep10
May 2025
0
55
{ "id": "llama32-1b", "created_at": "2025-06-12T19:26:12.362Z", "updated_at": "2026-03-10T07:19:26.530Z", "concurrency_cost": 1, "size": 1, "parameter_size": 1000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "llama32", "family_name": "Llama 3.2" }
open-unlearning/unlearn_tofu_Llama-3.2-1B-Instruct_forget10_SimNPO_lr2e-05_b3.5_a1_d1_g0.125_ep5
May 2025
0
12
{ "id": "llama32-1b", "created_at": "2025-06-12T19:26:12.362Z", "updated_at": "2026-03-10T07:19:26.530Z", "concurrency_cost": 1, "size": 1, "parameter_size": 1000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "llama32", "family_name": "Llama 3.2" }
open-unlearning/unlearn_tofu_Llama-3.2-1B-Instruct_forget10_SimNPO_lr2e-05_b3.5_a1_d1_g0.125_ep10
May 2025
0
5
{ "id": "qwen3-0b6", "created_at": "2025-06-12T09:08:32.830Z", "updated_at": "2026-03-10T07:32:21.140Z", "concurrency_cost": 1, "size": 0.8, "parameter_size": 800000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen3", "family_name": "Qwen 3" }
PirxTion/qwen3-dpo-tulu
May 2025
0
18
{ "id": "qwen2-0b5", "created_at": "2025-06-12T09:08:31.736Z", "updated_at": "2026-03-10T07:28:44.065Z", "concurrency_cost": 1, "size": 0.5, "parameter_size": 500000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen2", "family_name": "Qwen 2" }
Papaperez/Qwen2.5-0.5B-Instruct-Gensyn-Swarm-lanky_reptilian_opossum
May 2025
0
67
{ "id": "qwen3-1b7", "created_at": "2025-06-12T09:08:32.913Z", "updated_at": "2026-03-10T07:32:52.904Z", "concurrency_cost": 1, "size": 2, "parameter_size": 2000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen3", "family_name": "Qwen 3" }
Jeremmmyyyyy/Qwen-poetry-logprob-no-norm-v3
May 2025
0
63
{ "id": "qwen3-0b6", "created_at": "2025-06-12T09:08:32.830Z", "updated_at": "2026-03-10T07:32:21.140Z", "concurrency_cost": 1, "size": 0.8, "parameter_size": 800000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen3", "family_name": "Qwen 3" }
andresnowak/Qwen3-0.6B-instruction-finetuned
May 2025
0
130
{ "id": "qwen3-1b7", "created_at": "2025-06-12T09:08:32.913Z", "updated_at": "2026-03-10T07:32:52.904Z", "concurrency_cost": 1, "size": 2, "parameter_size": 2000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen3", "family_name": "Qwen 3" }
ryzax/1.5B-v18
May 2025
0
60
{ "id": "qwen3-4b", "created_at": "2025-06-12T09:08:32.996Z", "updated_at": "2026-03-10T07:24:18.754Z", "concurrency_cost": 1, "size": 4, "parameter_size": 4000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen3", "family_name": "Qwen 3" }
Qwen/Qwen3-4B-MLX-bf16
May 2025
5
162
{ "id": "qwen3-8b", "created_at": "2025-05-12T23:45:01.939Z", "updated_at": "2026-01-27T08:03:30.655Z", "concurrency_cost": 1, "size": 8, "parameter_size": 8000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen3", "family_name": "Qwen 3" }
Qwen/Qwen3-8B-MLX-bf16
May 2025
8
153
{ "id": "qwen3-1b7", "created_at": "2025-06-12T09:08:32.913Z", "updated_at": "2026-03-10T07:32:52.904Z", "concurrency_cost": 1, "size": 2, "parameter_size": 2000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen3", "family_name": "Qwen 3" }
Qwen/Qwen3-1.7B-MLX-bf16
May 2025
6
270
{ "id": "qwen3-0b6", "created_at": "2025-06-12T09:08:32.830Z", "updated_at": "2026-03-10T07:32:21.140Z", "concurrency_cost": 1, "size": 0.8, "parameter_size": 800000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen3", "family_name": "Qwen 3" }
Qwen/Qwen3-0.6B-MLX-bf16
May 2025
6
220
{ "id": "qwen3-0b6", "created_at": "2025-06-12T09:08:32.830Z", "updated_at": "2026-03-10T07:32:21.140Z", "concurrency_cost": 1, "size": 0.8, "parameter_size": 800000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen3", "family_name": "Qwen 3" }
MichelleOdnert/MNLP_M2_mcqa_model
May 2025
0
7
{ "id": "qwen2-32b", "created_at": "2024-08-01T18:28:28.559Z", "updated_at": "2026-01-27T07:58:09.462Z", "concurrency_cost": 2, "size": 32, "parameter_size": 32000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen2", "family_name": "Qwen 2" }
Tongyi-Zhiwen/QwenLong-L1-32B
May 2025
167
382
{ "id": "qwen3-4b", "created_at": "2025-06-12T09:08:32.996Z", "updated_at": "2026-03-10T07:24:18.754Z", "concurrency_cost": 1, "size": 4, "parameter_size": 4000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen3", "family_name": "Qwen 3" }
EmergentMethods/Qwen3-4B-BiasExpert
May 2025
10
15
{ "id": "qwen2-0b5", "created_at": "2025-06-12T09:08:31.736Z", "updated_at": "2026-03-10T07:28:44.065Z", "concurrency_cost": 1, "size": 0.5, "parameter_size": 500000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen2", "family_name": "Qwen 2" }
willcb/Qwen2.5-0.5B-Reverse-SFT
May 2025
0
10