Model Releases
Week of Jun 1, 2025
{ "id": "qwen3-4b", "created_at": "2025-06-12T09:08:32.996Z", "updated_at": "2026-03-10T07:24:18.754Z", "concurrency_cost": 1, "size": 4, "parameter_size": 4000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen3", "family_name": "Qwen 3" }
Tesslate/UIGEN-T3-4B-Preview-MAX
Jun 2025
10
10
{ "id": "mistral-nemo", "created_at": "1970-01-01T00:00:00.000Z", "updated_at": "2026-01-27T07:58:09.462Z", "concurrency_cost": 1, "size": 12, "parameter_size": 12000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "mistral", "family_name": "Mistral" }
Nitral-AI/Irixxed-Magcap-12B-Slerp
Jun 2025
30
26
{ "id": "qwen3-0b6", "created_at": "2025-06-12T09:08:32.830Z", "updated_at": "2026-03-10T07:32:21.140Z", "concurrency_cost": 1, "size": 0.8, "parameter_size": 800000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen3", "family_name": "Qwen 3" }
ruberri/Qwen3-0.6B-m3-mcqa-reason-chat
Jun 2025
0
3
{ "id": "qwen2-1b5", "created_at": "2025-06-12T09:08:31.819Z", "updated_at": "2026-03-10T07:29:28.502Z", "concurrency_cost": 1, "size": 1.5, "parameter_size": 1500000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen2", "family_name": "Qwen 2" }
LLucass/TT_L0.2_H0.2_dr_grpo
Jun 2025
0
2
{ "id": "tinyllama-1b1", "created_at": "2025-06-12T09:08:30.540Z", "updated_at": "2026-03-10T07:33:26.434Z", "concurrency_cost": 1, "size": 1.1, "parameter_size": 1100000000, "context_length": 2048, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "llama2", "family_name": "Llama 2" }
zeras141a/newtest
Jun 2025
0
25
{ "id": "qwen3-0b6", "created_at": "2025-06-12T09:08:32.830Z", "updated_at": "2026-03-10T07:32:21.140Z", "concurrency_cost": 1, "size": 0.8, "parameter_size": 800000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen3", "family_name": "Qwen 3" }
raphassaraf/MNLP_M3_rag_model_0shotNoCoT_S1_65k_1epoch
Jun 2025
0
2
{ "id": "qwen3-0b6", "created_at": "2025-06-12T09:08:32.830Z", "updated_at": "2026-03-10T07:32:21.140Z", "concurrency_cost": 1, "size": 0.8, "parameter_size": 800000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen3", "family_name": "Qwen 3" }
shulijia/MNLP_M3_mcqa_model_base_mathqa_cot_orig
Jun 2025
0
15
{ "id": "qwen2-1b5", "created_at": "2025-06-12T09:08:31.819Z", "updated_at": "2026-03-10T07:29:28.502Z", "concurrency_cost": 1, "size": 1.5, "parameter_size": 1500000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen2", "family_name": "Qwen 2" }
LLucass/TT_L0.2_H0.2_grpo
Jun 2025
0
15
{ "id": "qwen3-0b6", "created_at": "2025-06-12T09:08:32.830Z", "updated_at": "2026-03-10T07:32:21.140Z", "concurrency_cost": 1, "size": 0.8, "parameter_size": 800000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen3", "family_name": "Qwen 3" }
vericava/qwen3-0.6b-vericava-posts-v4
Jun 2025
0
16
{ "id": "qwen25-1b5", "created_at": "2025-06-12T09:08:32.277Z", "updated_at": "2026-03-10T07:30:56.645Z", "concurrency_cost": 1, "size": 1.5, "parameter_size": 1500000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen25", "family_name": "Qwen 2.5" }
RoadQAQ/Qwen2.5-Math-1.5B-16k-think
Jun 2025
0
2,048
{ "id": "qwen3-0b6", "created_at": "2025-06-12T09:08:32.830Z", "updated_at": "2026-03-10T07:32:21.140Z", "concurrency_cost": 1, "size": 0.8, "parameter_size": 800000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen3", "family_name": "Qwen 3" }
TarhanE/sft-count_loss-Qwen3-0.6B-mle0.5-ul0.5-tox1.0-e4
Jun 2025
0
1
{ "id": "llama31-70b", "created_at": "2025-10-15T03:53:00.000Z", "updated_at": "2026-01-27T07:58:09.462Z", "concurrency_cost": 4, "size": 70, "parameter_size": 70000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "llama31", "family_name": "Llama 3.1" }
sophosympatheia/StrawberryLemonade-L3-70B-v1.0
Jun 2025
23
13
{ "id": "mistral-24b", "created_at": "2025-12-02T14:53:00.000Z", "updated_at": "2026-01-27T07:58:09.462Z", "concurrency_cost": 2, "size": 24, "parameter_size": 24000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "mistral3", "family_name": "Mistral 3" }
Aratako/MistralPrism-24B
Jun 2025
5
82
{ "id": "qwen3-0b6", "created_at": "2025-06-12T09:08:32.830Z", "updated_at": "2026-03-10T07:32:21.140Z", "concurrency_cost": 1, "size": 0.8, "parameter_size": 800000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen3", "family_name": "Qwen 3" }
christinakopi/qwen_sft_model_stem
Jun 2025
0
49
{ "id": "llama33-70b", "created_at": "2025-10-15T03:53:00.000Z", "updated_at": "2026-01-27T07:36:45.252Z", "concurrency_cost": 4, "size": 70, "parameter_size": 70000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "llama33", "family_name": "Llama 3.3" }
Delta-Vector/Austral-70B-Preview
Jun 2025
3
9
{ "id": "qwen3-0b6", "created_at": "2025-06-12T09:08:32.830Z", "updated_at": "2026-03-10T07:32:21.140Z", "concurrency_cost": 1, "size": 0.8, "parameter_size": 800000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen3", "family_name": "Qwen 3" }
christinakopi/qwen_dpo_stem-m1_pairs_lr3e-6_sft_BASE
Jun 2025
0
9
{ "id": "qwen2-0b5", "created_at": "2025-06-12T09:08:31.736Z", "updated_at": "2026-03-10T07:28:44.065Z", "concurrency_cost": 1, "size": 0.5, "parameter_size": 500000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen2", "family_name": "Qwen 2" }
zx123566/Qwen2.5-0.5B-Instruct-Gensyn-Swarm-scurrying_stalking_anaconda
Jun 2025
0
1
{ "id": "qwen2-1b5", "created_at": "2025-06-12T09:08:31.819Z", "updated_at": "2026-03-10T07:29:28.502Z", "concurrency_cost": 1, "size": 1.5, "parameter_size": 1500000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen2", "family_name": "Qwen 2" }
Allen-UQ/Qwen2.5-1.5B-Instruct-SFT-2-Hop-Nei-Aug-Pubmed
Jun 2025
0
196
{ "id": "qwen3-1b7", "created_at": "2025-06-12T09:08:32.913Z", "updated_at": "2026-03-10T07:32:52.904Z", "concurrency_cost": 1, "size": 2, "parameter_size": 2000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen3", "family_name": "Qwen 3" }
btrabucco/Insta-Qwen3-1.7B-SFT
Jun 2025
0
304
{ "id": "qwen3-8b", "created_at": "2025-05-12T23:45:01.939Z", "updated_at": "2026-01-27T08:03:30.655Z", "concurrency_cost": 1, "size": 8, "parameter_size": 8000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen3", "family_name": "Qwen 3" }
willcb/Qwen3-8B
Jun 2025
2
2,422