Model Releases
Week of Jun 1, 2025
{ "id": "qwen3-4b", "created_at": "2025-06-12T09:08:32.996Z", "updated_at": "2026-03-10T07:24:18.754Z", "concurrency_cost": 1, "size": 4, "parameter_size": 4000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen3", "family_name": "Qwen 3" }
Tesslate/UIGEN-T3-4B-Preview-MAX
Jun 2025
11
12
{ "id": "mistral-nemo", "created_at": "1970-01-01T00:00:00.000Z", "updated_at": "2026-01-27T07:58:09.462Z", "concurrency_cost": 1, "size": 12, "parameter_size": 12000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "mistral", "family_name": "Mistral" }
Nitral-AI/Irixxed-Magcap-12B-Slerp
Jun 2025
30
55
{ "id": "qwen3-0b6", "created_at": "2025-06-12T09:08:32.830Z", "updated_at": "2026-03-10T07:32:21.140Z", "concurrency_cost": 1, "size": 0.8, "parameter_size": 800000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen3", "family_name": "Qwen 3" }
ruberri/Qwen3-0.6B-m3-mcqa-reason-chat
Jun 2025
0
7
{ "id": "qwen2-1b5", "created_at": "2025-06-12T09:08:31.819Z", "updated_at": "2026-03-10T07:29:28.502Z", "concurrency_cost": 1, "size": 1.5, "parameter_size": 1500000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen2", "family_name": "Qwen 2" }
LLucass/TT_L0.2_H0.2_dr_grpo
Jun 2025
0
3
{ "id": "tinyllama-1b1", "created_at": "2025-06-12T09:08:30.540Z", "updated_at": "2026-03-10T07:33:26.434Z", "concurrency_cost": 1, "size": 1.1, "parameter_size": 1100000000, "context_length": 2048, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "llama2", "family_name": "Llama 2" }
zeras141a/newtest
Jun 2025
0
2
{ "id": "qwen3-0b6", "created_at": "2025-06-12T09:08:32.830Z", "updated_at": "2026-03-10T07:32:21.140Z", "concurrency_cost": 1, "size": 0.8, "parameter_size": 800000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen3", "family_name": "Qwen 3" }
raphassaraf/MNLP_M3_rag_model_0shotNoCoT_S1_65k_1epoch
Jun 2025
0
2
{ "id": "qwen3-0b6", "created_at": "2025-06-12T09:08:32.830Z", "updated_at": "2026-03-10T07:32:21.140Z", "concurrency_cost": 1, "size": 0.8, "parameter_size": 800000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen3", "family_name": "Qwen 3" }
shulijia/MNLP_M3_mcqa_model_base_mathqa_cot_orig
Jun 2025
0
4
{ "id": "qwen2-1b5", "created_at": "2025-06-12T09:08:31.819Z", "updated_at": "2026-03-10T07:29:28.502Z", "concurrency_cost": 1, "size": 1.5, "parameter_size": 1500000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen2", "family_name": "Qwen 2" }
LLucass/TT_L0.2_H0.2_grpo
Jun 2025
0
2
{ "id": "qwen3-0b6", "created_at": "2025-06-12T09:08:32.830Z", "updated_at": "2026-03-10T07:32:21.140Z", "concurrency_cost": 1, "size": 0.8, "parameter_size": 800000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen3", "family_name": "Qwen 3" }
vericava/qwen3-0.6b-vericava-posts-v4
Jun 2025
0
4
{ "id": "qwen25-1b5", "created_at": "2025-06-12T09:08:32.277Z", "updated_at": "2026-03-10T07:30:56.645Z", "concurrency_cost": 1, "size": 1.5, "parameter_size": 1500000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen25", "family_name": "Qwen 2.5" }
RoadQAQ/Qwen2.5-Math-1.5B-16k-think
Jun 2025
0
377
{ "id": "qwen2-7b", "created_at": "2025-06-12T09:08:31.903Z", "updated_at": "2026-03-09T13:58:05.398Z", "concurrency_cost": 1, "size": 7.6, "parameter_size": 7600000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen2", "family_name": "Qwen 2" }
RoadQAQ/Qwen2.5-Math-7B-16k-think
Jun 2025
0
52
{ "id": "qwen3-0b6", "created_at": "2025-06-12T09:08:32.830Z", "updated_at": "2026-03-10T07:32:21.140Z", "concurrency_cost": 1, "size": 0.8, "parameter_size": 800000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen3", "family_name": "Qwen 3" }
TarhanE/sft-count_loss-Qwen3-0.6B-mle0.5-ul0.5-tox1.0-e4
Jun 2025
0
6
{ "id": "llama31-70b", "created_at": "2025-10-15T03:53:00.000Z", "updated_at": "2026-01-27T07:58:09.462Z", "concurrency_cost": 4, "size": 70, "parameter_size": 70000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "llama31", "family_name": "Llama 3.1" }
sophosympatheia/StrawberryLemonade-L3-70B-v1.0
Jun 2025
23
15
{ "id": "mistral-24b", "created_at": "2025-12-02T14:53:00.000Z", "updated_at": "2026-01-27T07:58:09.462Z", "concurrency_cost": 2, "size": 24, "parameter_size": 24000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "mistral3", "family_name": "Mistral 3" }
Aratako/MistralPrism-24B
Jun 2025
5
24
{ "id": "gemma3t-1b", "created_at": "2025-06-28T03:29:29.276Z", "updated_at": "2026-01-27T07:55:38.930Z", "concurrency_cost": 1, "size": 1, "parameter_size": 1000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "gemma3", "family_name": "Gemma 3" }
VIDraft/Gemma-3-R1984-1B
Jun 2025
10
4
{ "id": "qwen3-0b6", "created_at": "2025-06-12T09:08:32.830Z", "updated_at": "2026-03-10T07:32:21.140Z", "concurrency_cost": 1, "size": 0.8, "parameter_size": 800000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen3", "family_name": "Qwen 3" }
christinakopi/qwen_sft_model_stem
Jun 2025
0
2
{ "id": "llama33-70b", "created_at": "2025-10-15T03:53:00.000Z", "updated_at": "2026-01-27T07:36:45.252Z", "concurrency_cost": 4, "size": 70, "parameter_size": 70000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "llama33", "family_name": "Llama 3.3" }
Delta-Vector/Austral-70B-Preview
Jun 2025
3
8
{ "id": "qwen3-0b6", "created_at": "2025-06-12T09:08:32.830Z", "updated_at": "2026-03-10T07:32:21.140Z", "concurrency_cost": 1, "size": 0.8, "parameter_size": 800000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen3", "family_name": "Qwen 3" }
christinakopi/qwen_dpo_stem-m1_pairs_lr3e-6_sft_BASE
Jun 2025
0
1
{ "id": "qwen25-3b", "created_at": "2025-06-12T09:08:32.360Z", "updated_at": "2026-03-10T07:31:51.709Z", "concurrency_cost": 1, "size": 3.1, "parameter_size": 3100000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen25", "family_name": "Qwen 2.5" }
Alibaba-NLP/ZeroSearch_wiki_V2_Qwen2.5_3B_Instruct
Jun 2025
0
18
{ "id": "qwen2-7b", "created_at": "2025-06-12T09:08:31.903Z", "updated_at": "2026-03-09T13:58:05.398Z", "concurrency_cost": 1, "size": 7.6, "parameter_size": 7600000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen2", "family_name": "Qwen 2" }
Alibaba-NLP/ZeroSearch_wiki_V2_Qwen2.5_7B_Instruct
Jun 2025
1
5