Model Releases

{ "id": "qwen25-3b", "created_at": "2025-06-12T09:08:32.360Z", "updated_at": "2026-03-10T07:31:51.709Z", "concurrency_cost": 1, "size": 3.1, "parameter_size": 3100000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen25", "family_name": "Qwen 2.5" }

alpha-ai/qwen2.5-reason-thought-lite

Feb 2025

0

5

A

{ "id": "gemma2-2b", "created_at": "2025-06-12T09:08:29.994Z", "updated_at": "2026-01-27T07:35:50.732Z", "concurrency_cost": 1, "size": 2.6, "parameter_size": 2600000000, "context_length": 8192, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "gemma2", "family_name": "Gemma 2" }

Ananya8154/Gemma-2-2B-Indian-Law

Feb 2025

4

14

A

{ "id": "llama33-70b", "created_at": "2025-10-15T03:53:00.000Z", "updated_at": "2026-01-27T07:36:45.252Z", "concurrency_cost": 4, "size": 70, "parameter_size": 70000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "llama33", "family_name": "Llama 3.3" }

Tarek07/Progenitor-V3.3-LLaMa-70B

Feb 2025

15

10

T

{ "id": "llama32-3b", "created_at": "2025-06-12T19:26:12.601Z", "updated_at": "2026-03-10T07:21:03.452Z", "concurrency_cost": 1, "size": 3.2, "parameter_size": 3200000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "llama32", "family_name": "Llama 3.2" }

TTahir/Llama3bv1

Feb 2025

0

7

T

{ "id": "mistral-24b", "created_at": "2025-12-02T14:53:00.000Z", "updated_at": "2026-01-27T07:58:09.462Z", "concurrency_cost": 2, "size": 24, "parameter_size": 24000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "mistral3", "family_name": "Mistral 3" }

ArliAI/Mistral-Small-24B-ArliAI-RPMax-v1.4

Feb 2025

10

7

A

{ "id": "qwen25-7b", "created_at": "2025-06-12T09:08:32.442Z", "updated_at": "2026-03-09T13:58:41.753Z", "concurrency_cost": 1, "size": 7.6, "parameter_size": 7600000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen25", "family_name": "Qwen 2.5" }

mlfoundations-dev/difficulty_sorting_random_seed_code

Feb 2025

0

2

M

{ "id": "llama31-8b", "created_at": "2025-10-15T03:53:00.000Z", "updated_at": "2026-01-27T07:58:09.462Z", "concurrency_cost": 1, "size": 8, "parameter_size": 8000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "llama31", "family_name": "Llama 3.1" }

UW-Madison-Lee-Lab/Llama-PRM800K

Feb 2025

0

399

U

{ "id": "llama32-1b", "created_at": "2025-06-12T19:26:12.362Z", "updated_at": "2026-03-10T07:19:26.530Z", "concurrency_cost": 1, "size": 1, "parameter_size": 1000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "llama32", "family_name": "Llama 3.2" }

BirendraSharma/llama3.2_1B_distractors_generation

Feb 2025

0

3

B

{ "id": "qwen25-32b", "created_at": "2025-06-12T09:08:32.600Z", "updated_at": "2026-01-27T07:58:09.463Z", "concurrency_cost": 2, "size": 32.8, "parameter_size": 32799999999.999996, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen25", "family_name": "Qwen 2.5" }

simplescaling/s1.1-32B

Feb 2025

99

90

S

{ "id": "llama3-8b", "created_at": "2025-12-02T14:43:00.000Z", "updated_at": "2026-03-06T06:13:02.721Z", "concurrency_cost": 1, "size": 8, "parameter_size": 8000000000, "context_length": 8192, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "llama3", "family_name": "Llama 3" }

SVECTOR-CORPORATION/Akshara-8B-Llama-Multilingual-V0.1

Feb 2025

13

36

S

{ "id": "mistral-nemo", "created_at": "1970-01-01T00:00:00.000Z", "updated_at": "2026-01-27T07:58:09.462Z", "concurrency_cost": 1, "size": 12, "parameter_size": 12000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "mistral", "family_name": "Mistral" }

DoppelReflEx/MN-12B-FoxFrame-Miyuri

Feb 2025

4

13

D

{ "id": "qwen25-3b", "created_at": "2025-06-12T09:08:32.360Z", "updated_at": "2026-03-10T07:31:51.709Z", "concurrency_cost": 1, "size": 3.1, "parameter_size": 3100000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen25", "family_name": "Qwen 2.5" }

yasserrmd/Coder-GRPO-3B

Feb 2025

7

1,416

Y

{ "id": "qwen25-7b", "created_at": "2025-06-12T09:08:32.442Z", "updated_at": "2026-03-09T13:58:41.753Z", "concurrency_cost": 1, "size": 7.6, "parameter_size": 7600000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen25", "family_name": "Qwen 2.5" }

mlfoundations-dev/difficulty_sorting_easy_seed_math

Feb 2025

0

4

M

{ "id": "llama31-8b", "created_at": "2025-10-15T03:53:00.000Z", "updated_at": "2026-01-27T07:58:09.462Z", "concurrency_cost": 1, "size": 8, "parameter_size": 8000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "llama31", "family_name": "Llama 3.1" }

allenai/Llama-3.1-Tulu-3.1-8B

Feb 2025

39

6,784

A

{ "id": "mistral-nemo", "created_at": "1970-01-01T00:00:00.000Z", "updated_at": "2026-01-27T07:58:09.462Z", "concurrency_cost": 1, "size": 12, "parameter_size": 12000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "mistral", "family_name": "Mistral" }

Delta-Vector/Archaeo-12B

Feb 2025

19

11

D

{ "id": "mistral-24b", "created_at": "2025-12-02T14:53:00.000Z", "updated_at": "2026-01-27T07:58:09.462Z", "concurrency_cost": 2, "size": 24, "parameter_size": 24000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "mistral3", "family_name": "Mistral 3" }

OddTheGreat/Machina_24B.V2

Feb 2025

10

12

O

{ "id": "mistral-24b", "created_at": "2025-12-02T14:53:00.000Z", "updated_at": "2026-01-27T07:58:09.462Z", "concurrency_cost": 2, "size": 24, "parameter_size": 24000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "mistral3", "family_name": "Mistral 3" }

arcee-ai/Arcee-Blitz

Feb 2025

79

29

A

{ "id": "qwen25-1b5", "created_at": "2025-06-12T09:08:32.277Z", "updated_at": "2026-03-10T07:30:56.645Z", "concurrency_cost": 1, "size": 1.5, "parameter_size": 1500000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen25", "family_name": "Qwen 2.5" }

MasterControlAIML/DeepSeek-R1-Qwen2.5-1.5b-SFT-R1-JSON-Unstructured-To-Structured

Feb 2025

11

97

M

{ "id": "mistral-24b", "created_at": "2025-12-02T14:53:00.000Z", "updated_at": "2026-01-27T07:58:09.462Z", "concurrency_cost": 2, "size": 24, "parameter_size": 24000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "mistral3", "family_name": "Mistral 3" }

dphn/Dolphin3.0-R1-Mistral-24B

Feb 2025

214

557

D

{ "id": "qwen2-0b5", "created_at": "2025-06-12T09:08:31.736Z", "updated_at": "2026-03-10T07:28:44.065Z", "concurrency_cost": 1, "size": 0.5, "parameter_size": 500000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen2", "family_name": "Qwen 2" }

alamios/DeepSeek-R1-DRAFT-Qwen2.5-Coder-0.5B

Feb 2025

2

12

A