Models released in the week of Feb 9, 2025

{ "id": "qwen2-0b5", "created_at": "2025-06-12T09:08:31.736Z", "updated_at": "2026-03-10T07:28:44.065Z", "concurrency_cost": 1, "size": 0.5, "parameter_size": 500000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen2", "family_name": "Qwen 2" }

Emilio407/Dolphin3.0-Qwen2.5-0.5B-GRPO-V1

Feb 2025

0

162

E

{ "id": "llama3-8b", "created_at": "2025-12-02T14:43:00.000Z", "updated_at": "2026-03-06T06:13:02.721Z", "concurrency_cost": 1, "size": 8, "parameter_size": 8000000000, "context_length": 8192, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "llama3", "family_name": "Llama 3" }

Sakuna/RAGent_gen

Feb 2025

0

164

S

{ "id": "llama32-3b", "created_at": "2025-06-12T19:26:12.601Z", "updated_at": "2026-03-10T07:21:03.452Z", "concurrency_cost": 1, "size": 3.2, "parameter_size": 3200000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "llama32", "family_name": "Llama 3.2" }

NousResearch/DeepHermes-3-Llama-3-3B-Preview

Feb 2025

39

206

N

{ "id": "qwen2-7b", "created_at": "2025-06-12T09:08:31.903Z", "updated_at": "2026-03-09T13:58:05.398Z", "concurrency_cost": 1, "size": 7.6, "parameter_size": 7600000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen2", "family_name": "Qwen 2" }

GAIR/LIMR

Feb 2025

7

219

G

{ "id": "mistral-nemo", "created_at": "1970-01-01T00:00:00.000Z", "updated_at": "2026-01-27T07:58:09.462Z", "concurrency_cost": 1, "size": 12, "parameter_size": 12000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "mistral", "family_name": "Mistral" }

allura-org/Bigger-Body-12b

Feb 2025

12

66

A

{ "id": "qwen25-7b", "created_at": "2025-06-12T09:08:32.442Z", "updated_at": "2026-03-09T13:58:41.753Z", "concurrency_cost": 1, "size": 7.6, "parameter_size": 7600000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen25", "family_name": "Qwen 2.5" }

Vikhrmodels/Qwen2.5-7B-Instruct-Tool-Planning-v0.1

Feb 2025

14

35

V

{ "id": "qwen25-3b", "created_at": "2025-06-12T09:08:32.360Z", "updated_at": "2026-03-10T07:31:51.709Z", "concurrency_cost": 1, "size": 3.1, "parameter_size": 3100000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen25", "family_name": "Qwen 2.5" }

AbleCredit/AbleCredit-R0-Qwen-2.5-3B-Instruct

Feb 2025

1

46

A

{ "id": "llama31-8b", "created_at": "2025-10-15T03:53:00.000Z", "updated_at": "2026-01-27T07:58:09.462Z", "concurrency_cost": 1, "size": 8, "parameter_size": 8000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "llama31", "family_name": "Llama 3.1" }

trendmicro-ailab/Llama-Primus-Merged

Feb 2025

14

88

T

{ "id": "llama33-70b", "created_at": "2025-10-15T03:53:00.000Z", "updated_at": "2026-01-27T07:36:45.252Z", "concurrency_cost": 4, "size": 70, "parameter_size": 70000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "llama33", "family_name": "Llama 3.3" }

Nexesenex/Llama_3.x_70b_Evasion_V1

Feb 2025

1

21

N

{ "id": "mistral-24b", "created_at": "2025-12-02T14:53:00.000Z", "updated_at": "2026-01-27T07:58:09.462Z", "concurrency_cost": 2, "size": 24, "parameter_size": 24000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "mistral3", "family_name": "Mistral 3" }

yentinglin/Mistral-Small-24B-Instruct-2501-reasoning

Feb 2025

59

30

Y

{ "id": "qwen25-0b5", "created_at": "2025-06-12T09:08:32.202Z", "updated_at": "2026-03-10T07:30:16.141Z", "concurrency_cost": 1, "size": 0.5, "parameter_size": 500000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen25", "family_name": "Qwen 2.5" }

thesantatitan/Qwen2-0.5B-svg-SFT

Feb 2025

1

12

T

{ "id": "qwen2-1b5", "created_at": "2025-06-12T09:08:31.819Z", "updated_at": "2026-03-10T07:29:28.502Z", "concurrency_cost": 1, "size": 1.5, "parameter_size": 1500000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen2", "family_name": "Qwen 2" }

unsloth/DeepScaleR-1.5B-Preview

Feb 2025

3

32

U

{ "id": "llama31-8b", "created_at": "2025-10-15T03:53:00.000Z", "updated_at": "2026-01-27T07:58:09.462Z", "concurrency_cost": 1, "size": 8, "parameter_size": 8000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "llama31", "family_name": "Llama 3.1" }

unsloth/Llama-3.1-8B

Feb 2025

6

3,299

U

{ "id": "llama31-8b", "created_at": "2025-10-15T03:53:00.000Z", "updated_at": "2026-01-27T07:58:09.462Z", "concurrency_cost": 1, "size": 8, "parameter_size": 8000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "llama31", "family_name": "Llama 3.1" }

unsloth/Llama-3.1-8B-Instruct

Feb 2025

13

314,278

U

{ "id": "llama33-70b", "created_at": "2025-10-15T03:53:00.000Z", "updated_at": "2026-01-27T07:36:45.252Z", "concurrency_cost": 4, "size": 70, "parameter_size": 70000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "llama33", "family_name": "Llama 3.3" }

Steelskull/L3.3-Cu-Mai-R1-70b

Feb 2025

25

151

S

{ "id": "llama3-8b", "created_at": "2025-12-02T14:43:00.000Z", "updated_at": "2026-03-06T06:13:02.721Z", "concurrency_cost": 1, "size": 8, "parameter_size": 8000000000, "context_length": 8192, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "llama3", "family_name": "Llama 3" }

lapisrocks/Llama-3-8B-Instruct-TAR-Cyber

Feb 2025

0

52

L

{ "id": "llama31-8b", "created_at": "2025-10-15T03:53:00.000Z", "updated_at": "2026-01-27T07:58:09.462Z", "concurrency_cost": 1, "size": 8, "parameter_size": 8000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "llama31", "family_name": "Llama 3.1" }

develops20/DeepSeek-R1-Distill-Llama-8B-Medical-COT

Feb 2025

1

50

D

{ "id": "llama33-70b", "created_at": "2025-10-15T03:53:00.000Z", "updated_at": "2026-01-27T07:36:45.252Z", "concurrency_cost": 4, "size": 70, "parameter_size": 70000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "llama33", "family_name": "Llama 3.3" }

LatitudeGames/Wayfarer-Large-70B-Llama-3.3

Feb 2025

95

52

L

{ "id": "qwen25-7b", "created_at": "2025-06-12T09:08:32.442Z", "updated_at": "2026-03-09T13:58:41.753Z", "concurrency_cost": 1, "size": 7.6, "parameter_size": 7600000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen25", "family_name": "Qwen 2.5" }

WiroAI/OpenR1-Qwen-7B-Turkish

Feb 2025

23

22

W

{ "id": "qwen2-1b5", "created_at": "2025-06-12T09:08:31.819Z", "updated_at": "2026-03-10T07:29:28.502Z", "concurrency_cost": 1, "size": 1.5, "parameter_size": 1500000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen2", "family_name": "Qwen 2" }

huihui-ai/DeepScaleR-1.5B-Preview-abliterated

Feb 2025

6

29

H

Model Releases

Week of Feb 9, 2025