Models released in the week of Mar 2, 2025

{ "id": "qwen25-3b", "created_at": "2025-06-12T09:08:32.360Z", "updated_at": "2026-03-10T07:31:51.709Z", "concurrency_cost": 1, "size": 3.1, "parameter_size": 3100000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen25", "family_name": "Qwen 2.5" }

Creekside/Qwen-3B-gsm8k-GRPO

Mar 2025

1

79

C

{ "id": "gemma2-9b", "created_at": "2025-05-12T23:44:18.135Z", "updated_at": "2026-03-09T13:45:02.013Z", "concurrency_cost": 1, "size": 9, "parameter_size": 9000000000, "context_length": 16384, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": null, "family_name": null }

tokyotech-llm/Gemma-2-Llama-Swallow-9b-pt-v0.1

Mar 2025

1

12,912

T

{ "id": "qwen2-1b5", "created_at": "2025-06-12T09:08:31.819Z", "updated_at": "2026-03-10T07:29:28.502Z", "concurrency_cost": 1, "size": 1.5, "parameter_size": 1500000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen2", "family_name": "Qwen 2" }

AlbertShu/Qwen2-1.5B-gsm8k

Mar 2025

0

23

A

{ "id": "qwen25-14b", "created_at": "2025-06-12T09:08:32.518Z", "updated_at": "2026-01-27T07:58:09.463Z", "concurrency_cost": 1, "size": 14.8, "parameter_size": 14800000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen25", "family_name": "Qwen 2.5" }

JungZoona/T3Q-qwen2.5-14b-v1.0-e3

Mar 2025

57

146

J

{ "id": "qwen25-7b", "created_at": "2025-06-12T09:08:32.442Z", "updated_at": "2026-03-09T13:58:41.753Z", "concurrency_cost": 1, "size": 7.6, "parameter_size": 7600000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen25", "family_name": "Qwen 2.5" }

simplescaling/s1.1-7B

Mar 2025

6

29

S

{ "id": "qwen2-1b5", "created_at": "2025-06-12T09:08:31.819Z", "updated_at": "2026-03-10T07:29:28.502Z", "concurrency_cost": 1, "size": 1.5, "parameter_size": 1500000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen2", "family_name": "Qwen 2" }

Xtra-Computing/XtraGPT-1.5B

Mar 2025

3

36

X

{ "id": "llama32-3b", "created_at": "2025-06-12T19:26:12.601Z", "updated_at": "2026-03-10T07:21:03.452Z", "concurrency_cost": 1, "size": 3.2, "parameter_size": 3200000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "llama32", "family_name": "Llama 3.2" }

Xtra-Computing/XtraGPT-3B

Mar 2025

3

13

X

{ "id": "qwen25-14b", "created_at": "2025-06-12T09:08:32.518Z", "updated_at": "2026-01-27T07:58:09.463Z", "concurrency_cost": 1, "size": 14.8, "parameter_size": 14800000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen25", "family_name": "Qwen 2.5" }

simplescaling/s1.1-14B

Mar 2025

4

11

S

{ "id": "gemma2-2b", "created_at": "2025-06-12T09:08:29.994Z", "updated_at": "2026-01-27T07:35:50.732Z", "concurrency_cost": 1, "size": 2.6, "parameter_size": 2600000000, "context_length": 8192, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "gemma2", "family_name": "Gemma 2" }

mshojaei77/gemma-2-2b-fa-v2

Mar 2025

4

34

M

{ "id": "qwen25-3b", "created_at": "2025-06-12T09:08:32.360Z", "updated_at": "2026-03-10T07:31:51.709Z", "concurrency_cost": 1, "size": 3.1, "parameter_size": 3100000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen25", "family_name": "Qwen 2.5" }

BanglaLLM/Bangla-s1k-qwen-2.5-3B-Instruct

Mar 2025

2

168

B

{ "id": "llama33-70b", "created_at": "2025-10-15T03:53:00.000Z", "updated_at": "2026-01-27T07:36:45.252Z", "concurrency_cost": 4, "size": 70, "parameter_size": 70000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "llama33", "family_name": "Llama 3.3" }

Tarek07/Dungeonmaster-V2.4-Expanded-LLaMa-70B

Mar 2025

12

15

T

{ "id": "llama32-1b", "created_at": "2025-06-12T19:26:12.362Z", "updated_at": "2026-03-10T07:19:26.530Z", "concurrency_cost": 1, "size": 1, "parameter_size": 1000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "llama32", "family_name": "Llama 3.2" }

apider/Llama-3.2-1B-Instruct-FineTome-100k

Mar 2025

0

7

A

{ "id": "qwen25-3b", "created_at": "2025-06-12T09:08:32.360Z", "updated_at": "2026-03-10T07:31:51.709Z", "concurrency_cost": 1, "size": 3.1, "parameter_size": 3100000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen25", "family_name": "Qwen 2.5" }

tinycompany/SigmaBoi-bge-m3

Mar 2025

0

10

T

{ "id": "qwen25-32b", "created_at": "2025-06-12T09:08:32.600Z", "updated_at": "2026-01-27T07:58:09.463Z", "concurrency_cost": 2, "size": 32.8, "parameter_size": 32799999999.999996, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen25", "family_name": "Qwen 2.5" }

trashpanda-org/QwQ-32B-Snowdrop-v0

Mar 2025

103

59

T

{ "id": "llama32-1b", "created_at": "2025-06-12T19:26:12.362Z", "updated_at": "2026-03-10T07:19:26.530Z", "concurrency_cost": 1, "size": 1, "parameter_size": 1000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "llama32", "family_name": "Llama 3.2" }

jtatman/llama-3.2-1b-lewd-mental-occult

Mar 2025

3

11

J

{ "id": "llama33-70b", "created_at": "2025-10-15T03:53:00.000Z", "updated_at": "2026-01-27T07:36:45.252Z", "concurrency_cost": 4, "size": 70, "parameter_size": 70000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "llama33", "family_name": "Llama 3.3" }

Tarek07/Dungeonmaster-V2.2-Expanded-LLaMa-70B

Mar 2025

16

34

T

{ "id": "llama31-8b", "created_at": "2025-10-15T03:53:00.000Z", "updated_at": "2026-01-27T07:58:09.462Z", "concurrency_cost": 1, "size": 8, "parameter_size": 8000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "llama31", "family_name": "Llama 3.1" }

ccibeekeoc42/Llama-3.2-8B-Instruct-bnb-4bit_merged_16bit_finetune_2025-03-07

Mar 2025

0

6

C

{ "id": "qwen25-32b", "created_at": "2025-06-12T09:08:32.600Z", "updated_at": "2026-01-27T07:58:09.463Z", "concurrency_cost": 2, "size": 32.8, "parameter_size": 32799999999.999996, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen25", "family_name": "Qwen 2.5" }

huihui-ai/QwQ-32B-abliterated

Mar 2025

108

142

H

{ "id": "qwen2-7b", "created_at": "2025-06-12T09:08:31.903Z", "updated_at": "2026-03-09T13:58:05.398Z", "concurrency_cost": 1, "size": 7.6, "parameter_size": 7600000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen2", "family_name": "Qwen 2" }

Trendyol/Trendyol-LLM-7B-chat-v4.1.0

Mar 2025

37

294

T

{ "id": "llama31-8b", "created_at": "2025-10-15T03:53:00.000Z", "updated_at": "2026-01-27T07:58:09.462Z", "concurrency_cost": 1, "size": 8, "parameter_size": 8000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "llama31", "family_name": "Llama 3.1" }

kehanlu/llama-3.2-8B-Instruct

Mar 2025

2

32

K

Model Releases

Week of Mar 2, 2025