Models released in the week of Dec 8, 2024

{ "id": "qwen2-0b5", "created_at": "2025-06-12T09:08:31.736Z", "updated_at": "2026-03-10T07:28:44.065Z", "concurrency_cost": 1, "size": 0.5, "parameter_size": 500000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen2", "family_name": "Qwen 2" }

axel-datos/qwen2.5-0.5b-instruct_gsm8k_full-finetuningV2

Dec 2024

0

28

A

{ "id": "qwen2-0b5", "created_at": "2025-06-12T09:08:31.736Z", "updated_at": "2026-03-10T07:28:44.065Z", "concurrency_cost": 1, "size": 0.5, "parameter_size": 500000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen2", "family_name": "Qwen 2" }

axel-datos/qwen2.5-0.5b-instruct_MATH_full-finetuningV2

Dec 2024

0

28

A

{ "id": "mistral-nemo", "created_at": "1970-01-01T00:00:00.000Z", "updated_at": "2026-01-27T07:58:09.462Z", "concurrency_cost": 1, "size": 12, "parameter_size": 12000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "mistral", "family_name": "Mistral" }

redrix/patricide-12B-Unslop-Mell-v2

Dec 2024

34

31

R

{ "id": "llama32-1b", "created_at": "2025-06-12T19:26:12.362Z", "updated_at": "2026-03-10T07:19:26.530Z", "concurrency_cost": 1, "size": 1, "parameter_size": 1000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "llama32", "family_name": "Llama 3.2" }

typhoon-ai/llama3.2-typhoon2-1b

Dec 2024

2

624

T

{ "id": "llama32-1b", "created_at": "2025-06-12T19:26:12.362Z", "updated_at": "2026-03-10T07:19:26.530Z", "concurrency_cost": 1, "size": 1, "parameter_size": 1000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "llama32", "family_name": "Llama 3.2" }

typhoon-ai/llama3.2-typhoon2-1b-instruct

Dec 2024

5

673

T

{ "id": "llama32-3b", "created_at": "2025-06-12T19:26:12.601Z", "updated_at": "2026-03-10T07:21:03.452Z", "concurrency_cost": 1, "size": 3.2, "parameter_size": 3200000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "llama32", "family_name": "Llama 3.2" }

HuggingFaceTB/finemath-ablation-finemath-infimath-3plus

Dec 2024

0

9

H

{ "id": "gemma2-9b", "created_at": "2025-05-12T23:44:18.135Z", "updated_at": "2026-03-09T13:45:02.013Z", "concurrency_cost": 1, "size": 9, "parameter_size": 9000000000, "context_length": 16384, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": null, "family_name": null }

testmoto/gemma-2-9b-synthetic_coding

Dec 2024

2

322

T

{ "id": "qwen2-0b5", "created_at": "2025-06-12T09:08:31.736Z", "updated_at": "2026-03-10T07:28:44.065Z", "concurrency_cost": 1, "size": 0.5, "parameter_size": 500000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen2", "family_name": "Qwen 2" }

ZzWater/viitor-voice-mix

Dec 2024

5

15

Z

{ "id": "qwen25-7b", "created_at": "2025-06-12T09:08:32.442Z", "updated_at": "2026-03-09T13:58:41.753Z", "concurrency_cost": 1, "size": 7.6, "parameter_size": 7600000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen25", "family_name": "Qwen 2.5" }

prithivMLmods/QwQ-LCoT-7B-Instruct

Dec 2024

20

26

P

{ "id": "llama31-8b", "created_at": "2025-10-15T03:53:00.000Z", "updated_at": "2026-01-27T07:58:09.462Z", "concurrency_cost": 1, "size": 8, "parameter_size": 8000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "llama31", "family_name": "Llama 3.1" }

Lugha-Llama/Lugha-Llama-8B-wura_edu

Dec 2024

1

92

L

{ "id": "llama32-1b", "created_at": "2025-06-12T19:26:12.362Z", "updated_at": "2026-03-10T07:19:26.530Z", "concurrency_cost": 1, "size": 1, "parameter_size": 1000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "llama32", "family_name": "Llama 3.2" }

axel-datos/Llama-3.2-1B_gsm8k_full-finetuning

Dec 2024

0

9

A

{ "id": "qwen2-0b5", "created_at": "2025-06-12T09:08:31.736Z", "updated_at": "2026-03-10T07:28:44.065Z", "concurrency_cost": 1, "size": 0.5, "parameter_size": 500000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen2", "family_name": "Qwen 2" }

axel-datos/qwen2.5-0.5b-instruct_gsm8k_full-finetuning

Dec 2024

0

29

A

{ "id": "qwen2-0b5", "created_at": "2025-06-12T09:08:31.736Z", "updated_at": "2026-03-10T07:28:44.065Z", "concurrency_cost": 1, "size": 0.5, "parameter_size": 500000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen2", "family_name": "Qwen 2" }

axel-datos/qwen2.5-0.5b-instruct_MATH_full-finetuning

Dec 2024

0

37

A

{ "id": "qwen2-1b5", "created_at": "2025-06-12T09:08:31.819Z", "updated_at": "2026-03-10T07:29:28.502Z", "concurrency_cost": 1, "size": 1.5, "parameter_size": 1500000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen2", "family_name": "Qwen 2" }

thirdeyeai/Qwen2.5-1.5B-Instruct-uncensored

Dec 2024

2

1,626

T

{ "id": "gemma2-2b", "created_at": "2025-06-12T09:08:29.994Z", "updated_at": "2026-01-27T07:35:50.732Z", "concurrency_cost": 1, "size": 2.6, "parameter_size": 2600000000, "context_length": 8192, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "gemma2", "family_name": "Gemma 2" }

Efficient-Large-Model/gemma-2-2b-it

Dec 2024

3

122,445

E

{ "id": "qwen2-7b", "created_at": "2025-06-12T09:08:31.903Z", "updated_at": "2026-03-09T13:58:05.398Z", "concurrency_cost": 1, "size": 7.6, "parameter_size": 7600000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen2", "family_name": "Qwen 2" }

joaomsimoes/Newsie-Qwen-2.5-7b-Instruct

Dec 2024

0

31

J

{ "id": "llama32-1b", "created_at": "2025-06-12T19:26:12.362Z", "updated_at": "2026-03-10T07:19:26.530Z", "concurrency_cost": 1, "size": 1, "parameter_size": 1000000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "llama32", "family_name": "Llama 3.2" }

vietanh0802/llama-3.2-1B-IELTS-eval-finetuned-3-times

Dec 2024

0

8

V

{ "id": "qwen25-3b", "created_at": "2025-06-12T09:08:32.360Z", "updated_at": "2026-03-10T07:31:51.709Z", "concurrency_cost": 1, "size": 3.1, "parameter_size": 3100000000, "context_length": 32768, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": "qwen25", "family_name": "Qwen 2.5" }

prithivMLmods/QwQ-LCoT-3B-Instruct

Dec 2024

5

25

P

{ "id": "gemma2-9b", "created_at": "2025-05-12T23:44:18.135Z", "updated_at": "2026-03-09T13:45:02.013Z", "concurrency_cost": 1, "size": 9, "parameter_size": 9000000000, "context_length": 16384, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": null, "family_name": null }

themex1380/Gemma-2-9B-Uncensored

Dec 2024

2

6

T

{ "id": "gemma2-9b", "created_at": "2025-05-12T23:44:18.135Z", "updated_at": "2026-03-09T13:45:02.013Z", "concurrency_cost": 1, "size": 9, "parameter_size": 9000000000, "context_length": 16384, "is_moe": false, "active_parameters": null, "vision_supported": false, "input_modalities": [ "text" ], "output_modalities": [ "text" ], "family": null, "family_name": null }

themex1380/Gemma-2-9B-Chinese-Chat-Uncensored

Dec 2024

3

575

T

Model Releases

Week of Dec 8, 2024