Models

Warm

qwen25-3b

Qwen/Qwen2.5-3B-Instruct

345

9,736,189

Q
Warm

qwen3-0b6

Qwen/Qwen3-0.6B

866

7,556,100

Q
Warm

qwen25-7b

Qwen/Qwen2.5-7B-Instruct

939

6,871,836

Q
Warm

llama31-8b

meta-llama/Meta-Llama-3.1-8B-Instruct

5,118

5,990,330

M
Warm

llama31-8b

meta-llama/Llama-3.1-8B-Instruct

5,118

5,990,330

M
Warm

qwen3-4b

Qwen/Qwen3-4B-Instruct-2507

546

5,861,856

Q
Warm

qwen25-0b5

Qwen/Qwen2.5-Coder-0.5B-Instruct

54

5,722,977

Q
Warm

qwen25-1b5

Qwen/Qwen2.5-1.5B-Instruct

565

5,669,092

Q
Warm

qwen3-8b

Qwen/Qwen3-8B

800

4,687,314

Q
Warm

qwen3-32b

Qwen/Qwen3-32B

598

4,255,998

Q
Warm

qwen3-1b7

Qwen/Qwen3-1.7B

352

4,224,392

Q
Warm

mistral-v02-7b

mistralai/Mistral-7B-Instruct-v0.2

3,033

3,476,632

M
Warm

llama32-1b

meta-llama/Llama-3.2-1B-Instruct

1,197

3,446,266

M
Warm

llama32-1b

meta-llama/Llama-3.2-1B

2,211

3,183,315

M
Warm

qwen3-4b

Qwen/Qwen3-4B

488

3,007,362

Q
Warm

qwen25-1b5

deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B

1,405

2,631,589

D
Warm

gemma3t-1b

google/gemma-3-1b-it

745

2,468,157

G
Warm

qwen25-32b

deepseek-ai/DeepSeek-R1-Distill-Qwen-32B

1,473

2,457,444

D
Warm

qwen25-0b5

Qwen/Qwen2.5-0.5B-Instruct

407

2,249,777

Q
Warm

llama3-8b

meta-llama/Meta-Llama-3-8B

6,400

2,075,358

M