Models

Warm

llama31-8b

meta-llama/Llama-3.1-8B-Instruct

5,203

10,682,398

M
Warm

llama31-8b

meta-llama/Meta-Llama-3.1-8B-Instruct

5,203

10,682,398

M
Warm

qwen3-0b6

Qwen/Qwen3-0.6B

930

8,579,434

Q
Warm

qwen25-3b

Qwen/Qwen2.5-3B-Instruct

357

7,486,416

Q
Warm

qwen25-7b

Qwen/Qwen2.5-7B-Instruct

991

5,985,599

Q
Warm

qwen25-1b5

Qwen/Qwen2.5-1.5B-Instruct

576

5,478,608

Q
Warm

qwen3-8b

Qwen/Qwen3-8B

835

4,368,556

Q
Warm

qwen25-0b5

Qwen/Qwen2.5-Coder-0.5B-Instruct

55

4,067,143

Q
Warm

qwen3-4b

Qwen/Qwen3-4B

512

3,827,678

Q
Warm

qwen3-4b

Qwen/Qwen3-4B-Instruct-2507

611

3,564,447

Q
Warm

qwen3-1b7

Qwen/Qwen3-1.7B

373

3,213,245

Q
Warm

llama32-1b

meta-llama/Llama-3.2-1B-Instruct

1,225

3,197,392

M
Warm

qwen25-14b

Qwen/Qwen2.5-14B-Instruct

297

2,971,441

Q
Warm

qwen25-32b

deepseek-ai/DeepSeek-R1-Distill-Qwen-32B

1,483

2,747,300

D
Warm

qwen25-32b

Qwen/Qwen2.5-32B-Instruct

315

2,624,866

Q
Warm

qwen25-1b5

deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B

1,420

2,585,477

D
Warm

mistral-v02-7b

mistralai/Mistral-7B-Instruct-v0.2

3,043

2,412,030

M
Warm

gemma3t-1b

google/gemma-3-1b-it

782

2,356,728

G
Warm

llama3-8b

meta-llama/Meta-Llama-3-8B

6,412

2,142,122

M
Warm

qwen25-0b5

Qwen/Qwen2.5-0.5B-Instruct

426

2,089,673

Q