Models

Warm

llama31-8b

meta-llama/Llama-3.1-8B-Instruct

5,248

11,955,861

M
Warm

llama31-8b

meta-llama/Meta-Llama-3.1-8B-Instruct

5,248

11,955,861

M
Warm

qwen25-3b

Qwen/Qwen2.5-3B-Instruct

363

10,554,542

Q
Warm

qwen3-0b6

Qwen/Qwen3-0.6B

964

7,920,303

Q
Warm

qwen25-7b

Qwen/Qwen2.5-7B-Instruct

1,005

6,021,121

Q
Warm

qwen25-1b5

Qwen/Qwen2.5-1.5B-Instruct

582

5,656,233

Q
Warm

qwen25-14b

Qwen/Qwen2.5-14B-Instruct

298

3,899,304

Q
Warm

qwen3-8b

Qwen/Qwen3-8B

851

3,778,670

Q
Warm

qwen3-1b7

Qwen/Qwen3-1.7B

379

3,733,540

Q
Warm

qwen3-4b

Qwen/Qwen3-4B

517

3,727,090

Q
Warm

qwen25-32b

Qwen/Qwen2.5-32B-Instruct

317

3,383,863

Q
Warm

qwen25-0b5

Qwen/Qwen2.5-Coder-0.5B-Instruct

58

3,081,474

Q
Warm

llama32-1b

meta-llama/Llama-3.2-1B-Instruct

1,234

2,772,164

M
Warm

qwen25-32b

deepseek-ai/DeepSeek-R1-Distill-Qwen-32B

1,488

2,383,318

D
Warm

llama31-8b

meta-llama/Llama-3.1-8B

2,014

2,344,936

M
Warm

llama31-8b

meta-llama/Meta-Llama-3.1-8B

2,014

2,344,936

M
Warm

gemma3t-1b

google/gemma-3-1b-it

793

2,333,012

G
Warm

mistral-v02-7b

mistralai/Mistral-7B-Instruct-v0.2

3,049

2,201,199

M
Warm

qwen3-4b

Qwen/Qwen3-4B-Instruct-2507

628

2,179,555

Q
Warm

qwen25-0b5

Qwen/Qwen2.5-0.5B-Instruct

436

1,825,157

Q