# test_throughput_cli.py
# SPDX-License-Identifier: Apache-2.0
import subprocess

4
import os
5
6
import pytest

7
8
9
from ..utils import  models_path_prefix

# Model argument for the benchmark CLI: the "meta-llama/Llama-3.2-1B-Instruct"
# identifier joined onto models_path_prefix.
MODEL_NAME = os.path.join(
    models_path_prefix,
    "meta-llama/Llama-3.2-1B-Instruct",
)
10
11
12
13
14
15
16
17
18
19
20
21


@pytest.mark.benchmark
def test_bench_throughput():
    """Run ``vllm bench throughput`` in a subprocess and require exit code 0.

    The command is invoked with ``--input-len 32``, ``--output-len 1``,
    ``--enforce-eager`` and ``--load-format dummy`` against ``MODEL_NAME``.
    The captured stdout and stderr are printed, and stderr is also included
    in the assertion message when the command fails.
    """
    command = [
        "vllm", "bench", "throughput", "--model", MODEL_NAME, "--input-len",
        "32", "--output-len", "1", "--enforce-eager", "--load-format", "dummy"
    ]
    # check=False (the default, spelled out): the exit status is asserted
    # below so the failure message can carry the captured stderr.
    result = subprocess.run(command,
                            capture_output=True,
                            text=True,
                            check=False)
    print(result.stdout)
    print(result.stderr)

    assert result.returncode == 0, f"Benchmark failed: {result.stderr}"