conftest.py 1.2 KB
Newer Older
1
2
import pytest
import pytest_asyncio
zhuwenwen's avatar
zhuwenwen committed
3
# from huggingface_hub import snapshot_download
4
5

from tests.utils import RemoteOpenAIServer
6
from vllm.platforms import current_platform
7
8
9
10
11
12
13
14

from .utils import ARGS, CONFIGS, ServerConfig


# for each server config, return the config (model download is disabled)
@pytest.fixture(scope="session", params=CONFIGS.keys())
def server_config(request):
    """Provide the server configuration selected by the current param.

    The fixture is parametrized over the keys of ``CONFIGS``, so every
    fixture or test that depends on it runs once per entry.

    When running on ROCm, a config whose ``supports_rocm`` entry is falsy
    is skipped; a missing ``supports_rocm`` entry counts as supported.

    Yields:
        The ``CONFIGS`` entry for ``request.param``.
    """
    config = CONFIGS[request.param]

    if current_platform.is_rocm() and not config.get("supports_rocm", True):
        model_name = config["model"]
        pytest.skip(
            f"The {model_name} model can't be tested on the ROCm platform")

    # NOTE: pre-downloading the model and tokenizer is currently disabled
    # (the matching huggingface_hub import is commented out as well):
    # snapshot_download(config["model"])

    # Reuse the entry looked up above rather than indexing CONFIGS again.
    yield config


# run this for each server config
@pytest.fixture(scope="session")
def server(request, server_config: ServerConfig):
    """Yield a running ``RemoteOpenAIServer`` for the given server config.

    The server is launched for ``server_config["model"]`` with the shared
    ``ARGS`` followed by the config's own ``"arguments"``, and is passed
    ``max_wait_seconds=480``. Leaving the ``with`` block after the yield
    hands cleanup to the server's context manager.
    """
    model_name = server_config["model"]
    launch_args = ARGS + server_config["arguments"]

    remote_server_cm = RemoteOpenAIServer(
        model_name,
        launch_args,
        max_wait_seconds=480,
    )
    with remote_server_cm as remote_server:
        yield remote_server


@pytest_asyncio.fixture
async def client(server: RemoteOpenAIServer):
    """Yield an async client obtained from the running test server.

    The client comes from ``server.get_async_client()`` and is used as an
    async context manager, so it is exited once the dependent test is done.
    """
    client_cm = server.get_async_client()
    async with client_cm as openai_client:
        yield openai_client