# kv_transfer_state.py (2.22 KB)
1
# SPDX-License-Identifier: Apache-2.0
2
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
3
from typing import TYPE_CHECKING
4
5

from vllm.distributed.kv_transfer.kv_connector.base import KVConnectorBaseType
6
7
8
9
10
from vllm.distributed.kv_transfer.kv_connector.factory import KVConnectorFactory
from vllm.distributed.kv_transfer.kv_connector.v1 import (
    KVConnectorBase_V1,
    KVConnectorRole,
)
11
12
13

if TYPE_CHECKING:
    from vllm.config import VllmConfig
14
    from vllm.v1.kv_cache_interface import KVCacheConfig
15

16
# Module-wide KV connector instance. It is None until
# ensure_kv_transfer_initialized() assigns a connector, and it is reset to
# None by ensure_kv_transfer_shutdown().
_KV_CONNECTOR_AGENT: KVConnectorBaseType | None = None
17
18
19
20


def get_kv_transfer_group() -> KVConnectorBaseType:
    """Return the module-wide KV connector.

    Returns:
        The connector currently stored in ``_KV_CONNECTOR_AGENT``.

    Raises:
        AssertionError: If no connector has been stored yet. Callers that
            cannot guarantee initialization should check
            ``has_kv_transfer_group()`` first.
    """
    assert _KV_CONNECTOR_AGENT is not None, (
        "disaggregated KV cache transfer parallel group is not initialized"
    )
    return _KV_CONNECTOR_AGENT


def has_kv_transfer_group() -> bool:
    """Report whether a module-wide KV connector is currently set."""
    current = _KV_CONNECTOR_AGENT
    return not (current is None)


30
def is_v1_kv_transfer_group(connector: KVConnectorBaseType | None = None) -> bool:
    """Check if the KV connector is the v1 connector.

    If the argument is None, the global KV connector is checked instead.

    Args:
        connector: The KV connector to check. If None, it will check the
            global KV connector.

    Returns:
        True if the connector under test is an instance of
        ``KVConnectorBase_V1``; False otherwise, including when no connector
        was passed and no global connector is set.

    Note:
        This function will no longer be needed after the v1 KV connector
        becomes the default.
    """
    # Fall back to the module-wide connector when the caller passed nothing.
    if connector is None:
        connector = _KV_CONNECTOR_AGENT

    # Still nothing to inspect: there is no connector at all.
    if connector is None:
        return False

    return isinstance(connector, KVConnectorBase_V1)


51
def ensure_kv_transfer_initialized(
    vllm_config: "VllmConfig", kv_cache_config: "KVCacheConfig | None" = None
) -> None:
    """Initialize the KV cache transfer parallel group if needed.

    Creates the module-wide KV connector through
    ``KVConnectorFactory.create_connector`` with the ``WORKER`` role and
    stores it in ``_KV_CONNECTOR_AGENT``.

    The call is a no-op when any of the following holds:
      * ``vllm_config.kv_transfer_config`` is None;
      * ``kv_transfer_config.is_kv_transfer_instance`` is falsy;
      * a connector is already stored (repeated calls do not replace it).

    Args:
        vllm_config: Configuration object; its ``kv_transfer_config``
            attribute decides whether a connector is created.
        kv_cache_config: Optional KV cache configuration, forwarded
            unchanged to the connector factory.
    """
    global _KV_CONNECTOR_AGENT

    if vllm_config.kv_transfer_config is None:
        return

    if (
        vllm_config.kv_transfer_config.is_kv_transfer_instance
        and _KV_CONNECTOR_AGENT is None
    ):
        _KV_CONNECTOR_AGENT = KVConnectorFactory.create_connector(
            config=vllm_config,
            role=KVConnectorRole.WORKER,
            kv_cache_config=kv_cache_config,
        )
72
73
74
75
76
77
78


def ensure_kv_transfer_shutdown() -> None:
    """Shut down and clear the module-wide KV connector, if one is set.

    Does nothing when no connector is stored. Otherwise calls the
    connector's ``shutdown()`` and then resets the global to None.
    """
    global _KV_CONNECTOR_AGENT

    agent = _KV_CONNECTOR_AGENT
    if agent is None:
        return

    agent.shutdown()
    # Reached only if shutdown() returned normally.
    _KV_CONNECTOR_AGENT = None