Unverified commit 8d775dd3, authored by Nicolò Lucchesi, committed by GitHub
Browse files

[Misc] Fix `Unable to detect current VLLM config. Defaulting to NHD kv cache layout` warning


[Misc] Fix `Unable to detect current VLLM config. Defaulting to NHD kv cache layout` warning (#20400)
Signed-off-by: NickLucche <nlucches@redhat.com>
parent 78fe7753
...@@ -97,10 +97,10 @@ def get_kv_connector_cache_layout(): ...@@ -97,10 +97,10 @@ def get_kv_connector_cache_layout():
# used for faster transfer. # used for faster transfer.
vllm_config = get_current_vllm_config() vllm_config = get_current_vllm_config()
kv_config = vllm_config.kv_transfer_config kv_config = vllm_config.kv_transfer_config
if vllm_config.model_config is None or kv_config is None: if kv_config is not None and vllm_config.model_config is None:
logger.warning_once("Unable to detect current VLLM config. " \ logger.warning_once("Unable to detect current VLLM config. " \
"Defaulting to NHD kv cache layout.") "Defaulting to NHD kv cache layout.")
else: elif kv_config is not None:
use_mla = vllm_config.model_config.use_mla use_mla = vllm_config.model_config.use_mla
if not use_mla and kv_config.kv_connector == "NixlConnector": if not use_mla and kv_config.kv_connector == "NixlConnector":
logger.info_once("NixlConnector detected. Setting KV cache " \ logger.info_once("NixlConnector detected. Setting KV cache " \
......
...@@ -138,7 +138,7 @@ def get_kv_cache_layout(): ...@@ -138,7 +138,7 @@ def get_kv_cache_layout():
if cache_layout is None: if cache_layout is None:
cache_layout = get_kv_connector_cache_layout() cache_layout = get_kv_connector_cache_layout()
else: else:
logger.info_once("`FLASHINFER_KV_CACHE_LAYOUT` environment variable " \ logger.info_once("`VLLM_KV_CACHE_LAYOUT` environment variable " \
"detected. Setting KV cache layout to %s.", cache_layout) "detected. Setting KV cache layout to %s.", cache_layout)
return cache_layout return cache_layout
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment