mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2025-12-10 08:14:54 +08:00
[Misc] Fix `Unable to detect current VLLM config. Defaulting to NHD kv cache layout` warning (#20400)
Signed-off-by: NickLucche <nlucches@redhat.com>
This commit is contained in:
parent
78fe77534b
commit
8d775dd30a
@ -97,10 +97,10 @@ def get_kv_connector_cache_layout():
|
|||||||
# used for faster transfer.
|
# used for faster transfer.
|
||||||
vllm_config = get_current_vllm_config()
|
vllm_config = get_current_vllm_config()
|
||||||
kv_config = vllm_config.kv_transfer_config
|
kv_config = vllm_config.kv_transfer_config
|
||||||
if vllm_config.model_config is None or kv_config is None:
|
if kv_config is not None and vllm_config.model_config is None:
|
||||||
logger.warning_once("Unable to detect current VLLM config. " \
|
logger.warning_once("Unable to detect current VLLM config. " \
|
||||||
"Defaulting to NHD kv cache layout.")
|
"Defaulting to NHD kv cache layout.")
|
||||||
else:
|
elif kv_config is not None:
|
||||||
use_mla = vllm_config.model_config.use_mla
|
use_mla = vllm_config.model_config.use_mla
|
||||||
if not use_mla and kv_config.kv_connector == "NixlConnector":
|
if not use_mla and kv_config.kv_connector == "NixlConnector":
|
||||||
logger.info_once("NixlConnector detected. Setting KV cache " \
|
logger.info_once("NixlConnector detected. Setting KV cache " \
|
||||||
|
|||||||
@ -138,7 +138,7 @@ def get_kv_cache_layout():
|
|||||||
if cache_layout is None:
|
if cache_layout is None:
|
||||||
cache_layout = get_kv_connector_cache_layout()
|
cache_layout = get_kv_connector_cache_layout()
|
||||||
else:
|
else:
|
||||||
logger.info_once("`FLASHINFER_KV_CACHE_LAYOUT` environment variable " \
|
logger.info_once("`VLLM_KV_CACHE_LAYOUT` environment variable " \
|
||||||
"detected. Setting KV cache layout to %s.", cache_layout)
|
"detected. Setting KV cache layout to %s.", cache_layout)
|
||||||
|
|
||||||
return cache_layout
|
return cache_layout
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user