diff --git a/tests/v1/kv_connector/unit/test_nixl_connector.py b/tests/v1/kv_connector/unit/test_nixl_connector.py index 3860d7c85724a..b185936ab025f 100644 --- a/tests/v1/kv_connector/unit/test_nixl_connector.py +++ b/tests/v1/kv_connector/unit/test_nixl_connector.py @@ -229,6 +229,9 @@ class FakeNixlConnectorWorker(NixlConnectorWorker): num_blocks=1, block_len=self.block_len, attn_backend_name=self.backend_name, + # `self.kv_cache_layout` is only forced to HND when the vLLM engine + # is started, so we mock HND here. + kv_cache_layout="HND", ), remote_tp_size=remote_tp_size) return {0: remote_agent_name}