diff --git a/vllm/v1/engine/utils.py b/vllm/v1/engine/utils.py index c0ec5c740312e..97d5c939a2853 100644 --- a/vllm/v1/engine/utils.py +++ b/vllm/v1/engine/utils.py @@ -555,8 +555,6 @@ def launch_core_engines( # sends requests only to colocated engines. client_local_only = offline_mode or external_dp_lb or (local_engine_count == dp_size) - # HACK: handle case with one pod per node. - client_local_only = True # Set up input and output addresses. addresses = EngineZmqAddresses(