diff --git a/vllm/distributed/device_communicators/all2all.py b/vllm/distributed/device_communicators/all2all.py
index c8c373b8adc9b..874147960bed7 100644
--- a/vllm/distributed/device_communicators/all2all.py
+++ b/vllm/distributed/device_communicators/all2all.py
@@ -143,6 +143,7 @@ class DeepEPAll2AllManagerBase(All2AllManagerBase):
         device = self.dp_group.device
         props = torch.cuda.get_device_properties(device)
         self.num_sms = props.multi_processor_count
+        print(f"Setting num sms to {self.num_sms}")
 
     def get_handle(self, kwargs):
         raise NotImplementedError