[NIXL][Bugfix] Fix NIXL/RDMA registration failure over CuMemAllocator (#29569)

Signed-off-by: Somoku <linsh0@protonmail.com>
Co-authored-by: Nicolò Lucchesi <nlucches@redhat.com>
2026-03-16 08:27:07 +08:00 · 2025-12-17 17:52:58 +08:00 · 2025-12-17 17:52:58 +08:00 · f4e884f222
commit f4e884f222
parent 3b1d440ede
1 changed files with 10 additions and 0 deletions
--- a/csrc/cumem_allocator.cpp
+++ b/csrc/cumem_allocator.cpp
@@ -107,6 +107,16 @@ void create_and_map(unsigned long long device, ssize_t size, CUdeviceptr d_mem,
  prop.location.id = device;
  prop.allocFlags.compressionType = CU_MEM_ALLOCATION_COMP_NONE;

+#ifndef USE_ROCM
+  int flag = 0;
+  CUDA_CHECK(cuDeviceGetAttribute(
+      &flag, CU_DEVICE_ATTRIBUTE_GPU_DIRECT_RDMA_WITH_CUDA_VMM_SUPPORTED,
+      device));
+  if (flag) {  // support GPUDirect RDMA if possible
+    prop.allocFlags.gpuDirectRDMACapable = 1;
+  }
+#endif
+
 #ifndef USE_ROCM
  // Allocate memory using cuMemCreate
  CUDA_CHECK(cuMemCreate(p_memHandle, size, &prop, 0));