From 721dcb2ebc3c6322579bf463371fa9c53077c368 Mon Sep 17 00:00:00 2001
From: mgoin
Date: Wed, 9 Jul 2025 12:55:41 -0400
Subject: [PATCH] Change cmakelists

Signed-off-by: mgoin
---
 CMakeLists.txt | 7 +++++++
 1 file changed, 7 insertions(+)

diff --git a/CMakeLists.txt b/CMakeLists.txt
index 0129f85123fb9..c13961b55dc54 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -171,6 +171,13 @@ if(NVCC_THREADS AND VLLM_GPU_LANG STREQUAL "CUDA")
   list(APPEND VLLM_GPU_FLAGS "--threads=${NVCC_THREADS}")
 endif()
 
+#
+# Set nvcc fatbin compression (gated on a CUDA 12.8+ compiler); one flag per list element.
+#
+if(VLLM_GPU_LANG STREQUAL "CUDA" AND CMAKE_CUDA_COMPILER_VERSION VERSION_GREATER_EQUAL 12.8)
+  list(APPEND VLLM_GPU_FLAGS "-Xfatbin" "-compress-all" "-compress-mode=size")
+endif()
+
 #
 # Use FetchContent for C++ dependencies that are compiled as part of vLLM's build process.