diff --git a/vllm/config.py b/vllm/config.py index a5512c657e03..db4398addae3 100644 --- a/vllm/config.py +++ b/vllm/config.py @@ -353,7 +353,8 @@ class CacheConfig: elif self.cache_dtype == "fp8": if not is_hip(): nvcc_cuda_version = get_nvcc_cuda_version() - if nvcc_cuda_version < Version("11.8"): + if nvcc_cuda_version is not None \ + and nvcc_cuda_version < Version("11.8"): raise ValueError( "FP8 is not supported when cuda version is" "lower than 11.8.")