diff --git a/vllm/model_executor/layers/fused_moe/fused_moe.py b/vllm/model_executor/layers/fused_moe/fused_moe.py index b7415148d812..7ad3ce1397b3 100644 --- a/vllm/model_executor/layers/fused_moe/fused_moe.py +++ b/vllm/model_executor/layers/fused_moe/fused_moe.py @@ -819,8 +819,8 @@ def get_config_file_name( ) -> str: device_name = current_platform.get_device_name().replace(" ", "_") # Set device_name to H200 if a device from the H200 family is detected - if "H200" in device_name: - device_name = "H200" + if "H200" in device_name.split("_"): + device_name = "NVIDIA_H200" dtype_selector = "" if not dtype else f",dtype={dtype}" block_shape_selector = ( "" if not block_shape or not all(block_shape) else f",block_shape={block_shape}"