diff --git a/vllm/model_executor/layers/quantization/compressed_tensors/utils.py b/vllm/model_executor/layers/quantization/compressed_tensors/utils.py index d700a0b15a81e..4ea79531efe7e 100644 --- a/vllm/model_executor/layers/quantization/compressed_tensors/utils.py +++ b/vllm/model_executor/layers/quantization/compressed_tensors/utils.py @@ -236,7 +236,7 @@ def _match_fused_layer(layer_name: str, for type_suffix in possible_layer_types) if is_same_parent and is_matching_type and all( - '.'.join([parent_path, type_suffix]) + (f"{parent_path}.{type_suffix}" in target_layers) for type_suffix in possible_layer_types): return target