From 8026a335a135af2e53c7d89652863312d7a3c936 Mon Sep 17 00:00:00 2001
From: Richard Zou <zou3519@users.noreply.github.com>
Date: Fri, 1 Aug 2025 10:11:29 -0400
Subject: [PATCH] [BugFix] Update AttnFusionPass cache key (#21947)

Signed-off-by: Richard Zou <zou3519@gmail.com>
---
 vllm/compilation/fusion_attn.py   | 3 +++
 vllm/compilation/inductor_pass.py | 3 ++-
 2 files changed, 5 insertions(+), 1 deletion(-)

diff --git a/vllm/compilation/fusion_attn.py b/vllm/compilation/fusion_attn.py
index 79518b6f4f965..a40a8caf34a88 100644
--- a/vllm/compilation/fusion_attn.py
+++ b/vllm/compilation/fusion_attn.py
@@ -164,3 +164,6 @@ class AttnFusionPass(VllmInductorPass):
         logger.debug("Fused quantization onto %s attention nodes", count)
         self.dump_graph(graph, "after_attn_fusion")
         self.end_and_log()
+
+    def uuid(self):  # cache key: hash of this pass's and the pattern's source
+        return VllmInductorPass.hash_source(self, AttentionStaticQuantPattern)
diff --git a/vllm/compilation/inductor_pass.py b/vllm/compilation/inductor_pass.py
index 810d0801e9f38..2a149c65b3877 100644
--- a/vllm/compilation/inductor_pass.py
+++ b/vllm/compilation/inductor_pass.py
@@ -76,9 +76,10 @@ class InductorPass(CustomGraphPass):
         for src in srcs:
             if isinstance(src, str):
                 src_str = src
-            elif isinstance(src, types.FunctionType):
+            elif isinstance(src, (types.FunctionType, type)):
                 src_str = inspect.getsource(src)
             else:
+                # object instance
                 src_str = inspect.getsource(src.__class__)
             hasher.update(src_str.encode("utf-8"))
         return hasher.hexdigest()