Address PR feedback: simplify comments, remove extra assertion, and improve docstrings

Co-authored-by: ProExpertProg <11367180+ProExpertProg@users.noreply.github.com>
2026-05-24 03:37:54 +08:00 · 2025-08-21 22:26:09 +00:00 · 2025-08-21 22:26:09 +00:00 · 91735e9c1c
commit 91735e9c1c
parent 865b0bfafd
4 changed files with 5 additions and 17 deletions
--- a/tests/compile/piecewise/test_multiple_graphs.py
+++ b/tests/compile/piecewise/test_multiple_graphs.py
@ -16,8 +16,7 @@ from vllm.config import (CompilationConfig, CompilationLevel, VllmConfig,
 from vllm.envs import VLLM_USE_V1
 from vllm.forward_context import set_forward_context
-# Import shared test operations
+# This import automatically registers torch ops for testing (like silly.attention)
 # The standard attention operation is automatically registered when imported
 import tests.compile.test_operations
 BATCH_SIZE = 32
@ -320,9 +319,5 @@ def test_multi_graph_piecewise_compile_outputs_equal():
    ):
        outputs.append(run_model(vllm_config, model, inputs))
    # Generally don't expect outputs with and without inductor
    # to be bitwise equivalent
    assert torch.allclose(outputs[0], outputs[1])
    # Expect bitwise equivalence using inductor w/ and w/o cudagraph
    assert torch.equal(outputs[0], outputs[2])
--- a/tests/compile/piecewise/test_simple.py
+++ b/tests/compile/piecewise/test_simple.py
@ -15,7 +15,7 @@ from vllm.config import (CompilationConfig, CompilationLevel, CUDAGraphMode,
 from vllm.envs import VLLM_USE_V1
 from vllm.forward_context import BatchDescriptor, set_forward_context
-# Import shared test operations  
+# This import also automatically registers torch ops for testing (like silly.attention)
 from tests.compile.test_operations import (
    get_global_counter, reset_global_counter
 )
--- a/tests/compile/piecewise/test_toy_llama.py
+++ b/tests/compile/piecewise/test_toy_llama.py
@ -470,4 +470,4 @@ def benchmark():
 if __name__ == "__main__":
-    benchmark()
+    pass
--- a/tests/compile/test_operations.py
+++ b/tests/compile/test_operations.py
@ -3,14 +3,7 @@
 """
 Shared PyTorch custom operations for compilation tests.
-This module provides a centralized place to define and register custom
+Centralizes custom operation definitions to avoid duplicate registrations.
 PyTorch operations used across multiple compilation tests. This avoids
 duplicate operation registrations that would cause RuntimeErrors when
 running tests together.
 The main "attention" operation is automatically registered when this module
 is imported. Individual test files can access the global counter functionality
 through helper functions.
 """
 import torch
@ -23,7 +16,7 @@ from vllm.utils import direct_register_custom_op
 silly_lib = Library("silly", "FRAGMENT")
-# Global counter that all tests can use or ignore
+# Global counter that counts the number of times attention is invoked
 _global_counter = 0
`@ -470,4 +470,4 @@ def benchmark():`


	`if __name__ == "__main__":`	`if __name__ == "__main__":`
	`benchmark()`	`pass`