diff --git a/docs/mkdocs/hooks/generate_argparse.py b/docs/mkdocs/hooks/generate_argparse.py index 9bdb1a0bb2d11..d6d33fbf61ebb 100644 --- a/docs/mkdocs/hooks/generate_argparse.py +++ b/docs/mkdocs/hooks/generate_argparse.py @@ -92,7 +92,7 @@ def auto_mock(module_name: str, attr: str, max_mocks: int = 100): bench_latency = auto_mock("vllm.benchmarks", "latency") -bench_multimodal_processor = auto_mock("vllm.benchmarks", "multimodal_processor") +bench_mm_processor = auto_mock("vllm.benchmarks", "mm_processor") bench_serve = auto_mock("vllm.benchmarks", "serve") bench_sweep_plot = auto_mock("vllm.benchmarks.sweep.plot", "SweepPlotArgs") bench_sweep_plot_pareto = auto_mock( @@ -223,8 +223,8 @@ def on_startup(command: Literal["build", "gh-deploy", "serve"], dirty: bool): "run-batch": create_parser(openai_run_batch.make_arg_parser), # Benchmark CLI "bench_latency": create_parser(bench_latency.add_cli_args), - "bench_multimodal_processor": create_parser( - bench_multimodal_processor.add_cli_args + "bench_mm_processor": create_parser( + bench_mm_processor.add_cli_args ), "bench_serve": create_parser(bench_serve.add_cli_args), "bench_sweep_plot": create_parser(bench_sweep_plot.add_cli_args), diff --git a/vllm/config/observability.py b/vllm/config/observability.py index eb4c1482f35cf..64bd9852bd161 100644 --- a/vllm/config/observability.py +++ b/vllm/config/observability.py @@ -67,7 +67,7 @@ class ObservabilityConfig: enable_mm_processor_stats: bool = False """Enable collection of timing statistics for multimodal processor operations. This is for internal use only (e.g., benchmarks) and is not exposed as a CLI - argument. Defaults to `False` (disabled).""" + argument.""" @cached_property def collect_model_forward_time(self) -> bool: diff --git a/vllm/engine/arg_utils.py b/vllm/engine/arg_utils.py index 143849c3bc970..1051e0f66f6a8 100644 --- a/vllm/engine/arg_utils.py +++ b/vllm/engine/arg_utils.py @@ -1041,9 +1041,6 @@ class EngineArgs: "--enable-layerwise-nvtx-tracing", **observability_kwargs["enable_layerwise_nvtx_tracing"], ) - # Note: --enable-mm-processor-stats is intentionally not exposed as a CLI - # argument. It can be set programmatically via parser.set_defaults() for - # internal use (e.g., benchmarks), but is not part of the public API. # Scheduler arguments scheduler_kwargs = get_kwargs(SchedulerConfig) diff --git a/vllm/entrypoints/cli/benchmark/mm_processor.py b/vllm/entrypoints/cli/benchmark/mm_processor.py index e769bd69dc140..8f1799af12e59 100644 --- a/vllm/entrypoints/cli/benchmark/mm_processor.py +++ b/vllm/entrypoints/cli/benchmark/mm_processor.py @@ -2,7 +2,7 @@ # SPDX-FileCopyrightText: Copyright contributors to the vLLM project import argparse -from vllm.benchmarks.multimodal_processor import add_cli_args, main +from vllm.benchmarks.mm_processor import add_cli_args, main from vllm.entrypoints.cli.benchmark.base import BenchmarkSubcommandBase