[Doc]: fix various typos in multiple files (#23179)

Signed-off-by: Didier Durand <durand.didier@gmail.com>
2025-12-21 14:55:45 +08:00 · 2025-08-22 19:38:46 +02:00 · 2025-08-22 19:38:46 +02:00 · 22cf679aad
commit 22cf679aad
parent b6d7d34fc6
7 changed files with 12 additions and 12 deletions
--- a/vllm/beam_search.py
+++ b/vllm/beam_search.py
@@ -18,7 +18,7 @@ class BeamSearchSequence:
    The text field is optional and will only be filled when the sequence is
    about to be returned to the user.
    """
-    # The tokens includes the prompt.
+    # The tokens include the prompt.
    tokens: list[int]
    logprobs: list[dict[int, Logprob]]
    lora_request: Optional[LoRARequest] = None
--- a/vllm/compilation/backends.py
+++ b/vllm/compilation/backends.py
@@ -484,7 +484,7 @@ class VllmBackend:
            factors = []
            # 0. factors come from the env, for example, The values of
-            # VLLM_PP_LAYER_PARTITION will affects the computation graph.
+            # VLLM_PP_LAYER_PARTITION will affect the computation graph.
            env_hash = envs.compute_hash()
            factors.append(env_hash)
--- a/vllm/engine/arg_utils.py
+++ b/vllm/engine/arg_utils.py
@@ -605,7 +605,7 @@ class EngineArgs:
            **guided_decoding_kwargs["disable_additional_properties"])
        guided_decoding_group.add_argument(
            "--reasoning-parser",
-            # This choices is a special case because it's not static
+            # This choice is a special case because it's not static
            choices=list(ReasoningParserManager.reasoning_parsers),
            **guided_decoding_kwargs["reasoning_backend"])
@@ -1047,7 +1047,7 @@ class EngineArgs:
            # details from the config directly
            # no user input required / expected
            if isinstance(hf_config, SpeculatorsConfig):
-                # We create one since we dont create one
+                # We create one since we don't create one
                self.speculative_config = {}
                self.speculative_config[
                    "num_speculative_tokens"] = hf_config.num_lookahead_tokens
@@ -1775,7 +1775,7 @@ class AsyncEngineArgs(EngineArgs):
    def add_cli_args(parser: FlexibleArgumentParser,
                     async_args_only: bool = False) -> FlexibleArgumentParser:
        # Initialize plugin to update the parser, for example, The plugin may
-        # adding a new kind of quantization method to --quantization argument or
+        # add a new kind of quantization method to --quantization argument or
        # a new device to --device argument.
        load_general_plugins()
        if not async_args_only:
--- a/vllm/engine/multiprocessing/client.py
+++ b/vllm/engine/multiprocessing/client.py
@@ -539,7 +539,7 @@ class MQLLMEngineClient(EngineClient):
        if request_id in self.output_queues:
            raise ValueError(f"Request {request_id} already exists")
-        # 1) Create output queue for this requests.
+        # 1) Create output queue for this request.
        queue: asyncio.Queue[Union[RequestOutput,
                                   BaseException]] = asyncio.Queue()
        self.output_queues[request_id] = queue
@@ -651,7 +651,7 @@ class MQLLMEngineClient(EngineClient):
        # Uses the same I/O as generate requests
        request = RPCLoadAdapterRequest(lora_request)
-        # Create output queue for this requests.
+        # Create output queue for this request.
        queue: asyncio.Queue[Union[None, BaseException]] = asyncio.Queue()
        self.output_queues[request.request_id] = queue
--- a/vllm/entrypoints/chat_utils.py
+++ b/vllm/entrypoints/chat_utils.py
@@ -1330,7 +1330,7 @@ def apply_mistral_chat_template(
    # mistral-common uses assert statements to stop processing of input
    # if input does not comply with the expected format.
    # We convert those assertion errors to ValueErrors so they can be
-    # are properly caught in the preprocessing_input step
+    # properly caught in the preprocessing_input step
    except (AssertionError, MistralCommonException) as e:
        raise ValueError(str(e)) from e
--- a/vllm/utils/__init__.py
+++ b/vllm/utils/__init__.py
@@ -2482,7 +2482,7 @@ class PlaceholderModule(_PlaceholderBase):
    A placeholder object to use when a module does not exist.
    This enables more informative errors when trying to access attributes
-    of a module that does not exists.
+    of a module that does not exist.
    """
    def __init__(self, name: str) -> None:
@@ -3109,7 +3109,7 @@ class LazyLoader(types.ModuleType):
    """
    LazyLoader module borrowed from Tensorflow
    https://github.com/tensorflow/tensorflow/blob/main/tensorflow/python/util/lazy_loader.py
-    with a addition of "module caching".
+    with an addition of "module caching".
    Lazily import a module, mainly to avoid pulling in large dependencies.
    Modules such as `xgrammar` might do additional side effects, so we
--- a/vllm/v1/structured_output/__init__.py
+++ b/vllm/v1/structured_output/__init__.py
@@ -267,7 +267,7 @@ class StructuredOutputManager:
            assert request.structured_output_request is not None
            assert request.structured_output_request.grammar is not None
        # by default, we should always advance
-        # for cases that doesn't uses thinking mode.
+        # for cases that don't use thinking mode.
        if self.reasoner is not None:
            structured_req = request.structured_output_request
@@ -276,7 +276,7 @@ class StructuredOutputManager:
            # Check if reasoning ends in *this* step
            if self.reasoner.is_reasoning_end(request.all_token_ids):
-                # Reasoning just ended, so we shouldn't advanced til
+                # Reasoning just ended, so we shouldn't advance til
                # next pass
                structured_req.reasoning_ended = True