[V1] Default MLA to V1 (#14921)

Signed-off-by: simon-mo <simon.mo@hey.com>
2026-03-17 13:07:11 +08:00 · 2025-03-17 06:54:40 -07:00 · 2025-03-17 06:54:40 -07:00 · 89fca671fb
commit 89fca671fb
parent d20b0c139c
1 changed files with 1 additions and 5 deletions
--- a/vllm/engine/arg_utils.py
+++ b/vllm/engine/arg_utils.py
@@ -1191,7 +1191,7 @@ class EngineArgs:
        NOTE: for autoselection of V0 vs V1 engine, we need to
        create the ModelConfig first, since ModelConfig's attrs
        (e.g. the model arch) are needed to make the decision.
-        
+
        This function set VLLM_USE_V1=X if VLLM_USE_V1 is
        unspecified by the user.

@@ -1576,10 +1576,6 @@ class EngineArgs:
        #############################################################
        # Experimental Features - allow users to opt in.

-        # MLA is is supported on V1, but off by default for now.
-        if model_config.use_mla and _warn_or_fallback("MLA"):
-            return False
-
        # LoRA is supported on V1, but off by default for now.
        if self.enable_lora and _warn_or_fallback("LORA"):
            return False