[model] make llama4 compatible with pure dense layers (#17315)

Signed-off-by: Lucia Fang <fanglu@fb.com>
2025-12-10 09:01:40 +08:00 · 2025-04-28 19:22:22 -07:00 · 2025-04-28 19:22:22 -07:00 · b4ac4fa04d
commit b4ac4fa04d
parent e136000595
1 changed file with 2 additions and 2 deletions
--- a/vllm/model_executor/models/llama4.py
+++ b/vllm/model_executor/models/llama4.py
@@ -273,8 +273,8 @@ class Llama4DecoderLayer(nn.Module):
            cache_config=cache_config,
            prefix=f"{prefix}.self_attn",
        )
-        is_moe_layer = (self.layer_idx +
+        is_moe_layer = config.interleave_moe_layer_step > 0 and (
-                        1) % config.interleave_moe_layer_step == 0
+            self.layer_idx + 1) % config.interleave_moe_layer_step == 0
        if is_moe_layer:
            self.feed_forward = Llama4MoE(
                config=config,