Fix gpt oss weight loading with EP + bf16 (#28765)

Signed-off-by: ashors1 <ashors@nvidia.com>
2026-03-16 14:07:13 +08:00 · 2025-11-16 05:12:45 -08:00 · 2025-11-16 05:12:45 -08:00 · 8d259fad6c
commit 8d259fad6c
parent 3bc1175798
1 changed file with 1 addition and 1 deletion
--- a/vllm/model_executor/models/gpt_oss.py
+++ b/vllm/model_executor/models/gpt_oss.py
@@ -494,8 +494,8 @@ class GptOssModel(nn.Module):

    def _load_weights_other(
        self,
-        ep_rank_start: int,
        ep_rank_end: int,
+        ep_rank_start: int,
        heads_per_rank: int,
        head_start: int,
        weights: Iterable[tuple[str, torch.Tensor]],