From bde9e2272a28342d30fe9c4de4c1c9633ff153d8 Mon Sep 17 00:00:00 2001
From: Tao He
Date: Fri, 17 Oct 2025 11:37:52 +0800
Subject: [PATCH] [Bugfix][Qwen] fixes the weights dtype in qwen3_next: it is actually a bfloat16 (#27030)

Signed-off-by: Tao He
---
 vllm/model_executor/models/qwen3_next.py | 1 -
 1 file changed, 1 deletion(-)

diff --git a/vllm/model_executor/models/qwen3_next.py b/vllm/model_executor/models/qwen3_next.py
index 27e7a3ead45d0..f891a4961dd70 100644
--- a/vllm/model_executor/models/qwen3_next.py
+++ b/vllm/model_executor/models/qwen3_next.py
@@ -325,7 +325,6 @@ class Qwen3NextGatedDeltaNet(nn.Module, MambaBase):
         self.A_log = nn.Parameter(
             torch.empty(
                 divide(self.num_v_heads, self.tp_size),
-                dtype=torch.float32,
             )
         )
 