mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2025-12-14 17:26:02 +08:00
[Qwen] Remove cuda hard-code in qwen3 next (#25243)
Signed-off-by: Icey <1790571317@qq.com>
This commit is contained in:
parent
5089fd749c
commit
838d7116ba
@@ -306,7 +306,7 @@ class Qwen3NextGatedDeltaNet(nn.Module, MambaBase):
|
|||||||
eps=self.layer_norm_epsilon,
|
eps=self.layer_norm_epsilon,
|
||||||
group_size=None,
|
group_size=None,
|
||||||
norm_before_gate=True,
|
norm_before_gate=True,
|
||||||
device=torch.cuda.current_device(),
|
device=current_platform.current_device(),
|
||||||
dtype=config.torch_dtype,
|
dtype=config.torch_dtype,
|
||||||
)
|
)
|
||||||
|
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user