mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-01-25 18:34:28 +08:00
Fix AWQ MoE marlin check issue in marlin_utils.py for AMD backend (#30102)
Signed-off-by: yuttian1 <yuttian@amd.com>
This commit is contained in:
parent
62079d8600
commit
c4d62618ca
@@ -179,6 +179,8 @@ def check_marlin_supports_shape(
|
||||
|
||||
|
||||
def check_marlin_supports_layer(layer: LinearBase, group_size: int) -> bool:
|
||||
if current_platform.is_rocm():
|
||||
return False
|
||||
output_size_per_partition = (
|
||||
getattr(layer, "output_size_per_partition", None) or layer.output_size
|
||||
)
|
||||
@@ -195,6 +197,8 @@ def check_marlin_supports_layer(layer: LinearBase, group_size: int) -> bool:
|
||||
|
||||
|
||||
def check_moe_marlin_supports_layer(layer: LinearBase, group_size: int) -> bool:
|
||||
if current_platform.is_rocm():
|
||||
return False
|
||||
hidden_size = layer.hidden_size
|
||||
intermediate_size_per_partition = layer.intermediate_size_per_partition
|
||||
# apply_router_weight_on_input is not supported for moe marlin
|
||||
|
||||
Loading…
x
Reference in New Issue
Block a user