mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-05-29 05:27:04 +08:00
Fix AWQ MoE marlin check issue in marlin_utils.py for AMD backend (#30102)
Signed-off-by: yuttian1 <yuttian@amd.com>
This commit is contained in:
parent
62079d8600
commit
c4d62618ca
@@ -179,6 +179,8 @@ def check_marlin_supports_shape(
|
|||||||
|
|
||||||
|
|
||||||
def check_marlin_supports_layer(layer: LinearBase, group_size: int) -> bool:
|
def check_marlin_supports_layer(layer: LinearBase, group_size: int) -> bool:
|
||||||
|
if current_platform.is_rocm():
|
||||||
|
return False
|
||||||
output_size_per_partition = (
|
output_size_per_partition = (
|
||||||
getattr(layer, "output_size_per_partition", None) or layer.output_size
|
getattr(layer, "output_size_per_partition", None) or layer.output_size
|
||||||
)
|
)
|
||||||
@@ -195,6 +197,8 @@ def check_marlin_supports_layer(layer: LinearBase, group_size: int) -> bool:
|
|||||||
|
|
||||||
|
|
||||||
def check_moe_marlin_supports_layer(layer: LinearBase, group_size: int) -> bool:
|
def check_moe_marlin_supports_layer(layer: LinearBase, group_size: int) -> bool:
|
||||||
|
if current_platform.is_rocm():
|
||||||
|
return False
|
||||||
hidden_size = layer.hidden_size
|
hidden_size = layer.hidden_size
|
||||||
intermediate_size_per_partition = layer.intermediate_size_per_partition
|
intermediate_size_per_partition = layer.intermediate_size_per_partition
|
||||||
# apply_router_weight_on_input is not supported for moe marlin
|
# apply_router_weight_on_input is not supported for moe marlin
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user