mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2025-12-25 10:36:32 +08:00
[Bugfix] Restrict Machete to only run on Hopper (#20830)
Signed-off-by: mgoin <mgoin64@gmail.com>
This commit is contained in:
parent
a86754a12b
commit
6e2c176e1f
@@ -32,6 +32,9 @@ class MacheteLinearKernel(MPLinearKernel):
|
||||
if not current_platform.is_cuda():
|
||||
return False, "Machete only supported on CUDA"
|
||||
|
||||
if not current_platform.is_device_capability(90):
|
||||
return False, "Machete requires compute capability of 90 (Hopper)"
|
||||
|
||||
if c.has_g_idx and\
|
||||
c.partition_weight_shape[0] != c.full_weight_shape[0]:
|
||||
return False, "Act reordering currently not supported by Machete, "\
|
||||
|
||||
Loading…
x
Reference in New Issue
Block a user