mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-05-26 23:07:55 +08:00
[Quantization] enable compressed-tensors marlin support for turing (#31000)
Signed-off-by: Jinzhen Lin <jinzhen.ljz@antgroup.com>
This commit is contained in:
parent
2ac85a4544
commit
de08b8f61b
@@ -30,7 +30,7 @@ from .MPLinearKernel import MPLinearKernel, MPLinearLayerConfig
|
|||||||
class MarlinLinearKernel(MPLinearKernel):
|
class MarlinLinearKernel(MPLinearKernel):
|
||||||
@classmethod
|
@classmethod
|
||||||
def get_min_capability(cls) -> int:
|
def get_min_capability(cls) -> int:
|
||||||
return 80
|
return 75
|
||||||
|
|
||||||
@classmethod
|
@classmethod
|
||||||
def can_implement(cls, c: MPLinearLayerConfig) -> tuple[bool, str | None]:
|
def can_implement(cls, c: MPLinearLayerConfig) -> tuple[bool, str | None]:
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user