mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-01-28 12:07:14 +08:00
[Bugfix][CI/CD][CPU] Fix CPU CI tests (#20383)
Signed-off-by: jiang1.li <jiang1.li@intel.com>
This commit is contained in:
parent
b616f6a53d
commit
0ec3779df7
@ -201,12 +201,13 @@ def apply_w8a8_block_fp8_linear_fake(
|
||||
return torch.empty(output_shape, dtype=input.dtype, device=input.device)
|
||||
|
||||
|
||||
direct_register_custom_op(
|
||||
op_name="apply_w8a8_block_fp8_linear",
|
||||
op_func=apply_w8a8_block_fp8_linear,
|
||||
mutates_args=[],
|
||||
fake_impl=apply_w8a8_block_fp8_linear_fake,
|
||||
)
|
||||
if not current_platform.is_cpu():
|
||||
direct_register_custom_op(
|
||||
op_name="apply_w8a8_block_fp8_linear",
|
||||
op_func=apply_w8a8_block_fp8_linear,
|
||||
mutates_args=[],
|
||||
fake_impl=apply_w8a8_block_fp8_linear_fake,
|
||||
)
|
||||
|
||||
|
||||
def input_to_float8(
|
||||
|
||||
Loading…
x
Reference in New Issue
Block a user