mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-06-03 03:50:05 +08:00
add missing arg
Signed-off-by: vllmellm <vllm.ellm@embeddedllm.com>
This commit is contained in:
parent
b13c4bb25c
commit
7794009661
@@ -22,6 +22,7 @@ def flashinfer_w8a8_scaled_mm(
     As: torch.Tensor,
     Bs: torch.Tensor,
     bias: torch.Tensor,
+    output_shape: list,
 ) -> torch.Tensor:
     return flashinfer_scaled_fp8_mm(
         A, B, out_dtype=out_dtype, scale_a=As, scale_b=Bs, bias=bias
Loading…
x
Reference in New Issue
Block a user