mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-04-06 14:07:06 +08:00
add missing arg
Signed-off-by: vllmellm <vllm.ellm@embeddedllm.com>
This commit is contained in:
parent
b13c4bb25c
commit
7794009661
@@ -22,6 +22,7 @@ def flashinfer_w8a8_scaled_mm(
|
||||
As: torch.Tensor,
|
||||
Bs: torch.Tensor,
|
||||
bias: torch.Tensor,
|
||||
output_shape: list,
|
||||
) -> torch.Tensor:
|
||||
return flashinfer_scaled_fp8_mm(
|
||||
A, B, out_dtype=out_dtype, scale_a=As, scale_b=Bs, bias=bias
|
||||
|
||||
Loading…
x
Reference in New Issue
Block a user