mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-04-12 06:37:03 +08:00
fix
Signed-off-by: Bill Nell <bnell@redhat.com>
This commit is contained in:
parent
c169b05541
commit
cad6447664
@ -274,6 +274,7 @@ class FusedMoEMethodBase(QuantizeMethodBase):
|
||||
|
||||
handle = all2all_manager.get_handle(all_to_all_args)
|
||||
|
||||
logger.debug("PplxPrepareAndFinalize")
|
||||
prepare_finalize = PplxPrepareAndFinalize(
|
||||
handle,
|
||||
max_num_tokens=moe.max_num_tokens,
|
||||
|
||||
Loading…
x
Reference in New Issue
Block a user