diff --git a/vllm/model_executor/layers/fused_moe/layer.py b/vllm/model_executor/layers/fused_moe/layer.py index e95eeba5e411a..9770f02e192d2 100644 --- a/vllm/model_executor/layers/fused_moe/layer.py +++ b/vllm/model_executor/layers/fused_moe/layer.py @@ -274,6 +274,7 @@ class FusedMoEMethodBase(QuantizeMethodBase): handle = all2all_manager.get_handle(all_to_all_args) + logger.debug("PplxPrepareAndFinalize") prepare_finalize = PplxPrepareAndFinalize( handle, max_num_tokens=moe.max_num_tokens,