mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-06-02 09:37:53 +08:00
remove modular kernel
Signed-off-by: Sage Moore <sage@neuralmagic.com>
This commit is contained in:
parent
6645882e95
commit
d6eca0c130
@ -3,7 +3,6 @@ from abc import ABC, abstractmethod
|
|||||||
from typing import Optional
|
from typing import Optional
|
||||||
|
|
||||||
import torch
|
import torch
|
||||||
from vllm.v1.worker.ubatching import get_current_ubatch_context, dump_ubatching_state
|
|
||||||
|
|
||||||
#
|
#
|
||||||
# This file defines a set of base classes used to make MoE kernels more modular.
|
# This file defines a set of base classes used to make MoE kernels more modular.
|
||||||
@ -359,9 +358,6 @@ class FusedMoEModularKernel(torch.nn.Module):
|
|||||||
expert_num_tokens=expert_num_tokens,
|
expert_num_tokens=expert_num_tokens,
|
||||||
)
|
)
|
||||||
|
|
||||||
# if (ubatch_ctx := get_current_ubatch_context()) is not None:
|
|
||||||
# print("in modular moe3, ubatch:", ubatch_ctx.id, self.fused_experts)
|
|
||||||
|
|
||||||
self.prepare_finalize.finalize(output, fused_out, topk_weights,
|
self.prepare_finalize.finalize(output, fused_out, topk_weights,
|
||||||
topk_ids, apply_router_weight_on_input)
|
topk_ids, apply_router_weight_on_input)
|
||||||
|
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user