mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-01-08 21:56:29 +08:00
[Misc] DeepEPHighThroughtput - Enable Inductor pass (#21311)
Signed-off-by: Varun Sundar Rabindranath <vsundarr@redhat.com> Co-authored-by: Varun Sundar Rabindranath <vsundarr@redhat.com>
This commit is contained in:
parent
c17231e827
commit
8425f785ad
@ -182,9 +182,6 @@ class CudaPlatformBase(Platform):
|
||||
compilation_config.use_cudagraph = False
|
||||
if model_config is not None:
|
||||
model_config.enforce_eager = True
|
||||
# TODO (varun): Turning this ON gives incorrect results for the
|
||||
# Deepseek-V2-lite model.
|
||||
vllm_config.compilation_config.use_inductor = False
|
||||
|
||||
@classmethod
|
||||
def get_current_memory_usage(cls,
|
||||
|
||||
Loading…
x
Reference in New Issue
Block a user