mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-01-09 10:51:51 +08:00
[BugFix] Fix DBO hang (#25625)
Signed-off-by: Lucas Wilkinson <lwilkins@redhat.com>
Signed-off-by: yewentao256 <zhyanwentao@126.com>
This commit is contained in:
parent
0cee734ab4
commit
fe6357a780
@@ -366,7 +366,8 @@ class UBatchWrapper:
|
||||
cudagraph_runtime_mode=CUDAGraphMode.NONE)
|
||||
with self.sm_control:
|
||||
return self._capture_ubatches(ubatch_metadata, self.model)
|
||||
- elif num_tokens in self.cudagraphs:
|
||||
+ elif num_tokens in self.cudagraphs \
|
||||
+ and cudagraph_runtime_mode is CUDAGraphMode.FULL:
|
||||
cudagraph_metadata = self.cudagraphs[num_tokens]
|
||||
cudagraph_metadata.cudagraph.replay()
|
||||
return cudagraph_metadata.outputs
|
||||
|
||||
Loading…
x
Reference in New Issue
Block a user