mirror of
https://github.com/vllm-project/vllm.git
synced 2025-10-20 14:53:52 +08:00
[BugFix] Fix DBO hang (#25625)
Signed-off-by: Lucas Wilkinson <lwilkins@redhat.com>
This commit is contained in:
@@ -366,7 +366,8 @@ class UBatchWrapper:
|
||||
cudagraph_runtime_mode=CUDAGraphMode.NONE)
|
||||
with self.sm_control:
|
||||
return self._capture_ubatches(ubatch_metadata, self.model)
|
||||
-elif num_tokens in self.cudagraphs:
|
||||
+elif num_tokens in self.cudagraphs \
|
||||
+and cudagraph_runtime_mode is CUDAGraphMode.FULL:
|
||||
cudagraph_metadata = self.cudagraphs[num_tokens]
|
||||
cudagraph_metadata.cudagraph.replay()
|
||||
return cudagraph_metadata.outputs
|
||||
|
Reference in New Issue
Block a user