Skip to content

Commit c745540

Browse files
fix
Signed-off-by: Lucas Wilkinson <lwilkins@redhat.com>
1 parent c79cdc4 commit c745540

File tree

1 file changed

+4
-2
lines changed

1 file changed

+4
-2
lines changed

vllm/v1/worker/gpu_model_runner.py

Lines changed: 4 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -3047,8 +3047,10 @@ def _dummy_run(
3047 3047                   BatchDescriptor(num_tokens=num_tokens,
3048 3048                                   uniform_decode=uniform_decode))
3049 3049           if cudagraph_runtime_mode is not None:
3050      -             # sanity check
3051      -             assert cudagraph_runtime_mode == _cg_mode, (
     3050 +             # we allow forcing NONE when the dispatcher disagrees to support
     3051 +             # warm ups for cudagraph capture
     3052 +             assert cudagraph_runtime_mode == CUDAGraphMode.NONE or \
     3053 +                 cudagraph_runtime_mode == _cg_mode, (
3052 3054                   f"Cudagraph runtime mode mismatch at dummy_run. "
3053 3055                   f"Expected {_cg_mode}, but got {cudagraph_runtime_mode}.")
3054 3056           else:

0 commit comments

Comments (0)