Skip to content

Commit 100b3fd

Browse files
fix mtp
Signed-off-by: Lucas Wilkinson <lwilkins@redhat.com>
1 parent c3e2978 commit 100b3fd

File tree

1 file changed

+1
-1
lines changed

1 file changed

+1
-1
lines changed

vllm/config/compilation.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -917,7 +917,7 @@ def adjust_cudagraph_sizes_for_spec_decode(
917 | 917 |           self, uniform_decode_query_len: int, tensor_parallel_size: int
918 | 918 |       ):
919 | 919 |           multiple_of = uniform_decode_query_len
920 |     | -         if tensor_parallel_size > 1:
    | 920 | +         if tensor_parallel_size > 1 and self.pass_config.enable_sequence_parallelism:
921 | 921 |               multiple_of = max(uniform_decode_query_len, tensor_parallel_size)
922 | 922 |           if (
923 | 923 |               multiple_of % uniform_decode_query_len != 0

0 commit comments

Comments
 (0)