Skip to content

Commit db39576

Browse files
committed
minor refine
1 parent a96e720 commit db39576

File tree

1 file changed

+5
-5
lines changed

1 file changed

+5
-5
lines changed

vllm/config.py

Lines changed: 5 additions & 5 deletions
Original file line number | Diff line number | Diff line change
@@ -941,14 +941,17 @@ def _maybe_override_draft_max_model_len(
941941
@staticmethod
942942
def create_draft_parallel_config(
943943
target_parallel_config: ParallelConfig,
944-
speculative_tensor_parallel_size: int) -> ParallelConfig:
944+
speculative_tensor_parallel_size: Optional[int]) -> ParallelConfig:
945945
"""Create a parallel config for use by the draft worker.
946946
947947
This is mostly a copy of the target parallel config.
948948
"""
949+
950+
_speculative_tensor_parallel_size = speculative_tensor_parallel_size or target_parallel_config.tensor_parallel_size
951+
949952
draft_parallel_config = ParallelConfig(
950953
pipeline_parallel_size=target_parallel_config.pipeline_parallel_size,
951-
tensor_parallel_size=target_parallel_config.tensor_parallel_size,
954+
tensor_parallel_size=_speculative_tensor_parallel_size,
952955
distributed_executor_backend=target_parallel_config.
953956
distributed_executor_backend,
954957
max_parallel_loading_workers=target_parallel_config.
@@ -961,9 +964,6 @@ def create_draft_parallel_config(
961964
placement_group=target_parallel_config.placement_group,
962965
)
963966

964-
if speculative_tensor_parallel_size is not None:
965-
draft_parallel_config.tensor_parallel_size = speculative_tensor_parallel_size
966-
967967
return draft_parallel_config
968968

969969
def __init__(

0 commit comments

Comments
 (0)