diff --git a/vllm/executor/multiproc_gpu_executor.py b/vllm/executor/multiproc_gpu_executor.py index 7b98fbea5cd0a..02b2499be4656 100644 --- a/vllm/executor/multiproc_gpu_executor.py +++ b/vllm/executor/multiproc_gpu_executor.py @@ -126,7 +126,7 @@ def shutdown(signum, frame): max_parallel_loading_workers) def _check_executor_parameters(self): - world_size = self.parallel_config.tensor_parallel_size + world_size = self.parallel_config.world_size tensor_parallel_size = self.parallel_config.tensor_parallel_size # Set CUDA_VISIBLE_DEVICES for the driver, inherited by workers