diff --git a/vllm/distributed/device_communicators/custom_all_reduce_utils.py b/vllm/distributed/device_communicators/custom_all_reduce_utils.py index 24ef3cb45b19d..4b89a23dfc463 100644 --- a/vllm/distributed/device_communicators/custom_all_reduce_utils.py +++ b/vllm/distributed/device_communicators/custom_all_reduce_utils.py @@ -166,7 +166,7 @@ def gpu_p2p_access_check(i: int, j: int) -> bool: and (not os.path.exists(path))): # only the local master process (with local_rank == 0) can # enter this block to calculate the cache - logger.info("generating GPU P2P access cache for in %s", path) + logger.info("generating GPU P2P access cache in %s", path) cache = {} for _i in range(num_dev): for _j in range(num_dev):