|
13 | 13 | from vllm.distributed.device_communicators.pynccl_allocator import ( |
14 | 14 | is_symmetric_memory_enabled, |
15 | 15 | ) |
| 16 | +from vllm.distributed.parallel_state import is_global_first_rank |
16 | 17 | from vllm.logger import init_logger |
17 | 18 | from vllm.platforms import current_platform |
18 | 19 |
|
@@ -95,35 +96,35 @@ def __init__( |
95 | 96 | from .all2all import NaiveAll2AllManager |
96 | 97 |
|
97 | 98 | self.all2all_manager = NaiveAll2AllManager(self.cpu_group) |
98 | | - logger.info("Using naive all2all manager.") |
99 | 99 | elif all2all_backend == "allgather_reducescatter": |
100 | 100 | from .all2all import AgRsAll2AllManager |
101 | 101 |
|
102 | 102 | self.all2all_manager = AgRsAll2AllManager(self.cpu_group) |
103 | | - logger.info("Using AllGather-ReduceScatter all2all manager.") |
104 | 103 | elif all2all_backend == "pplx": |
105 | 104 | from .all2all import PPLXAll2AllManager |
106 | 105 |
|
107 | 106 | self.all2all_manager = PPLXAll2AllManager(self.cpu_group) |
108 | | - logger.info("Using PPLX all2all manager.") |
109 | 107 | elif all2all_backend == "deepep_high_throughput": |
110 | 108 | from .all2all import DeepEPHTAll2AllManager |
111 | 109 |
|
112 | 110 | self.all2all_manager = DeepEPHTAll2AllManager(self.cpu_group) |
113 | | - logger.info("Using DeepEP High-Throughput all2all manager.") |
114 | 111 | elif all2all_backend == "deepep_low_latency": |
115 | 112 | from .all2all import DeepEPLLAll2AllManager |
116 | 113 |
|
117 | 114 | self.all2all_manager = DeepEPLLAll2AllManager(self.cpu_group) |
118 | | - logger.info("Using DeepEP Low-Latency all2all manager.") |
119 | 115 | elif all2all_backend == "flashinfer_all2allv": |
120 | 116 | from .all2all import FlashInferAllToAllManager |
121 | 117 |
|
122 | 118 | self.all2all_manager = FlashInferAllToAllManager(self.cpu_group) |
123 | | - logger.info("Using Flashinfer all2allv manager.") |
124 | 119 | else: |
125 | 120 | raise ValueError(f"Unknown all2all backend: {all2all_backend}") |
126 | 121 |
|
| 122 | + if is_global_first_rank(): |
| 123 | + logger.info( |
| 124 | + "Using %s all2all manager.", |
| 125 | + self.all2all_manager.__class__.__name__, |
| 126 | + ) |
| 127 | + |
127 | 128 | def all_reduce(self, input_): |
128 | 129 | # since currently we perform copy input -> symm_input -> out-of-place AR |
129 | 130 | # return symm_output, we don't need to check if input is symmetric |
|
0 commit comments