Skip to content

Commit 0bfed0f

Browse files
ji-huazhong authored and sumitd2 committed
[MISC] rename CudaMemoryProfiler to DeviceMemoryProfiler (vllm-project#8703)
Signed-off-by: Sumit Dubey <sumit.dubey2@ibm.com>
1 parent bb10904 commit 0bfed0f

File tree

3 files changed

+5
-5
lines changed

3 files changed

+5
-5
lines changed

vllm/utils.py

+1 -1
Original file line number | Diff line number | Diff line change
@@ -757,7 +757,7 @@ def is_pin_memory_available() -> bool:
757757
return True
758758

759759

760-
class CudaMemoryProfiler:
760+
class DeviceMemoryProfiler:
761761

762762
def __init__(self, device: Optional[torch.types.Device] = None):
763763
self.device = device

vllm/worker/model_runner.py

+2 -2
Original file line number | Diff line number | Diff line change
@@ -45,7 +45,7 @@
4545
LRUCacheWorkerPromptAdapterManager)
4646
from vllm.sampling_params import SamplingParams
4747
from vllm.sequence import IntermediateTensors, SequenceGroupMetadata
48-
from vllm.utils import (CudaMemoryProfiler, PyObjectCache, async_tensor_h2d,
48+
from vllm.utils import (DeviceMemoryProfiler, PyObjectCache, async_tensor_h2d,
4949
flatten_2d_lists, is_hip, is_pin_memory_available,
5050
supports_dynamo)
5151
from vllm.worker.model_runner_base import (
@@ -1012,7 +1012,7 @@ def __init__(
10121012

10131013
def load_model(self) -> None:
10141014
logger.info("Starting to load model %s...", self.model_config.model)
1015-
with CudaMemoryProfiler() as m:
1015+
with DeviceMemoryProfiler() as m:
10161016
self.model = get_model(model_config=self.model_config,
10171017
device_config=self.device_config,
10181018
load_config=self.load_config,

vllm/worker/xpu_model_runner.py

+2 -2
Original file line number | Diff line number | Diff line change
@@ -21,7 +21,7 @@
2121
MultiModalInputs, MultiModalRegistry)
2222
from vllm.sampling_params import SamplingParams
2323
from vllm.sequence import IntermediateTensors, SequenceGroupMetadata
24-
from vllm.utils import CudaMemoryProfiler, make_tensor_with_pad
24+
from vllm.utils import DeviceMemoryProfiler, make_tensor_with_pad
2525
from vllm.worker.model_runner import AttentionMetadata, SamplingMetadata
2626
from vllm.worker.model_runner_base import (
2727
ModelRunnerBase, ModelRunnerInputBase, ModelRunnerInputBuilderBase,
@@ -391,7 +391,7 @@ def __init__(
391391
self.model: nn.Module # Set after init_Model
392392

393393
def load_model(self) -> None:
394-
with CudaMemoryProfiler() as m:
394+
with DeviceMemoryProfiler() as m:
395395
self.model = get_model(
396396
model_config=self.model_config,
397397
device_config=self.device_config,

0 commit comments

Comments
 (0)