diff --git a/vllm/platforms/rocm.py b/vllm/platforms/rocm.py
index 6e75e8659b727..c4bc763719459 100644
--- a/vllm/platforms/rocm.py
+++ b/vllm/platforms/rocm.py
@@ -230,4 +230,8 @@ def get_current_memory_usage(cls,
                                  device: Optional[torch.types.Device] = None
                                  ) -> float:
         torch.cuda.reset_peak_memory_stats(device)
-        return torch.cuda.max_memory_allocated(device)
+        # Report device-wide usage (total - free) instead of the allocator's
+        # peak. Pass `device` so the requested device is honoured, and query
+        # once so both values come from the same snapshot.
+        free_bytes, total_bytes = torch.cuda.mem_get_info(device)
+        return total_bytes - free_bytes