Skip to content

Commit eb6cbdd

Browse files
committed
minor improvement
Signed-off-by: Ye (Charlotte) Qi <[email protected]>
1 parent 83247be commit eb6cbdd

File tree

2 files changed

+8
-5
lines changed

2 files changed

+8
-5
lines changed

vllm/utils.py

Lines changed: 5 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -2329,11 +2329,13 @@ class MemoryProfilingResult:
2329 2329
2330 2330       def __repr__(self) -> str:
2331 2331           return (f"Memory profiling takes {self.profile_time:.2f} seconds. "
2332      -                 f"Weights memory: {(self.weights_memory / GiB_bytes):.2f}GiB; "
     2332 +                 f"Total non KV cache memory: "
     2333 +                 f"{(self.non_kv_cache_memory / GiB_bytes):.2f}GiB; "
     2334 +                 f"torch peak memory increase: "
     2335 +                 f"{(self.torch_peak_increase / GiB_bytes):.2f}GiB; "
2333 2336                   f"non-torch forward increase memory: "
2334 2337                   f"{(self.non_torch_increase / GiB_bytes):.2f}GiB; "
2335      -                 f"torch peak memory: "
2336      -                 f"{(self.torch_peak_increase / GiB_bytes):.2f}GiB.")
     2338 +                 f"weights memory: {(self.weights_memory / GiB_bytes):.2f}GiB.")
2337 2339
2338 2340
2339 2341   @contextlib.contextmanager

vllm/v1/worker/gpu_worker.py

Lines changed: 3 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -218,8 +218,9 @@ def determine_available_memory(self) -> int:
218 218
219 219           logger.debug(
220 220               "Initial free memory: %.2f GiB, free memory: %.2f GiB, "
221     -             "total GPU memory: %.2f GiB", GiB(self.init_snapshot.free_memory),
222     -             GiB(free_gpu_memory), GiB(self.init_snapshot.total_memory))
    221 +             "requested GPU memory: %.2f GiB",
    222 +             GiB(self.init_snapshot.free_memory), GiB(free_gpu_memory),
    223 +             GiB(self.requested_memory))
223 224           logger.debug(profile_result)
224 225           logger.info("Available KV cache memory: %.2f GiB",
225 226                       GiB(available_kv_cache_memory))

0 commit comments

Comments
 (0)