2 files changed: 8 additions, 5 deletions.
Original file line number | Diff line number | Diff line change
@@ -2329,11 +2329,13 @@ class MemoryProfilingResult:
23292329
23302330 def __repr__ (self ) -> str :
23312331 return (f"Memory profiling takes { self .profile_time :.2f} seconds. "
2332- f"Weights memory: { (self .weights_memory / GiB_bytes ):.2f} GiB; "
2332+ f"Total non KV cache memory: "
2333+ f"{ (self .non_kv_cache_memory / GiB_bytes ):.2f} GiB; "
2334+ f"torch peak memory increase: "
2335+ f"{ (self .torch_peak_increase / GiB_bytes ):.2f} GiB; "
23332336 f"non-torch forward increase memory: "
23342337 f"{ (self .non_torch_increase / GiB_bytes ):.2f} GiB; "
2335- f"torch peak memory: "
2336- f"{ (self .torch_peak_increase / GiB_bytes ):.2f} GiB." )
2338+ f"weights memory: { (self .weights_memory / GiB_bytes ):.2f} GiB." )
23372339
23382340
23392341@contextlib .contextmanager
Original file line number | Diff line number | Diff line change
@@ -218,8 +218,9 @@ def determine_available_memory(self) -> int:
218218
219219 logger .debug (
220220 "Initial free memory: %.2f GiB, free memory: %.2f GiB, "
221- "total GPU memory: %.2f GiB" , GiB (self .init_snapshot .free_memory ),
222- GiB (free_gpu_memory ), GiB (self .init_snapshot .total_memory ))
221+ "requested GPU memory: %.2f GiB" ,
222+ GiB (self .init_snapshot .free_memory ), GiB (free_gpu_memory ),
223+ GiB (self .requested_memory ))
223224 logger .debug (profile_result )
224225 logger .info ("Available KV cache memory: %.2f GiB" ,
225226 GiB (available_kv_cache_memory ))
You can’t perform that action at this time.
0 commit comments