mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2025-12-10 22:46:01 +08:00
[Misc] Improve memory profiling debug message (#21429)
Signed-off-by: Ye (Charlotte) Qi <yeq@meta.com>
This commit is contained in:
parent
c215f5c877
commit
a40a8506df
@ -246,11 +246,21 @@ class Worker(WorkerBase):
|
|||||||
available_kv_cache_memory = self.requested_memory \
|
available_kv_cache_memory = self.requested_memory \
|
||||||
- profile_result.non_kv_cache_memory
|
- profile_result.non_kv_cache_memory
|
||||||
|
|
||||||
|
unrequested_memory = self.init_snapshot.free_memory \
|
||||||
|
- self.requested_memory
|
||||||
logger.debug(
|
logger.debug(
|
||||||
"Initial free memory: %.2f GiB, free memory: %.2f GiB, "
|
"Initial free memory: %.2f GiB; "
|
||||||
"requested GPU memory: %.2f GiB",
|
"Requested memory: %.2f (util), %.2f GiB",
|
||||||
GiB(self.init_snapshot.free_memory), GiB(free_gpu_memory),
|
GiB(self.init_snapshot.free_memory),
|
||||||
GiB(self.requested_memory))
|
self.cache_config.gpu_memory_utilization,
|
||||||
|
GiB(self.requested_memory),
|
||||||
|
)
|
||||||
|
logger.debug(
|
||||||
|
"Free memory after profiling: %.2f GiB (total), "
|
||||||
|
"%.2f GiB (within requested)",
|
||||||
|
GiB(free_gpu_memory),
|
||||||
|
GiB(free_gpu_memory - unrequested_memory),
|
||||||
|
)
|
||||||
logger.debug(profile_result)
|
logger.debug(profile_result)
|
||||||
logger.info("Available KV cache memory: %.2f GiB",
|
logger.info("Available KV cache memory: %.2f GiB",
|
||||||
GiB(available_kv_cache_memory))
|
GiB(available_kv_cache_memory))
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user