mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2025-12-17 06:15:01 +08:00
[BugFix] Fix --disable-log-stats in V1 server mode (#17600)
Signed-off-by: Nick Hill <nhill@redhat.com>
This commit is contained in:
parent
66ab3b13c9
commit
3d13ca0e24
@@ -120,6 +120,7 @@ class AsyncLLM(EngineClient):
|
||||
executor_class=executor_class,
|
||||
log_stats=self.log_stats,
|
||||
)
|
||||
if self.stat_loggers:
|
||||
for stat_logger in self.stat_loggers[0]:
|
||||
stat_logger.log_engine_initialized()
|
||||
self.output_handler: Optional[asyncio.Task] = None
|
||||
|
||||
@@ -442,9 +442,10 @@ class MPClient(EngineCoreClient):
|
||||
logger.info("Core engine process %d ready.", eng_id)
|
||||
identities.discard(eng_id)
|
||||
# Setup KV cache config with initialization state from
|
||||
# engine core process.
|
||||
self.vllm_config.cache_config.num_gpu_blocks = message_dict[
|
||||
'num_gpu_blocks']
|
||||
# engine core process. Sum values from all engines in DP case.
|
||||
num_gpu_blocks = self.vllm_config.cache_config.num_gpu_blocks or 0
|
||||
num_gpu_blocks += message_dict['num_gpu_blocks']
|
||||
self.vllm_config.cache_config.num_gpu_blocks = num_gpu_blocks
|
||||
|
||||
def _init_core_engines(
|
||||
self,
|
||||
|
||||
Loading…
x
Reference in New Issue
Block a user