diff --git a/vllm/v1/metrics/loggers.py b/vllm/v1/metrics/loggers.py index 21280b9c84cf2..cb36e7973650e 100644 --- a/vllm/v1/metrics/loggers.py +++ b/vllm/v1/metrics/loggers.py @@ -494,6 +494,7 @@ class PrometheusStatLogger(AggregateStatLoggerBase): gauge_kv_cache_usage = self._gauge_cls( name="vllm:kv_cache_usage_perc", documentation="KV-cache usage. 1 means 100 percent usage.", + multiprocess_mode="mostrecent", labelnames=labelnames, ) self.gauge_kv_cache_usage = make_per_engine(