[V1][Spec Decoding] Log accumulated metrics after system goes idle (#17913)

Signed-off-by: Mark McLoughlin <markmc@redhat.com>
2025-12-22 02:35:40 +08:00 · 2025-05-10 02:23:07 +01:00 · 2025-05-10 02:23:07 +01:00 · 7042cc96b0
commit 7042cc96b0
parent 0c0fdae84f
2 changed files with 3 additions and 3 deletions
--- a/vllm/v1/metrics/loggers.py
+++ b/vllm/v1/metrics/loggers.py
@@ -128,8 +128,6 @@ class LoggingStatLogger(StatLoggerBase):
            scheduler_stats.gpu_cache_usage * 100,
            self.prefix_caching_metrics.hit_rate * 100,
        )
        if scheduler_stats.spec_decoding_stats is not None:
        self.spec_decoding_logging.log(log_fn=log_fn)
    def log_engine_initialized(self):
--- a/vllm/v1/spec_decode/metrics.py
+++ b/vllm/v1/spec_decode/metrics.py
@@ -67,6 +67,8 @@ class SpecDecodingLogging:
            spec_decoding_stats.num_accepted_tokens_per_pos)
    def log(self, log_fn=logger.info):
        if not self.num_drafts:
            return
        num_drafts = np.sum(self.num_drafts)
        num_draft_tokens = np.sum(self.num_draft_tokens)
        num_accepted_tokens = np.sum(self.num_accepted_tokens)