From c41d27156b7c9123bd38387afca639631dfc2ed0 Mon Sep 17 00:00:00 2001
From: Mark McLoughlin
Date: Mon, 3 Mar 2025 17:50:22 +0000
Subject: [PATCH] [V0][Metrics] Remove unimplemented `vllm:tokens_total` (#14134)

Signed-off-by: Mark McLoughlin
---
 vllm/engine/metrics.py | 4 ----
 1 file changed, 4 deletions(-)

diff --git a/vllm/engine/metrics.py b/vllm/engine/metrics.py
index cb3ca7a118819..9379ba6146316 100644
--- a/vllm/engine/metrics.py
+++ b/vllm/engine/metrics.py
@@ -115,10 +115,6 @@ class Metrics:
             name="vllm:generation_tokens_total",
             documentation="Number of generation tokens processed.",
             labelnames=labelnames)
-        self.counter_tokens = self._counter_cls(
-            name="vllm:tokens_total",
-            documentation="Number of prefill plus generation tokens processed.",
-            labelnames=labelnames)
         buckets = [1, 8, 16, 32, 64, 128, 256, 512, 1024, 2048, 4096, 8096]
         if not vllm_config.model_config.enforce_eager:
             buckets = vllm_config.compilation_config.\