[V0][Metrics] Remove unimplemented vllm:tokens_total (#14134)

Signed-off-by: Mark McLoughlin <markmc@redhat.com>
This commit is contained in:
Mark McLoughlin 2025-03-03 17:50:22 +00:00 committed by GitHub
parent 91373a0d15
commit c41d27156b
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194

View File

@@ -115,10 +115,6 @@ class Metrics:
name="vllm:generation_tokens_total",
documentation="Number of generation tokens processed.",
labelnames=labelnames)
self.counter_tokens = self._counter_cls(
name="vllm:tokens_total",
documentation="Number of prefill plus generation tokens processed.",
labelnames=labelnames)
buckets = [1, 8, 16, 32, 64, 128, 256, 512, 1024, 2048, 4096, 8096]
if not vllm_config.model_config.enforce_eager:
buckets = vllm_config.compilation_config.\