mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-06-04 22:35:45 +08:00
[V0][Metrics] Remove unimplemented vllm:tokens_total (#14134)
Signed-off-by: Mark McLoughlin <markmc@redhat.com>
This commit is contained in:
parent
91373a0d15
commit
c41d27156b
@@ -115,10 +115,6 @@ class Metrics:
|
|||||||
name="vllm:generation_tokens_total",
|
name="vllm:generation_tokens_total",
|
||||||
documentation="Number of generation tokens processed.",
|
documentation="Number of generation tokens processed.",
|
||||||
labelnames=labelnames)
|
labelnames=labelnames)
|
||||||
self.counter_tokens = self._counter_cls(
|
|
||||||
name="vllm:tokens_total",
|
|
||||||
documentation="Number of prefill plus generation tokens processed.",
|
|
||||||
labelnames=labelnames)
|
|
||||||
buckets = [1, 8, 16, 32, 64, 128, 256, 512, 1024, 2048, 4096, 8096]
|
buckets = [1, 8, 16, 32, 64, 128, 256, 512, 1024, 2048, 4096, 8096]
|
||||||
if not vllm_config.model_config.enforce_eager:
|
if not vllm_config.model_config.enforce_eager:
|
||||||
buckets = vllm_config.compilation_config.\
|
buckets = vllm_config.compilation_config.\
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user