mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-04-02 01:27:03 +08:00
updated
Signed-off-by: Robert Shaw <robshaw@redhat.com>
This commit is contained in:
parent
d9291f998e
commit
876c864d3c
@@ -168,8 +168,17 @@ class PrometheusStatLogger(StatLoggerBase):
|
||||
model_name = vllm_config.model_config.served_model_name
|
||||
max_model_len = vllm_config.model_config.max_model_len
|
||||
|
||||
# self.spec_decoding_prom = self._spec_decoding_cls(
|
||||
# vllm_config.speculative_config, labelnames, labelvalues)
|
||||
if len(self.engine_indexes) > 1:
|
||||
raise NotImplementedError("Prometheus metrics with Spec Decoding "
|
||||
"with >1 EngineCore per AsyncLLM is not "
|
||||
"supported yet.")
|
||||
spec_decode_labelvalues = [
|
||||
vllm_config.model_config.served_model_name,
|
||||
str(self.engine_indexes[0])
|
||||
]
|
||||
self.spec_decoding_prom = self._spec_decoding_cls(
|
||||
vllm_config.speculative_config, labelnames,
|
||||
spec_decode_labelvalues)
|
||||
|
||||
#
|
||||
# Scheduler state
|
||||
|
||||
Loading…
x
Reference in New Issue
Block a user