mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-03-19 22:07:42 +08:00
updated
Signed-off-by: Robert Shaw <robshaw@redhat.com>
This commit is contained in:
parent
f477b50493
commit
5ea4fa206d
@ -168,7 +168,8 @@ class PrometheusStatLogger(StatLoggerBase):
|
||||
model_name = vllm_config.model_config.served_model_name
|
||||
max_model_len = vllm_config.model_config.max_model_len
|
||||
|
||||
if len(self.engine_indexes) > 1:
|
||||
if (len(self.engine_indexes) > 1
|
||||
and vllm_config.speculative_config is not None):
|
||||
raise NotImplementedError("Prometheus metrics with Spec Decoding "
|
||||
"with >1 EngineCore per AsyncLLM is not "
|
||||
"supported yet.")
|
||||
@ -511,9 +512,9 @@ class PrometheusStatLogger(StatLoggerBase):
|
||||
self.counter_prefix_cache_hits[engine_idx].inc(
|
||||
scheduler_stats.prefix_cache_stats.hits)
|
||||
|
||||
# if scheduler_stats.spec_decoding_stats is not None:
|
||||
# self.spec_decoding_prom.observe(
|
||||
# scheduler_stats.spec_decoding_stats)
|
||||
if scheduler_stats.spec_decoding_stats is not None:
|
||||
self.spec_decoding_prom.observe(
|
||||
scheduler_stats.spec_decoding_stats)
|
||||
|
||||
if iteration_stats is None:
|
||||
return
|
||||
|
||||
Loading…
x
Reference in New Issue
Block a user