Signed-off-by: Robert Shaw <robshaw@redhat.com>
This commit is contained in:
Robert Shaw 2025-07-20 17:17:15 +00:00
parent f477b50493
commit 5ea4fa206d

View File

@ -168,7 +168,8 @@ class PrometheusStatLogger(StatLoggerBase):
model_name = vllm_config.model_config.served_model_name model_name = vllm_config.model_config.served_model_name
max_model_len = vllm_config.model_config.max_model_len max_model_len = vllm_config.model_config.max_model_len
if len(self.engine_indexes) > 1: if (len(self.engine_indexes) > 1
and vllm_config.speculative_config is not None):
raise NotImplementedError("Prometheus metrics with Spec Decoding " raise NotImplementedError("Prometheus metrics with Spec Decoding "
"with >1 EngineCore per AsyncLLM is not " "with >1 EngineCore per AsyncLLM is not "
"supported yet.") "supported yet.")
@ -511,9 +512,9 @@ class PrometheusStatLogger(StatLoggerBase):
self.counter_prefix_cache_hits[engine_idx].inc( self.counter_prefix_cache_hits[engine_idx].inc(
scheduler_stats.prefix_cache_stats.hits) scheduler_stats.prefix_cache_stats.hits)
# if scheduler_stats.spec_decoding_stats is not None: if scheduler_stats.spec_decoding_stats is not None:
# self.spec_decoding_prom.observe( self.spec_decoding_prom.observe(
# scheduler_stats.spec_decoding_stats) scheduler_stats.spec_decoding_stats)
if iteration_stats is None: if iteration_stats is None:
return return