mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2025-12-24 17:25:51 +08:00
[V1][Minor] Enhance SpecDecoding Metrics Log in V1 (#15902)
Signed-off-by: Woosuk Kwon <woosuk.kwon@berkeley.edu>
This commit is contained in:
parent
2039c6305b
commit
274d8e8818
@@ -47,13 +47,16 @@ class SpecDecodingMetrics:
|
||||
num_draft_tokens = np.sum(self.num_draft_tokens)
|
||||
num_accepted_tokens = np.sum(self.num_accepted_tokens)
|
||||
|
||||
draft_acceptance_rate = (num_accepted_tokens / num_draft_tokens
|
||||
if num_draft_tokens > 0 else float("nan"))
|
||||
draft_acceptance_rate = (num_accepted_tokens / num_draft_tokens *
|
||||
100 if num_draft_tokens > 0 else float("nan"))
|
||||
|
||||
logger.info(
|
||||
"Speculative metrics: "
|
||||
"Draft acceptance rate: %.3f, "
|
||||
"Number of accepted tokens: %d, "
|
||||
"Number of draft tokens: %d, ", draft_acceptance_rate,
|
||||
num_accepted_tokens, num_draft_tokens)
|
||||
"SpecDecoding metrics: "
|
||||
"Draft acceptance rate: %.1f%%, "
|
||||
"Accepted: %d tokens, "
|
||||
"Drafted: %d tokens",
|
||||
draft_acceptance_rate,
|
||||
num_accepted_tokens,
|
||||
num_draft_tokens,
|
||||
)
|
||||
self.reset()
|
||||
|
||||
Loading…
x
Reference in New Issue
Block a user