mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-05-31 03:27:04 +08:00
[V1][Minor] Enhance SpecDecoding Metrics Log in V1 (#15902)
Signed-off-by: Woosuk Kwon <woosuk.kwon@berkeley.edu>
This commit is contained in:
parent
2039c6305b
commit
274d8e8818
@ -47,13 +47,16 @@ class SpecDecodingMetrics:
|
|||||||
num_draft_tokens = np.sum(self.num_draft_tokens)
|
num_draft_tokens = np.sum(self.num_draft_tokens)
|
||||||
num_accepted_tokens = np.sum(self.num_accepted_tokens)
|
num_accepted_tokens = np.sum(self.num_accepted_tokens)
|
||||||
|
|
||||||
draft_acceptance_rate = (num_accepted_tokens / num_draft_tokens
|
draft_acceptance_rate = (num_accepted_tokens / num_draft_tokens *
|
||||||
if num_draft_tokens > 0 else float("nan"))
|
100 if num_draft_tokens > 0 else float("nan"))
|
||||||
|
|
||||||
logger.info(
|
logger.info(
|
||||||
"Speculative metrics: "
|
"SpecDecoding metrics: "
|
||||||
"Draft acceptance rate: %.3f, "
|
"Draft acceptance rate: %.1f%%, "
|
||||||
"Number of accepted tokens: %d, "
|
"Accepted: %d tokens, "
|
||||||
"Number of draft tokens: %d, ", draft_acceptance_rate,
|
"Drafted: %d tokens",
|
||||||
num_accepted_tokens, num_draft_tokens)
|
draft_acceptance_rate,
|
||||||
|
num_accepted_tokens,
|
||||||
|
num_draft_tokens,
|
||||||
|
)
|
||||||
self.reset()
|
self.reset()
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user