[V1][Minor] Enhance SpecDecoding Metrics Log in V1 (#15902)
Signed-off-by: Woosuk Kwon <woosuk.kwon@berkeley.edu>
This commit is contained in:
@@ -47,13 +47,16 @@ class SpecDecodingMetrics:
|
||||
num_draft_tokens = np.sum(self.num_draft_tokens)
|
||||
num_accepted_tokens = np.sum(self.num_accepted_tokens)
|
||||
|
||||
draft_acceptance_rate = (num_accepted_tokens / num_draft_tokens
|
||||
if num_draft_tokens > 0 else float("nan"))
|
||||
draft_acceptance_rate = (num_accepted_tokens / num_draft_tokens *
|
||||
100 if num_draft_tokens > 0 else float("nan"))
|
||||
|
||||
logger.info(
|
||||
"Speculative metrics: "
|
||||
"Draft acceptance rate: %.3f, "
|
||||
"Number of accepted tokens: %d, "
|
||||
"Number of draft tokens: %d, ", draft_acceptance_rate,
|
||||
num_accepted_tokens, num_draft_tokens)
|
||||
"SpecDecoding metrics: "
|
||||
"Draft acceptance rate: %.1f%%, "
|
||||
"Accepted: %d tokens, "
|
||||
"Drafted: %d tokens",
|
||||
draft_acceptance_rate,
|
||||
num_accepted_tokens,
|
||||
num_draft_tokens,
|
||||
)
|
||||
self.reset()
|
||||
|
||||
Reference in New Issue
Block a user