diff --git a/vllm/v1/spec_decode/metrics.py b/vllm/v1/spec_decode/metrics.py index 7fecbaeed4f..7bb3c209d1d 100644 --- a/vllm/v1/spec_decode/metrics.py +++ b/vllm/v1/spec_decode/metrics.py @@ -47,13 +47,16 @@ def log(self): num_draft_tokens = np.sum(self.num_draft_tokens) num_accepted_tokens = np.sum(self.num_accepted_tokens) - draft_acceptance_rate = (num_accepted_tokens / num_draft_tokens - if num_draft_tokens > 0 else float("nan")) + draft_acceptance_rate = (num_accepted_tokens / num_draft_tokens * + 100 if num_draft_tokens > 0 else float("nan")) logger.info( - "Speculative metrics: " - "Draft acceptance rate: %.3f, " - "Number of accepted tokens: %d, " - "Number of draft tokens: %d, ", draft_acceptance_rate, - num_accepted_tokens, num_draft_tokens) + "SpecDecoding metrics: " + "Draft acceptance rate: %.1f%%, " + "Accepted: %d tokens, " + "Drafted: %d tokens", + draft_acceptance_rate, + num_accepted_tokens, + num_draft_tokens, + ) self.reset()