diff --git a/vllm/engine/metrics.py b/vllm/engine/metrics.py index d3560f5fefff1..eb54f5641171e 100644 --- a/vllm/engine/metrics.py +++ b/vllm/engine/metrics.py @@ -230,8 +230,8 @@ class StatLogger: "Avg prompt throughput: %.1f tokens/s, " "Avg generation throughput: %.1f tokens/s, " "Running: %d reqs, Swapped: %d reqs, " - "Pending: %d reqs, GPU KV cache usage: %.1f%, " - "CPU KV cache usage: %.1f%", + "Pending: %d reqs, GPU KV cache usage: %.1f%%, " + "CPU KV cache usage: %.1f%%", prompt_throughput, generation_throughput, stats.num_running,