diff --git a/vllm/engine/metrics.py b/vllm/engine/metrics.py index 1d8a2d5e01163..8a109696f0b73 100644 --- a/vllm/engine/metrics.py +++ b/vllm/engine/metrics.py @@ -503,7 +503,8 @@ def log(self, stats: Stats) -> None: logger.info( "Cache service hit rate: by tokens: %.2f%%, by blocks: %.2f%%", - stats.cache_service_tokens_hit_rate, stats.cache_service_blocks_hit_rate + stats.cache_service_tokens_hit_rate * 100, + stats.cache_service_blocks_hit_rate * 100, ) # Reset tracked stats for next interval. self.num_prompt_tokens = []