From f6c91d6896a018a1a1792465574248ef7ba33d65 Mon Sep 17 00:00:00 2001 From: Le Xu Date: Thu, 26 Dec 2024 17:23:29 -0800 Subject: [PATCH] fix metrics percentage print --- vllm/engine/metrics.py | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/vllm/engine/metrics.py b/vllm/engine/metrics.py index 1d8a2d5e01163..8a109696f0b73 100644 --- a/vllm/engine/metrics.py +++ b/vllm/engine/metrics.py @@ -503,7 +503,8 @@ def log(self, stats: Stats) -> None: logger.info( "Cache service hit rate: by tokens: %.2f%%, by blocks: %.2f%%", - stats.cache_service_tokens_hit_rate, stats.cache_service_blocks_hit_rate + stats.cache_service_tokens_hit_rate * 100, + stats.cache_service_blocks_hit_rate * 100, ) # Reset tracked stats for next interval. self.num_prompt_tokens = []