comment

Signed-off-by: Roger Wang <[email protected]>
vllm-project · Oct 31, 2024 · 5a4b59c
1 parent 5905c0e
commit 5a4b59c
Showing 1 changed file with 1 addition and 1 deletion.
diff --git a/vllm/worker/model_runner.py b/vllm/worker/model_runner.py
@@ -995,7 +995,7 @@ def __init__(
         # Python can be expensive. To optimize this, we cache the block table
         # in numpy and only copy the actual input content at every iteration.
         # The shape of the cached block table will be
-        # (max batch size to capture, max context len to capture / block size).
+        # (max batch size to capture, max seq len to capture / block size).
         self.graph_block_tables = np.zeros(
             (self.max_batchsize_to_capture, self.get_max_block_per_batch()),
             dtype=np.int32)