From 31ba41fd49e32edde4ffc532fdad56c252931b56 Mon Sep 17 00:00:00 2001 From: Sourashis Roy Date: Fri, 20 Dec 2024 05:26:57 +0000 Subject: [PATCH] Rerun tests Signed-off-by: Sourashis Roy --- vllm/v1/worker/gpu_input_batch.py | 1 - 1 file changed, 1 deletion(-) diff --git a/vllm/v1/worker/gpu_input_batch.py b/vllm/v1/worker/gpu_input_batch.py index fcb1df1d27928..dcbb7b7825aa5 100644 --- a/vllm/v1/worker/gpu_input_batch.py +++ b/vllm/v1/worker/gpu_input_batch.py @@ -395,7 +395,6 @@ def _construct_prompt_tokens_tensor( # TODO - Add a method in vllm/utils.py to pad a numpy array similar # to make_tensor_with_pad which takes a list and move the logic # there. - padded_prompts = np.full((self.num_reqs, max_prompt_len), vocab_size, dtype=np.int64)