From 5687d584fe4825d59a6fd9ecc5840e1df04e380f Mon Sep 17 00:00:00 2001
From: ljss <31004720+beginlner@users.noreply.github.com>
Date: Wed, 1 Nov 2023 17:14:18 +0800
Subject: [PATCH] [BugFix] Set engine_use_ray=True when TP>1 (#1531)

---
 vllm/engine/async_llm_engine.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/vllm/engine/async_llm_engine.py b/vllm/engine/async_llm_engine.py
index aa7775124224..d6c1c2939873 100644
--- a/vllm/engine/async_llm_engine.py
+++ b/vllm/engine/async_llm_engine.py
@@ -484,7 +484,7 @@ def from_engine_args(cls,
         distributed_init_method, placement_group = initialize_cluster(
             parallel_config, engine_args.engine_use_ray)
         # Create the async LLM engine.
-        engine = cls(engine_args.worker_use_ray,
+        engine = cls(parallel_config.worker_use_ray,
                      engine_args.engine_use_ray,
                      *engine_configs,
                      distributed_init_method,