diff --git a/vllm/engine/async_llm_engine.py b/vllm/engine/async_llm_engine.py index aa7775124224..d6c1c2939873 100644 --- a/vllm/engine/async_llm_engine.py +++ b/vllm/engine/async_llm_engine.py @@ -484,7 +484,7 @@ def from_engine_args(cls, distributed_init_method, placement_group = initialize_cluster( parallel_config, engine_args.engine_use_ray) # Create the async LLM engine. - engine = cls(engine_args.worker_use_ray, + engine = cls(parallel_config.worker_use_ray, engine_args.engine_use_ray, *engine_configs, distributed_init_method,