diff --git a/vllm/entrypoints/openai/rpc/server.py b/vllm/entrypoints/openai/rpc/server.py
index e72d039d315ad..af406d8715403 100644
--- a/vllm/entrypoints/openai/rpc/server.py
+++ b/vllm/entrypoints/openai/rpc/server.py
@@ -3,6 +3,7 @@
 from typing import Any, Coroutine
 
 import cloudpickle
+import uvloop
 import zmq
 import zmq.asyncio
 from typing_extensions import Never
@@ -217,4 +218,4 @@ def signal_handler() -> None:
 def run_rpc_server(async_engine_args: AsyncEngineArgs,
                    usage_context: UsageContext, rpc_path: str):
     server = AsyncEngineRPCServer(async_engine_args, usage_context, rpc_path)
-    asyncio.run(run_server(server))
+    uvloop.run(run_server(server))