diff --git a/vllm/entrypoints/api_server.py b/vllm/entrypoints/api_server.py index c81ff958531..1c027181156 100644 --- a/vllm/entrypoints/api_server.py +++ b/vllm/entrypoints/api_server.py @@ -111,7 +111,7 @@ async def init_app( engine = (llm_engine if llm_engine is not None else AsyncLLMEngine.from_engine_args( engine_args, usage_context=UsageContext.API_SERVER)) - + app.state.engine_client = engine return app