diff --git a/scripts/launch_triton_server.py b/scripts/launch_triton_server.py
index e0dcc2ef..bdd6d7cb 100644
--- a/scripts/launch_triton_server.py
+++ b/scripts/launch_triton_server.py
@@ -111,4 +111,4 @@ def get_cmd(world_size, tritonserver, grpc_port, http_port, metrics_port,
     if args.multi_model:
         assert args.world_size == 1, 'World size must be 1 when using multi-model. Processes will be spawned automatically to run the multi-GPU models'
         env['TRTLLM_ORCHESTRATOR'] = '1'
-    subprocess.Popen(cmd, env=env)
+    subprocess.run(cmd, env=env, check=True)