diff --git a/vllm/distributed/utils.py b/vllm/distributed/utils.py index b8178af5a2d..4206a24465e 100644 --- a/vllm/distributed/utils.py +++ b/vllm/distributed/utils.py @@ -15,7 +15,6 @@ from torch.distributed import ProcessGroup, TCPStore from torch.distributed.distributed_c10d import (Backend, PrefixStore, _get_default_timeout, - _shutdown_backend, _unregister_process_group, is_nccl_available) from torch.distributed.rendezvous import rendezvous @@ -343,5 +342,7 @@ def stateless_destroy_torch_distributed_process_group( Destroy ProcessGroup returned by stateless_init_torch_distributed_process_group(). """ + # Lazy import for non-CUDA backends. + from torch.distributed.distributed_c10d import _shutdown_backend _shutdown_backend(pg) _unregister_process_group(pg.group_name)