forked from pytorch/pytorch
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathnccl.py
76 lines (70 loc) · 2.74 KB
/
nccl.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
import os
import glob
from .env import IS_WINDOWS, IS_DARWIN, IS_CONDA, CONDA_DIR, check_negative_env_flag, \
gather_paths
from .cuda import USE_CUDA, CUDA_HOME
# NCCL support is requested only when USE_CUDA is truthy, the USE_NCCL
# environment flag has not been negated, and the platform is neither macOS
# (IS_DARWIN) nor Windows (IS_WINDOWS).
USE_NCCL = USE_CUDA and not (
    check_negative_env_flag('USE_NCCL') or IS_DARWIN or IS_WINDOWS
)

# Defaults for the system NCCL lookup; they stay at these values unless the
# detection code further down in this module finds an installation.
USE_SYSTEM_NCCL = False
NCCL_ROOT_DIR = None
NCCL_INCLUDE_DIR = None
NCCL_LIB_DIR = None
NCCL_SYSTEM_LIB = None

# NOTE: the mere presence of USE_STATIC_NCCL in the environment (whatever its
# value, even "0" or an empty string) selects the static library name prefix.
USE_STATIC_NCCL = os.getenv("USE_STATIC_NCCL")
LIBNCCL_PREFIX = "libnccl" if USE_STATIC_NCCL is None else "libnccl_static"
def _nccl_child_dirs(root, *relative_dirs):
    """Return ``root`` joined with each entry of ``relative_dirs``.

    An unset or empty ``root`` yields an empty list, so that no relative
    search path (e.g. a bare ``lib``) is produced by accident.
    """
    if not root:
        return []
    return [os.path.join(root, relative) for relative in relative_dirs]


def _find_nccl_library(search_dirs, prefix):
    """Locate the NCCL library in the first directory that contains one.

    Args:
        search_dirs: candidate directories, in priority order.
        prefix: file name prefix of the library (e.g. ``libnccl``).

    Returns:
        A ``(directory, library_file)`` tuple, or ``(None, None)`` when no
        directory contains a file whose name starts with ``prefix``.
    """
    for candidate in search_dirs:
        candidate = os.path.expanduser(candidate)
        if not os.path.isdir(candidate):
            continue
        # glob returns matches in arbitrary order; sort them so that the
        # selected file is reproducible from one build to the next.
        matches = sorted(glob.glob(os.path.join(candidate, prefix + '*')))
        if not matches:
            continue
        # Prefer an exact versioned .so/.dylib (a name containing a digit)
        # over the bare library name, and resolve symlinks to the real file.
        versioned = sorted(
            glob.glob(os.path.join(candidate, prefix + '*[0-9]*')))
        if versioned:
            return candidate, os.path.realpath(versioned[0])
        return candidate, matches[0]
    return None, None


def _find_nccl_include_dir(search_dirs):
    """Return the first directory in ``search_dirs`` holding ``nccl.h``.

    Returns ``None`` when the header is not found in any directory.
    """
    for candidate in search_dirs:
        candidate = os.path.expanduser(candidate)
        if os.path.isfile(os.path.join(candidate, 'nccl.h')):
            return candidate
    return None


def _nccl_common_root(lib_dir, include_dir):
    """Return the deepest directory that is an ancestor of both paths.

    ``os.path.commonprefix`` compares strings character by character, so
    applied to ``/usr/lib`` and ``/usr/local/include`` it yields ``/usr/l``,
    which is not a real directory.  Comparing whole path components instead
    always produces a valid ancestor (``/usr`` in that example).  An empty
    string is returned when the paths share no leading component.
    """
    components = [
        os.path.normpath(directory).split(os.sep)
        for directory in (lib_dir, include_dir)
    ]
    # commonprefix works on any sequences, so here it compares components.
    shared = os.path.commonprefix(components)
    root = os.sep.join(shared)
    if not root and shared:
        # Only the leading empty component is shared, i.e. the two absolute
        # paths have nothing in common but the filesystem root.
        root = os.sep
    return root


# Look for an NCCL installation already present on the system, unless CUDA is
# disabled or the USE_SYSTEM_NCCL environment flag has been negated.
if USE_CUDA and not check_negative_env_flag('USE_SYSTEM_NCCL'):
    # Optional user-supplied hints; they are searched before any default.
    ENV_ROOT = os.getenv('NCCL_ROOT_DIR', None)
    LIB_DIR = os.getenv('NCCL_LIB_DIR', None)
    INCLUDE_DIR = os.getenv('NCCL_INCLUDE_DIR', None)

    # Library search order: explicit hints, the CUDA toolkit, well-known
    # system directories, then the linker search path environment variables.
    # filter(bool, ...) drops unset hints and empty path entries.
    lib_paths = list(filter(bool, (
        [LIB_DIR, ENV_ROOT]
        + _nccl_child_dirs(
            ENV_ROOT,
            'lib',
            os.path.join('lib', 'x86_64-linux-gnu'),
            'lib64',
        )
        + _nccl_child_dirs(CUDA_HOME, 'lib', 'lib64')
        + [
            '/usr/local/lib',
            '/usr/lib/x86_64-linux-gnu/',
            '/usr/lib/powerpc64le-linux-gnu/',
            '/usr/lib/aarch64-linux-gnu/',
            '/usr/lib',
        ]
        + gather_paths(['LIBRARY_PATH'])
        + gather_paths(['LD_LIBRARY_PATH'])
    )))

    # Header search order: explicit hints, the CUDA toolkit, system defaults.
    include_paths = list(filter(bool, (
        [INCLUDE_DIR, ENV_ROOT]
        + _nccl_child_dirs(ENV_ROOT, 'include')
        + _nccl_child_dirs(CUDA_HOME, 'include')
        + [
            '/usr/local/include',
            '/usr/include',
        ]
    )))

    if IS_CONDA:
        # Search both halves of the conda prefix: a library found under
        # CONDA_DIR/lib is only usable if its header can be found as well.
        lib_paths.append(os.path.join(CONDA_DIR, 'lib'))
        include_paths.append(os.path.join(CONDA_DIR, 'include'))

    NCCL_LIB_DIR, NCCL_SYSTEM_LIB = _find_nccl_library(
        lib_paths, LIBNCCL_PREFIX)
    NCCL_INCLUDE_DIR = _find_nccl_include_dir(include_paths)

    # The system NCCL is used only when both the library and nccl.h exist.
    if NCCL_LIB_DIR is not None and NCCL_INCLUDE_DIR is not None:
        USE_SYSTEM_NCCL = True
        NCCL_ROOT_DIR = _nccl_common_root(NCCL_LIB_DIR, NCCL_INCLUDE_DIR)