blob: 2e30a867a7768aa7616377c7bd6dbe341722a247 (
plain) (
blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
|
RESOURCES_LIBRARY()
# https://wiki.yandex-team.ru/devtools/cuda/
OWNER(g:contrib somov)
IF (NOT HAVE_CUDA)
MESSAGE(FATAL_ERROR "No CUDA Toolkit for your build")
ENDIF()
IF (USE_ARCADIA_CUDA)
IF (HOST_OS_LINUX AND HOST_ARCH_X86_64)
IF (OS_LINUX AND ARCH_X86_64)
IF (CUDA_VERSION == "11.4")
DECLARE_EXTERNAL_RESOURCE(CUDA sbr:2410761119) # CUDA Toolkit 11.4.2 for Linux x86-64
ELSEIF (CUDA_VERSION == "11.3")
DECLARE_EXTERNAL_RESOURCE(CUDA sbr:2213063565) # CUDA Toolkit 11.3.1 for Linux x86-64
ELSEIF (CUDA_VERSION == "11.0")
DECLARE_EXTERNAL_RESOURCE(CUDA sbr:1647896014) # CUDA Toolkit 11.0.2 for Linux x86-64
ELSEIF (CUDA_VERSION == "10.1")
DECLARE_EXTERNAL_RESOURCE(CUDA sbr:2077988857) # CUDA Toolkit 10.1.168 for Linux x86-64
ELSE()
ENABLE(CUDA_NOT_FOUND)
ENDIF()
ELSEIF(OS_LINUX AND ARCH_AARCH64)
IF (CUDA_VERSION == "11.3")
DECLARE_EXTERNAL_RESOURCE(CUDA sbr:2227720086) # CUDA Toolkit 11.3.20210513 (11.3.1) for Linux x86-64 with linux-aarch64 support
# host tools installer https://sandbox.yandex-team.ru/resource/2227828799/view
# cross compile parts installer https://sandbox.yandex-team.ru/resource/2227885870/view
ELSE()
ENABLE(CUDA_NOT_FOUND)
ENDIF()
ELSE()
ENABLE(CUDA_NOT_FOUND)
ENDIF()
ELSEIF (HOST_OS_LINUX AND HOST_ARCH_PPC64LE)
IF (OS_LINUX AND ARCH_PPC64LE)
IF (CUDA_VERSION == "10.1")
DECLARE_EXTERNAL_RESOURCE(CUDA sbr:1586537264) # CUDA Toolkit 10.1.168 for Linux ppc64le
ELSE()
ENABLE(CUDA_NOT_FOUND)
ENDIF()
ELSE()
ENABLE(CUDA_NOT_FOUND)
ENDIF()
ELSEIF (HOST_OS_DARWIN AND HOST_ARCH_X86_64)
IF (OS_DARWIN AND ARCH_X86_64)
IF (CUDA_VERSION == "10.1")
DECLARE_EXTERNAL_RESOURCE(CUDA sbr:978727023) # CUDA Toolkit 10.1.168 for macOS x86-64
ENDIF()
ELSE()
ENABLE(CUDA_NOT_FOUND)
ENDIF()
ELSEIF (HOST_OS_WINDOWS AND HOST_ARCH_X86_64)
IF (OS_WINDOWS AND ARCH_X86_64)
IF (CUDA_VERSION == "11.3")
DECLARE_EXTERNAL_RESOURCE(CUDA sbr:2215101513) # CUDA Toolkit 11.3.1 for Windows x86-64
ELSEIF (CUDA_VERSION == "10.1")
DECLARE_EXTERNAL_RESOURCE(CUDA sbr:978734165) # CUDA Toolkit 10.1.168 for Windows x86-64
ELSE()
ENABLE(CUDA_NOT_FOUND)
ENDIF()
ELSE()
ENABLE(CUDA_NOT_FOUND)
ENDIF()
ELSE()
ENABLE(CUDA_NOT_FOUND)
ENDIF()
ENDIF()
IF (USE_ARCADIA_CUDA_HOST_COMPILER)
IF (HOST_OS_LINUX AND HOST_ARCH_X86_64)
IF (OS_LINUX AND ARCH_X86_64)
DECLARE_EXTERNAL_RESOURCE(CUDA_HOST_TOOLCHAIN sbr:1886578148) # Clang 11.0.0 for linux-x86_64
IF (CUDA_VERSION VERSION_LT "11.2")
# Equivalent to nvcc -allow-unsupported-compiler (present since 11.0).
CFLAGS(GLOBAL "-D__NV_NO_HOST_COMPILER_CHECK")
ENDIF()
ELSEIF(OS_LINUX AND ARCH_AARCH64)
DECLARE_EXTERNAL_RESOURCE(CUDA_HOST_TOOLCHAIN sbr:1886578148) # Clang 11.0.0 for linux-x86_64
ELSE()
ENABLE(CUDA_HOST_COMPILER_NOT_FOUND)
ENDIF()
ELSEIF (HOST_OS_LINUX AND HOST_ARCH_PPC64LE)
IF (OS_LINUX AND ARCH_PPC64LE)
IF (CUDA_VERSION == "10.1")
DECLARE_EXTERNAL_RESOURCE(CUDA_HOST_TOOLCHAIN sbr:1566513994) # Clang 7.0 for Linux ppc64le (not latest)
ELSE()
ENABLE(CUDA_HOST_COMPILER_NOT_FOUND)
ENDIF()
ELSE()
ENABLE(CUDA_HOST_COMPILER_NOT_FOUND)
ENDIF()
ELSEIF (HOST_OS_DARWIN AND HOST_ARCH_X86_64)
IF (OS_DARWIN AND ARCH_X86_64)
SET(__XCODE_RESOURCE_NAME CUDA_HOST_TOOLCHAIN)
IF (CUDA_VERSION == "10.1")
SET(__XCODE_TOOLCHAIN_VERSION "9.2") # (not latest)
ELSE()
SET(__XCODE_TOOLCHAIN_VERSION "")
ENABLE(CUDA_HOST_COMPILER_NOT_FOUND)
ENDIF()
IF (__XCODE_TOOLCHAIN_VERSION)
INCLUDE(${ARCADIA_ROOT}/build/platform/xcode/ya.make.inc)
ENDIF()
ELSE()
ENABLE(CUDA_HOST_COMPILER_NOT_FOUND)
ENDIF()
ELSEIF (HOST_OS_WINDOWS AND HOST_ARCH_X86_64)
IF (OS_WINDOWS AND ARCH_X86_64)
# To create this toolchain, install MSVS on Windows and run:
# devtools/tools_build/pack_sdk.py msvc out.tar
# Note: it will contain patched "VC/Auxiliary/Build/vcvarsall.bat"
# to prevent "nvcc fatal : Host compiler targets unsupported OS."
IF (CUDA_HOST_MSVC_VERSION == "14.28.29910")
DECLARE_EXTERNAL_RESOURCE(CUDA_HOST_TOOLCHAIN sbr:2153212401)
ELSE()
MESSAGE(FATAL_ERROR "Unexpected or unspecified Microsoft Visual C++ CUDA host compiler version")
ENDIF()
ELSE()
ENABLE(CUDA_HOST_COMPILER_NOT_FOUND)
ENDIF()
ELSE()
ENABLE(CUDA_HOST_COMPILER_NOT_FOUND)
ENDIF()
ENDIF()
IF (CUDA_NOT_FOUND)
MESSAGE(FATAL_ERROR "No CUDA Toolkit for the selected platform")
ENDIF()
IF (CUDA_HOST_COMPILER_NOT_FOUND)
MESSAGE(FATAL_ERROR "No CUDA host compiler for the selected platform and CUDA Toolkit version ${CUDA_VERSION}")
ENDIF()
# Use thrust and cub from Arcadia, not from HPC SDK
# NB:
# it would be better to use PEERDIR instead,
# but ymake does not allow PEERDIRs from RESOURCES_LIBRARY.
ADDINCL(
GLOBAL contrib/libs/nvidia/thrust
GLOBAL contrib/libs/nvidia/cub
)
IF (HOST_OS_WINDOWS)
SET_APPEND_WITH_GLOBAL(USER_CFLAGS GLOBAL "\"-I${CUDA_ROOT}/include\"")
ELSE()
CFLAGS(GLOBAL "-I${CUDA_ROOT}/include")
ENDIF()
IF (HOST_OS_WINDOWS)
SET_APPEND(LDFLAGS_GLOBAL "\"/LIBPATH:${CUDA_ROOT}/lib/x64\"")
ELSEIF(HOST_OS_LINUX AND OS_LINUX AND ARCH_AARCH64)
LDFLAGS("-L${CUDA_ROOT}/targets/sbsa-linux/lib")
ELSEIF(HOST_OS_LINUX)
LDFLAGS("-L${CUDA_ROOT}/lib64")
ELSE()
LDFLAGS("-L${CUDA_ROOT}/lib")
ENDIF()
IF (CUDA_REQUIRED)
IF(HOST_OS_LINUX)
LDFLAGS("-L${CUDA_ROOT}/lib64/stubs")
EXTRALIBS(-lcuda)
ELSEIF(HOST_OS_DARWIN)
LDFLAGS("-F${CUDA_ROOT}/lib/stubs -framework CUDA")
ENDIF()
ENDIF()
IF (HOST_OS_WINDOWS)
LDFLAGS(cudadevrt.lib cudart_static.lib)
ELSE()
EXTRALIBS(-lcudadevrt -lcudart_static -lculibos)
ENDIF()
END()
|