Skip to content

Commit 7fbb9d8

Browse files
authored
Cuda 11.6 include libraries like cudnn and others (#1017)
* Manywheel and conda builds for CUDA 11.6 * Fix typo * Correct comment
1 parent 992ca12 commit 7fbb9d8

File tree

2 files changed

+46
-0
lines changed

2 files changed

+46
-0
lines changed

conda/pytorch-nightly/build.sh

+7
Original file line numberDiff line numberDiff line change
@@ -71,6 +71,13 @@ if [[ -n "$build_with_cuda" ]]; then
7171
export USE_STATIC_CUDNN=0
7272
#for cuda 11.5 include all dynamic loading libraries
7373
DEPS_LIST=(/usr/local/cuda/lib64/libcudnn*.so.8 /usr/local/cuda-11.5/extras/CUPTI/lib64/libcupti.so.11.5)
74+
elif [[ $CUDA_VERSION == 11.6* ]]; then
75+
export TORCH_CUDA_ARCH_LIST="$TORCH_CUDA_ARCH_LIST;6.0;6.1;7.0;7.5;8.0;8.6"
76+
#for cuda 11.6 (as for cuda 11.5) we use cudnn 8.3.2.44 https://docs.nvidia.com/deeplearning/cudnn/release-notes/rel_8.html
77+
#which does not have single static libcudnn_static.a deliverable to link with
78+
export USE_STATIC_CUDNN=0
79+
#for cuda 11.6 include all dynamic loading libraries
80+
DEPS_LIST=(/usr/local/cuda/lib64/libcudnn*.so.8 /usr/local/cuda-11.6/extras/CUPTI/lib64/libcupti.so.11.6)
7481
fi
7582
export NCCL_ROOT_DIR=/usr/local/cuda
7683
export USE_STATIC_NCCL=1 # links nccl statically (driven by tools/setup_helpers/nccl.py, some of the NCCL cmake files such as FindNCCL.cmake and gloo/FindNCCL.cmake)

manywheel/build_cuda.sh

+39
Original file line numberDiff line numberDiff line change
@@ -138,6 +138,8 @@ DEPS_LIST=(
138138
"/usr/local/cuda/lib64/libcudnn_ops_infer.so.8"
139139
"/usr/local/cuda/lib64/libcudnn_ops_train.so.8"
140140
"/usr/local/cuda/lib64/libcudnn.so.8"
141+
"/usr/local/cuda/lib64/libcublas.so.11"
142+
"/usr/local/cuda/lib64/libcublasLt.so.11"
141143
"$LIBGOMP_PATH"
142144
)
143145

@@ -153,6 +155,8 @@ DEPS_SONAME=(
153155
"libcudnn_ops_infer.so.8"
154156
"libcudnn_ops_train.so.8"
155157
"libcudnn.so.8"
158+
"libcublas.so.11"
159+
"libcublasLt.so.11"
156160
"libgomp.so.1"
157161
)
158162
elif [[ $CUDA_VERSION == "11.5" ]]; then
@@ -189,6 +193,41 @@ DEPS_SONAME=(
189193
"libcublasLt.so.11"
190194
"libgomp.so.1"
191195
)
196+
elif [[ $CUDA_VERSION == "11.6" ]]; then
197+
export USE_STATIC_CUDNN=0
198+
DEPS_LIST=(
199+
"/usr/local/cuda/lib64/libcudart.so.11.0"
200+
"/usr/local/cuda/lib64/libnvToolsExt.so.1"
201+
"/usr/local/cuda/lib64/libnvrtc.so.11.2" # this is not a mistake for 11.6
202+
"/usr/local/cuda/lib64/libnvrtc-builtins.so.11.6"
203+
"/usr/local/cuda/lib64/libcudnn_adv_infer.so.8"
204+
"/usr/local/cuda/lib64/libcudnn_adv_train.so.8"
205+
"/usr/local/cuda/lib64/libcudnn_cnn_infer.so.8"
206+
"/usr/local/cuda/lib64/libcudnn_cnn_train.so.8"
207+
"/usr/local/cuda/lib64/libcudnn_ops_infer.so.8"
208+
"/usr/local/cuda/lib64/libcudnn_ops_train.so.8"
209+
"/usr/local/cuda/lib64/libcudnn.so.8"
210+
"/usr/local/cuda/lib64/libcublas.so.11"
211+
"/usr/local/cuda/lib64/libcublasLt.so.11"
212+
"$LIBGOMP_PATH"
213+
)
214+
DEPS_SONAME=(
215+
"libcudart.so.11.0"
216+
"libnvToolsExt.so.1"
217+
"libnvrtc.so.11.2"
218+
"libnvrtc-builtins.so.11.6"
219+
"libcudnn_adv_infer.so.8"
220+
"libcudnn_adv_train.so.8"
221+
"libcudnn_cnn_infer.so.8"
222+
"libcudnn_cnn_train.so.8"
223+
"libcudnn_ops_infer.so.8"
224+
"libcudnn_ops_train.so.8"
225+
"libcudnn.so.8"
226+
"libcublas.so.11"
227+
"libcublasLt.so.11"
228+
"libgomp.so.1"
229+
)
230+
192231

193232
# Try parallelizing nvcc as well
194233
export TORCH_NVCC_FLAGS="-Xfatbin -compress-all --threads 2"

0 commit comments

Comments
 (0)