@@ -142,76 +142,14 @@ DEPS_SONAME=(
142
142
" libcublasLt.so.11"
143
143
" libgomp.so.1"
144
144
)
145
- elif [[ $CUDA_VERSION == " 11.7" ]]; then
145
+ elif [[ $CUDA_VERSION == " 11.7" || $CUDA_VERSION == " 11.8 " ]]; then
146
146
export USE_STATIC_CUDNN=0
147
147
# Try parallelizing nvcc as well
148
148
export TORCH_NVCC_FLAGS=" -Xfatbin -compress-all --threads 2"
149
149
DEPS_LIST=(
150
- " /usr/local/cuda/lib64/libcudart.so.11.0"
151
- " /usr/local/cuda/lib64/libnvToolsExt.so.1"
152
- " /usr/local/cuda/lib64/libnvrtc.so.11.2" # this is not a mistake for 11.7, it links to 11.7.50
153
- " /usr/local/cuda/lib64/libnvrtc-builtins.so.11.7"
154
150
" $LIBGOMP_PATH "
155
151
)
156
152
DEPS_SONAME=(
157
- " libcudart.so.11.0"
158
- " libnvToolsExt.so.1"
159
- " libnvrtc.so.11.2"
160
- " libnvrtc-builtins.so.11.7"
161
- " libgomp.so.1"
162
- )
163
-
164
- if [[ -z " $PYTORCH_EXTRA_INSTALL_REQUIREMENTS " ]]; then
165
- echo " Bundling with cudnn and cublas."
166
- DEPS_LIST+=(
167
- " /usr/local/cuda/lib64/libcudnn_adv_infer.so.8"
168
- " /usr/local/cuda/lib64/libcudnn_adv_train.so.8"
169
- " /usr/local/cuda/lib64/libcudnn_cnn_infer.so.8"
170
- " /usr/local/cuda/lib64/libcudnn_cnn_train.so.8"
171
- " /usr/local/cuda/lib64/libcudnn_ops_infer.so.8"
172
- " /usr/local/cuda/lib64/libcudnn_ops_train.so.8"
173
- " /usr/local/cuda/lib64/libcudnn.so.8"
174
- " /usr/local/cuda/lib64/libcublas.so.11"
175
- " /usr/local/cuda/lib64/libcublasLt.so.11"
176
- )
177
- DEPS_SONAME+=(
178
- " libcudnn_adv_infer.so.8"
179
- " libcudnn_adv_train.so.8"
180
- " libcudnn_cnn_infer.so.8"
181
- " libcudnn_cnn_train.so.8"
182
- " libcudnn_ops_infer.so.8"
183
- " libcudnn_ops_train.so.8"
184
- " libcudnn.so.8"
185
- " libcublas.so.11"
186
- " libcublasLt.so.11"
187
- )
188
- else
189
- echo " Using cudnn and cublas from pypi."
190
- CUDA_RPATHS=(
191
- ' $ORIGIN/../../nvidia/cublas/lib'
192
- ' $ORIGIN/../../nvidia/cudnn/lib'
193
- )
194
- CUDA_RPATHS=$( IFS=: ; echo " ${CUDA_RPATHS[*]} " )
195
- export C_SO_RPATH=$CUDA_RPATHS ' :$ORIGIN:$ORIGIN/lib'
196
- export LIB_SO_RPATH=$CUDA_RPATHS ' :$ORIGIN'
197
- export FORCE_RPATH=" --force-rpath"
198
- fi
199
- elif [[ $CUDA_VERSION == " 11.8" ]]; then
200
- export USE_STATIC_CUDNN=0
201
- # Try parallelizing nvcc as well
202
- export TORCH_NVCC_FLAGS=" -Xfatbin -compress-all --threads 2"
203
- DEPS_LIST=(
204
- " /usr/local/cuda/lib64/libcudart.so.11.0"
205
- " /usr/local/cuda/lib64/libnvToolsExt.so.1"
206
- " /usr/local/cuda/lib64/libnvrtc.so.11.2" # this is not a mistake for 11.8, it links to 11.8.89
207
- " /usr/local/cuda/lib64/libnvrtc-builtins.so.11.8"
208
- " $LIBGOMP_PATH "
209
- )
210
- DEPS_SONAME=(
211
- " libcudart.so.11.0"
212
- " libnvToolsExt.so.1"
213
- " libnvrtc.so.11.2"
214
- " libnvrtc-builtins.so.11.8"
215
153
" libgomp.so.1"
216
154
)
217
155
@@ -227,6 +165,9 @@ elif [[ $CUDA_VERSION == "11.8" ]]; then
227
165
" /usr/local/cuda/lib64/libcudnn.so.8"
228
166
" /usr/local/cuda/lib64/libcublas.so.11"
229
167
" /usr/local/cuda/lib64/libcublasLt.so.11"
168
+ " /usr/local/cuda/lib64/libcudart.so.11.0"
169
+ " /usr/local/cuda/lib64/libnvToolsExt.so.1"
170
+ " /usr/local/cuda/lib64/libnvrtc.so.11.2" # this is not a mistake, it links to more specific cuda version
230
171
)
231
172
DEPS_SONAME+=(
232
173
" libcudnn_adv_infer.so.8"
@@ -238,17 +179,52 @@ elif [[ $CUDA_VERSION == "11.8" ]]; then
238
179
" libcudnn.so.8"
239
180
" libcublas.so.11"
240
181
" libcublasLt.so.11"
182
+ " libcudart.so.11.0"
183
+ " libnvToolsExt.so.1"
184
+ " libnvrtc.so.11.2"
241
185
)
186
+ if [[ $CUDA_VERSION == " 11.7" ]]; then
187
+ DEPS_LIST+=(
188
+ " /usr/local/cuda/lib64/libnvrtc-builtins.so.11.7"
189
+ )
190
+ DEPS_SONAME+=(
191
+ " libnvrtc-builtins.so.11.7"
192
+ )
193
+ fi
194
+ if [[ $CUDA_VERSION == " 11.8" ]]; then
195
+ DEPS_LIST+=(
196
+ " /usr/local/cuda/lib64/libnvrtc-builtins.so.11.8"
197
+ )
198
+ DEPS_SONAME+=(
199
+ " libnvrtc-builtins.so.11.8"
200
+ )
201
+ fi
242
202
else
243
- echo " Using cudnn and cublas from pypi."
203
+ echo " Using nvidia libs from pypi."
244
204
CUDA_RPATHS=(
245
205
' $ORIGIN/../../nvidia/cublas/lib'
206
+ ' $ORIGIN/../../nvidia/cuda_cupti/lib'
207
+ ' $ORIGIN/../../nvidia/cuda_nvrtc/lib'
208
+ ' $ORIGIN/../../nvidia/cuda_runtime/lib'
246
209
' $ORIGIN/../../nvidia/cudnn/lib'
210
+ ' $ORIGIN/../../nvidia/cufft/lib'
211
+ ' $ORIGIN/../../nvidia/curand/lib'
212
+ ' $ORIGIN/../../nvidia/cusolver/lib'
213
+ ' $ORIGIN/../../nvidia/cusparse/lib'
214
+ ' $ORIGIN/../../nvidia/nccl/lib'
215
+ ' $ORIGIN/../../nvidia/nvtx/lib'
247
216
)
248
217
CUDA_RPATHS=$( IFS=: ; echo " ${CUDA_RPATHS[*]} " )
249
218
export C_SO_RPATH=$CUDA_RPATHS ' :$ORIGIN:$ORIGIN/lib'
250
219
export LIB_SO_RPATH=$CUDA_RPATHS ' :$ORIGIN'
251
220
export FORCE_RPATH=" --force-rpath"
221
+ export USE_STATIC_NCCL=0
222
+ export USE_SYSTEM_NCCL=1
223
+ export ATEN_STATIC_CUDA=0
224
+ export USE_CUDA_STATIC_LINK=0
225
+ export USE_CUPTI_SO=1
226
+ export NCCL_INCLUDE_DIR=" /usr/local/cuda/include/"
227
+ export NCCL_LIB_DIR=" /usr/local/cuda/lib64/"
252
228
fi
253
229
else
254
230
echo " Unknown cuda version $CUDA_VERSION "
0 commit comments