@@ -147,13 +147,9 @@ elif [[ $CUDA_VERSION == "11.7" ]]; then
147
147
# Try parallelizing nvcc as well
148
148
export TORCH_NVCC_FLAGS=" -Xfatbin -compress-all --threads 2"
149
149
DEPS_LIST=(
150
- " /usr/local/cuda/lib64/libcudart.so.11.0"
151
- " /usr/local/cuda/lib64/libnvToolsExt.so.1"
152
150
" $LIBGOMP_PATH "
153
151
)
154
152
DEPS_SONAME=(
155
- " libcudart.so.11.0"
156
- " libnvToolsExt.so.1"
157
153
" libgomp.so.1"
158
154
)
159
155
@@ -171,6 +167,8 @@ elif [[ $CUDA_VERSION == "11.7" ]]; then
171
167
" /usr/local/cuda/lib64/libcublasLt.so.11"
172
168
" /usr/local/cuda/lib64/libnvrtc.so.11.2" # this is not a mistake for 11.7, it links to 11.7.50
173
169
" /usr/local/cuda/lib64/libnvrtc-builtins.so.11.7"
170
+ " /usr/local/cuda/lib64/libcudart.so.11.0"
171
+ " /usr/local/cuda/lib64/libnvToolsExt.so.1"
174
172
)
175
173
DEPS_SONAME+=(
176
174
" libcudnn_adv_infer.so.8"
@@ -184,21 +182,33 @@ elif [[ $CUDA_VERSION == "11.7" ]]; then
184
182
" libcublasLt.so.11"
185
183
" libnvrtc.so.11.2"
186
184
" libnvrtc-builtins.so.11.7"
185
+ " libcudart.so.11.0"
186
+ " libnvToolsExt.so.1"
187
187
)
188
188
else
189
- echo " Using cudnn, cublas, nccl, and nvrtc from pypi."
189
+ echo " Using nvidia libs from pypi."
190
190
CUDA_RPATHS=(
191
191
' $ORIGIN/../../nvidia/cublas/lib'
192
+ ' $ORIGIN/../../nvidia/cuda_cupti/lib'
192
193
' $ORIGIN/../../nvidia/cuda_nvrtc/lib'
194
+ ' $ORIGIN/../../nvidia/cuda_runtime/lib'
193
195
' $ORIGIN/../../nvidia/cudnn/lib'
196
+ ' $ORIGIN/../../nvidia/cufft/lib'
197
+ ' $ORIGIN/../../nvidia/curand/lib'
198
+ ' $ORIGIN/../../nvidia/cusolver/lib'
199
+ ' $ORIGIN/../../nvidia/cusparse/lib'
194
200
' $ORIGIN/../../nvidia/nccl/lib'
201
+ ' $ORIGIN/../../nvidia/nvtx/lib'
195
202
)
196
203
CUDA_RPATHS=$( IFS=: ; echo " ${CUDA_RPATHS[*]} " )
197
204
export C_SO_RPATH=$CUDA_RPATHS ' :$ORIGIN:$ORIGIN/lib'
198
205
export LIB_SO_RPATH=$CUDA_RPATHS ' :$ORIGIN'
199
206
export FORCE_RPATH=" --force-rpath"
200
207
export USE_STATIC_NCCL=0
201
208
export USE_SYSTEM_NCCL=1
209
+ export ATEN_STATIC_CUDA=0
210
+ export USE_CUDA_STATIC_LINK=0
211
+ export USE_CUPTI_SO=1
202
212
fi
203
213
else
204
214
echo " Unknown cuda version $CUDA_VERSION "
0 commit comments