-
Notifications
You must be signed in to change notification settings - Fork 18
/
Copy pathmake.sh
70 lines (52 loc) · 2.49 KB
/
make.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
#!/usr/bin/env bash
set -e
TF_INC=$(python -c 'import tensorflow as tf; print(tf.sysconfig.get_include())')
TF_LIB=$(python -c 'import tensorflow as tf; print(tf.sysconfig.get_lib())')
NSYNC_INC=$TF_INC"/external/nsync/public"
# please modify $ARCH according to the following list and your gpu model.
ARCH=sm_52
# If coming across: cudaCheckError() failed : invalid device function. change -arch=sm_xx accordingly.
# Which CUDA capabilities do we want to pre-build for?
# https://developer.nvidia.com/cuda-gpus
# Compute/shader model Cards
# 6.1 P4, P40, Titan X so CUDA_MODEL = 61
# 6.0 P100 so CUDA_MODEL = 60
# 5.2 M40
# 3.7 K80
# 3.5 K40, K20
# 3.0 K10, Grid K520 (AWS G2)
# Other Nvidia shader models should work, but they will require extra startup
# time as the code is pre-optimized for them.
# CUDA_MODELS=30 35 37 52 60 61
if [ "$TF_INC" = "" ]; then
echo "Tensorflow include dir is empty"
return "1"
fi
CUDA_HOME=/usr/local/cuda-10.0/
echo "Configuration variables:"
echo "Tensorflow Include directory: $TF_INC"
echo "Tensorflow Library directory: $TF_LIB"
echo "Nvidia Arch: $ARCH"
read -p "Do you want to continue with the compilation with this configuration (Y/n)?" choice
case "$choice" in
[yY][eE][sS]|y|Y|"" ) CONTINUE="1";;
[nN][oO]|n|N ) CONTINUE="0";;
* ) echo "invalid";;
esac
if [ "$CONTINUE" = "1" ]; then
#if [ ! -f $TF_INC/tensorflow/stream_executor/cuda/cuda_config.h ]; then
#cp ./cuda_config.h $TF_INC/tensorflow/stream_executor/cuda/
cd deform_conv_layer
nvcc -std=c++11 -ccbin=/usr/bin/g++-4.9 -c -o deform_conv.cu.o deform_conv.cu.cc -I $TF_INC -I $NSYNC_INC -D\
GOOGLE_CUDA=1 -x cu -Xcompiler -fPIC -L $CUDA_HOME/lib64 --expt-relaxed-constexpr -arch=$ARCH -DNDEBUG
## if you install tf using already-built binary, or gcc version 4.x, uncomment the three lines below
g++-4.9 -std=c++11 -shared -o deform_conv.so deform_conv.cc deform_conv.cu.o -I\
$TF_INC -I $NSYNC_INC -fPIC -lcudart -L $CUDA_HOME/lib64 -D GOOGLE_CUDA=1 -Wfatal-errors \
-L $TF_LIB -ltensorflow_framework -D_GLIBCXX_USE_CXX11_ABI=0
# for gcc5-built tf
# g++ -std=c++11 -shared -o deform_conv.so deform_conv.cc deform_conv.cu.o \
# -I $TF_INC -I $NSYNC_INC -fPIC -D GOOGLE_CUDA -lcudart -L $CUDA_HOME/lib64 -L $TF_LIB -ltensorflow_framework -D_GLIBCXX_USE_CXX11_ABI=0
cd ..
else
echo "Modify the make.sh file to math your configuration."
fi