-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathSingularity20210202
122 lines (116 loc) · 5.37 KB
/
Singularity20210202
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
Bootstrap:docker
From:nvcr.io/nvidia/cuda:11.1.1-cudnn8-devel-centos8
%environment
export KERAS_BACKEND=tensorflow
export PATH=/usr/local/cuda/bin:$PATH
export LD_LIBRARY_PATH=/usr/local/cuda-11.0/lib64:/usr/local/cuda-11.1/lib64:/usr/local/cuda-11.2/lib64
%files
nv-tensorrt-repo-rhel7-cuda11.1-trt7.2.2.3-ga-20201211-1-1.x86_64.rpm
%post
# General Python packages
CUDA_VERSION=11-1
NVML_VERSION=7
#old numpy restrictions <1.19.0,>=1.16.0
PYTHON3_PACKAGES="setuptools>=41.0.0 keras pillow scikit-learn pandas pandas_ml matplotlib>=3.0.0 mxnet mlxtend tensorboard jupyter jupyterlab"
yum install -y epel-release dnf-plugins-core
curl https://copr.fedorainfracloud.org/coprs/vbatts/bazel/repo/epel-7/vbatts-bazel-epel-8.repo -o /etc/yum.repos.d/vbatts-bazel-epel-8.repo
yum clean all && yum makecache
dnf config-manager -y --set-enabled powertools
yum install -y @"Development Tools"
yum install -y libgomp cmake3 vim git
yum install -y http://developer.download.nvidia.com/compute/machine-learning/repos/rhel8/x86_64/nvidia-machine-learning-repo-rhel8-1.0.0-1.x86_64.rpm
# misc cuda stuff
#dnf install -y libcublas-devel-* libcublas-*
yum install -y libcublas-devel-$CUDA_VERSION libcublas-$CUDA_VERSION libcufft-$CUDA_VERSION libcufft-devel-$CUDA_VERSION libcurand-$CUDA_VERSION libcurand-devel-$CUDA_VERSION libcusolver-$CUDA_VERSION libcusolver-devel-$CUDA_VERSION libcusparse-$CUDA_VERSION libcusparse-devel-$CUDA_VERSION
#yum install -y libcufft-* libcufft-devel-* libcurand-* libcurand-devel* libcusolver-* libcusolver-devel* libcusparse-* libcusparse-devel-*
yum install -y nv-tensorrt-repo-rhel7-cuda11.1-trt7.2.2.3-ga-20201211-1-1.x86_64.rpm
yum search libnvinfer
yum install -y libnvinfer$NVML_VERSION libnvinfer-plugin$NVML_VERSION libnvparsers$NVML_VERSION libnvonnxparsers$NVML_VERSION libnvinfer-plugin-devel libnvinfer-devel python3-libnvinfer python3-libnvinfer-devel
yum install -y git gcc gcc-c++ sudo curl openblas lapack python3 wget openssl-devel curl-devel libxml2 libxml2-devel python3-devel
alternatives --set python /usr/bin/python3
cd /usr/bin
curl -fL https://releases.bazel.build/3.1.0/release/bazel-3.1.0-linux-x86_64 -o bazel
chmod +x bazel
cd /
# Install all the python bits
wget https://bootstrap.pypa.io/get-pip.py
python3 get-pip.py
#do tensorflow build here
python3 -m pip install numpy wheel
python3 -m pip install keras_preprocessing --no-deps
git clone https://github.com/tensorflow/tensorflow.git
cd tensorflow
git checkout r2.4
export TF_NEED_TENSORRT=1
export TF_NEED_CUDA=1
export TF_CUDA_COMPUTE_CAPABILITIES=6.1,7.0,7.5,8.0
export TF_CUDA_VERSION="$(/usr/local/cuda/bin/nvcc --version | sed -n 's/^.*release \(.*\),.*/\1/p')"
export TF_NEED_JEMALLOC=1
export TF_CUDNN_VERSION="$(sed -n 's/^#define CUDNN_MAJOR\s*\(.*\).*/\1/p' /usr/include/cudnn.h)"
export TF_NCCL_VERSION=2.8.3
export TF_NEED_GCP=0
export TF_NEED_MPI=0
export TF_NEED_HDFS=0
export TF_NEED_OPENCL=0
export TF_ENABLE_XLA=0
export TF_NEED_VERBS=0
export TF_CUDA_CLANG=0
export TF_NEED_MKL=0
export TF_DOWNLOAD_MKL=0
export TF_NEED_AWS=0
export TF_NEED_MPI=0
export TF_NEED_GDR=0
export TF_NEED_S3=0
export TF_NEED_OPENCL_SYCL=0
export TF_SET_ANDROID_WORKSPACE=0
export TF_NEED_COMPUTECPP=0
export TF_NEED_KAFKA=0
export GCC_HOST_COMPILER_PATH=$(which gcc)
export CC_OPT_FLAGS="-march=avx2"
./configure
bazel build --config=cuda //tensorflow/tools/pip_package:build_pip_package
./bazel-bin/tensorflow/tools/pip_package/build_pip_package ./output/tf/
python3 -m pip install ./output/tf/*.whl
cd /
rm -rf /tensorflow
#end tensorflow build
python3 -m pip install $PYTHON3_PACKAGES
# install R
## Turn off nodoc as that ruins R apparently
# sed -i 's/tsflags=nodocs//g' /etc/yum.conf
# or use --setopt=tsflags= to do it per invocation
#dnf config-manager --set-enabled PowerTools
yum install -y --setopt=tsflags= R-core
yum install -y R-core-devel R-devel R-Rcpp R-Rcpp-devel
# R packages
R --no-save <<EOL
install.packages("pkgbuild", repos="https://mirror.las.iastate.edu/CRAN/")
install.packages("devtools", repos="https://mirror.las.iastate.edu/CRAN/")
#options(devtools.install.args = c("--no-multiarch", "--no-test-load", "--no-html","--nodoc"))
#install.packages("tidyselect", repos="https://mirror.las.iastate.edu/CRAN/")
library(devtools)
devtools::install_github("rstudio/tensorflow")
library(tensorflow)
try(devtools::install_github("rstudio/keras"))
library(keras)
EOL
# Pytorch stuff
python3 -m pip install torch torchvision
#hacky library BS to support cuda 11 while providing "10.1" libs
#ln -s /usr/local/cuda/lib64/libcudart.so.11.0 /usr/local/cuda/lib64/libcudart.so.10.1
#ln -s /usr/local/cuda/lib64/libcublas.so.11 /usr/local/cuda/lib64/libcublas.so.10
#ln -s /usr/local/cuda/lib64/libcusparse.so.11 /usr/local/cuda/lib64/libcusparse.so.10
ln -s /usr/lib64/libcudnn.so.8 /usr/lib64/libcudnn.so.7
ln -s /usr/lib64/libcudnn_adv_infer.so.8 /usr/lib64/libcudnn_adv_infer.so.7
ln -s /usr/lib64/libcudnn_adv_train.so.8 /usr/lib64/libcudnn_adv_train.so.7
ln -s /usr/lib64/libcudnn_cnn_infer.so.8 /usr/lib64/libcudnn_cnn_infer.so.7
ln -s /usr/lib64/libcudnn_cnn_train.so.8 /usr/lib64/libcudnn_cnn_train.so.7
ln -s /usr/lib64/libcudnn_ops_infer.so.8 /usr/lib64/libcudnn_ops_infer.so.7
ln -s /usr/lib64/libcudnn_ops_train.so.8 /usr/lib64/libcudnn_ops_train.so.7
#cleanup
yum remove -y nv-tensorrt-repo-rhel7-cuda11.1-trt7.2.2.3-ga-20201211
yum clean all
rm -rf /var/cache/dnf/*
rm -f nv-tensorrt-repo-rhel7-cuda11.1-trt7.2.2.3-ga-20201211-1-1.x86_64.rpm
%runscript
exec $@