export HOME=/lustre/atlas/proj-shared/fus117/
cd ~
wget http://developer.download.nvidia.com/compute/redist/cudnn/v5.1/cudnn-7.5-linux-x64-v5.1.tgz
tar -xvf cudnn-7.5-linux-x64-v5.1.tgz
Add the following lines to the submission script:
export LD_LIBRARY_PATH=$HOME/cuda/lib64:$LD_LIBRARY_PATH
export LIBRARY_PATH=$HOME/cuda/lib64:$LIBRARY_PATH
export LDFLAGS=$LDFLAGS:$HOME/cuda/lib64
export INCLUDE=$INCLUDE:$HOME/cuda/include
export CPATH=$CPATH:$HOME/cuda/include
export FFLAGS=$FFLAGS:$HOME/cuda/include
export LOCAL_LDFLAGS=$LOCAL_LDFLAGS:$HOME/cuda/lib64
export LOCAL_INCLUDE=$LOCAL_INCLUDE:$HOME/cuda/include
export LOCAL_CFLAGS=$LOCAL_CFLAGS:$HOME/cuda/include
export LOCAL_FFLAGS=$LOCAL_FFLAGS:$HOME/cuda/include
export LOCAL_CXXFLAGS=$LOCAL_CXXFLAGS:$HOME/cuda/include
Modify LIBRARY_PATH and load the CUDA Toolkit:
module load cudatoolkit
export LIBRARY_PATH=/opt/nvidia/cudatoolkit7.5/7.5.18-1.0502.10743.2.1/lib64:$LIBRARY_PATH
Download and install Anaconda:
wget https://repo.continuum.io/archive/Anaconda2-4.3.1-Linux-x86_64.sh
sh Anaconda2-4.3.1-Linux-x86_64.sh
Do not add PATH to .bashrc - it messes up modules for some reason.
Copy the private SSH key used for GitHub to ~/.ssh/ and register it with the SSH agent:
ssh-add ~/.ssh/olcf_github_rsa
git clone git@github.com:PPPLDeepLearning/plasma-python.git
cd PPPL/plasma-python
Create frnn env:
conda create --name frnn --file requirements.txt
module switch PrgEnv-pgi PrgEnv-gnu
export MPICC=cc
python setup.py install
Doing custom installs with pip --user is OK.
- Make sure to update the paths in conf.yaml.
The mass batch job submission is performed with this script: https://github.com/PPPLDeepLearning/plasma-python/blob/titan_setup/examples/prepare_pbs_configs_titan.py