# gpu
module load cuda/11.1.1
module load nvhpc/22.1
module load openmpi/4.0.5-nvhpc22.1
module load aocl/3.1.0
# module load openblas/0.3.12-gcc10.2.0
# top directory of the NWChem source tree
export NWCHEM_TOP=/ocean/projects/cis210088p/sst/NWChem/gpu_ompi_ARMCI_MPI/nwchem
# your target platform
export NWCHEM_TARGET=LINUX64
export ARMCI_NETWORK=ARMCI-MPI
# General configurations
export USE_MPI=y
export USE_OPENMP=1
export NWCHEM_MODULES=qm
# export BLASOPT="-mkl"
# export BLASOPT="-lcublas"
export BLASOPT="-lblis"
export BLAS_SIZE=8
# export LAPACK_LIB="-lcublas"
export LAPACK_LIB="-lblis -llapack"
export USE_SCALAPACK=y
#! Remember to change
# export SCALAPACK="-lcublas"
export SCALAPACK="-lblis -lscalapack"
# export SCALAPACK="-mkl -lmkl_scalapack_ilp64 -lmkl_blacs_intelmpi_ilp64"
export SCALAPACK_SIZE=8
# For GPU
export FC=nvfortran
export USE_F90_ALLOCATABLE=1
export USE_OPENACC_TRPDRV=1
export NWCHEM_LINK_CUDA=1
# export DEV_GA=1 # optional
export MA_USE_CUDA_MEM=1
export TCE_CUDA=Y
export CUDA=nvcc
export CUDA_LIBS="-L/jet/packages/spack/opt/spack/linux-centos8-zen/gcc-8.3.1/cuda-10.2.89-kz7u4ix6ed53nioz4ycqin3kujcim3bs/lib64/ -lcudart"
export CUDA_FLAGS="-arch sm_70 "
export CUDA_ARCH="-arch sm70"
export CUDA_INCLUDE="-I/jet/packages/spack/opt/spack/linux-centos8-zen/gcc-8.3.1/cuda-10.2.89-kz7u4ix6ed53nioz4ycqin3kujcim3bs/include"
# export OMP_NUM_THREADS=
module load nvhpc/22.1