Thanks. Below is our current build script. It seems like this is giving some improved performance. Based on these settings, do you have any other advice / suggested changes?
#!/bin/bash
module load mkl/2020.0
module load intel/19.0.4
module load impi/2019.8
export NWCHEM_TOP=$(pwd)
export NWCHEM_TARGET=LINUX64
export USE_MPI=y
export USE_MPIF=y
export USE_MPIF4=y
export ARMCI_NETWORK=MPI-PR
export PSM2_MEMORY=large
export HAS_BLAS=y
export BLAS_SIZE=8
export BLASOPT="-L${MKLROOT}/lib/intel64 -lmkl_intel_ilp64 -lmkl_intel_thread -lmkl_core -liomp5 -lpthread -lm -ldl"
export HAS_LAPACK=y
export USE_LAPACK=y
export LAPACK_SIZE=8
export LAPACK_LIB="$BLASOPT"
export LAPACK_LIBS="$BLASOPT"
export LAPACKOPT="$BLASOPT"
export HAS_SCALAPACK=y
export USE_SCALAPACK=y
export SCALAPACK_SIZE=8
export SCALAPACK="-L${MKLROOT}/lib/intel64 -lmkl_scalapack_ilp64 -lmkl_intel_ilp64 -lmkl_intel_thread -lmkl_core -lmkl_blacs_intelmpi_ilp64 -liomp5 -lpthread -lm -ldl"
export SCALAPACK_LIB="$SCALAPACK"
export SCALAPACK_LIBS="$SCALAPACK"
export NWCHEM_MODULES=all
export NWCHEM_LONG_PATHS=y
export USE_NOFSCHECK=y
export LARGE_FILES=y
export USE_OPENMP=y
#export PYTHONHOME=/usr
#export PYTHONVERSION=2.7
#export PYTHONLIBTYPE=so
#export USE_PYTHON64=y
#export MPI_LOC="/usr/tce/packages/impi/impi-2019.8-intel-19.0.4/"
#export MPI_INCLUDE="$MPI_LOC/include/gfortran/9.1.0 -I$MPI_LOC/include"
#export MPI_LIB="$MPI_LOC/lib/release_mt -L$MPI_LOC/lib"
#export LIBMPI="-lmpifort -lmpi -lmpigi -ldl -lrt -lpthread"
#export CC=icc
export FC=ifort
export USE_64TO32=y
cd $NWCHEM_TOP/src
#make -j realclean
make -j nwchem_config
make -j 64_to_32
make -j FC=ifort
cd $NWCHEM_TOP/src/tools
make -j FC=ifort version
make -j FC=ifort
cd $NWCHEM_TOP/src
make -j FC=ifort link