Fix cuda install #139
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
name: ParFlow CI Test | |
on: [push, pull_request] | |
jobs: | |
style-check: | |
runs-on: ubuntu-22.04 | |
name: Check Style | |
steps: | |
- name: Checkout commit | |
uses: actions/checkout@v4 | |
- name: Package Install | |
uses: awalsh128/cache-apt-pkgs-action@latest | |
with: | |
packages: curl cmake build-essential tcl-dev tk-dev | |
version: 1.0 | |
execute_install_scripts: true | |
- name: Cache dependencies | |
uses: actions/cache@v4 | |
id: cache-parflow-style-dependencies | |
env: | |
cache-name: cache-parflow-style-dependencies | |
cache-parflow-style-hit: ${{steps.cache-parflow-style-dependencies.outputs.cache-hit}} | |
with: | |
path: "~/depend" | |
key: cache-check-style-${{ secrets.CACHE_VERSION }} | |
- name: Directory Setup | |
run: | | |
mkdir -p $HOME/install | |
# Set necessary vars | |
PARFLOW_DIR="$HOME/install" | |
PARFLOW_DEP_DIR="$HOME/depend" | |
LD_LIBRARY_PATH=${PARFLOW_DEP_DIR}/lib64:${PARFLOW_DEP_DIR}/lib | |
# Create folders | |
mkdir -p ${PARFLOW_DIR} ${PARFLOW_DEP_DIR}/{include,lib} | |
# Verify if paths were correctly set | |
echo "PARFLOW_DIR=${PARFLOW_DIR}" | |
echo "PARFLOW_DEP_DIR=${PARFLOW_DEP_DIR}" | |
echo "LD_LIBRARY_PATH=${LD_LIBRARY_PATH}" | |
# Vars pushed to GITHUB_ENV take effect only on the next CI steps. | |
echo "PARFLOW_DIR=${PARFLOW_DIR}" >> $GITHUB_ENV | |
echo "PARFLOW_DEP_DIR=${PARFLOW_DEP_DIR}" >> $GITHUB_ENV | |
echo "LD_LIBRARY_PATH=${LD_LIBRARY_PATH}" >> $GITHUB_ENV | |
echo "$HOME/depend/bin" >> $GITHUB_PATH | |
echo "$PARFLOW_DIR/bin" >> $GITHUB_PATH | |
- name: Build Uncrustify | |
env: | |
CACHE_HIT: ${{steps.cache-parflow-style-dependencies.outputs.cache-hit}} | |
run: | | |
if [[ "$CACHE_HIT" != 'true' ]]; then | |
echo "cache-check-style-${{ secrets.CACHE_VERSION }}" > $HOME/depend/cache-key | |
curl -L -o uncrustify-0.79.0.tar.gz https://github.com/uncrustify/uncrustify/archive/uncrustify-0.79.0.tar.gz | |
tar -xf uncrustify-0.79.0.tar.gz | |
cd uncrustify-uncrustify-0.79.0 | |
mkdir build | |
cd build | |
cmake -DCMAKE_INSTALL_PREFIX=/usr/local .. | |
make | |
sudo make -j 2 install | |
cd ../.. | |
rm -fr uncrustify-uncrustify-0.79.0 uncrustify-0.79.0.tar.gz | |
fi | |
- name: CMake Install | |
env: | |
CACHE_HIT: ${{steps.cache-parflow-style-dependencies.outputs.cache-hit}} | |
run: | | |
if [[ "$CACHE_HIT" != 'true' ]]; then | |
echo "Installing" | |
mkdir -p $HOME/depend/{include,lib} | |
cd $HOME/depend | |
echo "cache-${{ matrix.config.os }}-${{ matrix.config.backend }}-${{ secrets.CACHE_VERSION }}" > $HOME/depend/cache-key | |
wget -nv --no-check-certificate https://github.com/Kitware/CMake/releases/download/v3.25.1/cmake-3.25.1-linux-x86_64.tar.gz | |
tar -xf cmake-3.25.1-linux-x86_64.tar.gz | |
$HOME/depend/cmake-3.25.1-linux-x86_64/bin/cmake --version | |
echo "$HOME/depend/cmake-3.25.1-linux-x86_64/bin" >> $GITHUB_PATH | |
fi | |
- name: ParFlow CMake Configure | |
run: | | |
cmake -Bbuild -DPARFLOW_ENABLE_PYTHON=ON -DCMAKE_INSTALL_PREFIX=$PARFLOW_DIR | |
- name: ParFlow CMake Build | |
run: (cd build; make -j 2 install) | |
- name: Run Uncrustify | |
run: | | |
./bin/pfformat --check | |
build: | |
name: ${{ matrix.config.name }} | |
runs-on: ${{ matrix.config.os }} | |
strategy: | |
# fail-fast: true | |
matrix: | |
config: | |
- { | |
name: "Ubuntu 24.04 GCC", | |
os: ubuntu-24.04, | |
cudaos: 'ubuntu2404', | |
cc: "gcc", cxx: "g++", fc: "gfortran", | |
python: "false", | |
backend: "none", | |
amps_layer: mpi1, | |
netcdf: "true" | |
} | |
- { | |
name: "Ubuntu 24.04 LLVM", | |
os: ubuntu-24.04, | |
cudaos: 'ubuntu2404', | |
cc: "clang-18", cxx: "clang++-18", fc: "gfortran", | |
python: "false", | |
backend: "none", | |
amps_layer: mpi1, | |
netcdf: "true" | |
} | |
- { | |
name: "Ubuntu 22.04 GCC Python", | |
os: ubuntu-22.04, | |
cudaos: 'ubuntu2204', | |
cc: "gcc", cxx: "g++", fc: "gfortran", | |
python: "true", | |
backend: "none", | |
amps_layer: mpi1, | |
netcdf: "true" | |
} | |
- { | |
name: "Ubuntu 20.04 GCC Python", | |
os: ubuntu-20.04, | |
cudaos: 'ubuntu2004', | |
cc: "gcc", cxx: "g++", fc: "gfortran", | |
python: "true", | |
backend: "none", | |
amps_layer: mpi1, | |
netcdf: "false" | |
} | |
- { | |
name: "Ubuntu 22.04 GCC OMP", | |
os: ubuntu-22.04, | |
cudaos: 'ubuntu2204', | |
cc: "gcc", cxx: "g++", fc: "gfortran", | |
python: "false", | |
backend: "omp", | |
amps_layer: mpi1, | |
netcdf: "false" | |
} | |
- { | |
name: "Ubuntu 24.04 LLVM OASIS3-MCT Build", | |
os: ubuntu-24.04, | |
cudaos: 'ubuntu2204', | |
cc: "clang-18", cxx: "clang++-18", fc: "gfortran", | |
python: "false", | |
backend: "omp", | |
amps_layer: oas3, | |
netcdf: "true" | |
} | |
- { | |
name: "Ubuntu 24.04 GCC CUDA Build", | |
os: ubuntu-24.04, | |
cc: "gcc", cxx: "g++", fc: "gfortran", | |
python: "false", | |
backend: "cuda", | |
cudaos: 'ubuntu2204', | |
amps_layer: mpi1, | |
netcdf: "false" | |
} | |
- { | |
name: "Ubuntu 24.04 GCC Kokkos Build", | |
os: ubuntu-24.04, | |
cc: "gcc", cxx: "g++", fc: "gfortran", | |
python: "false", | |
backend: "kokkos", | |
cudaos: 'ubuntu2204', | |
amps_layer: mpi1, | |
netcdf: "false" | |
} | |
steps: | |
- uses: actions/checkout@v4 | |
- name: Package Install | |
uses: awalsh128/cache-apt-pkgs-action@latest | |
with: | |
packages: gfortran hdf5-helpers tcl-dev tk-dev libcurl4 libcurl4-gnutls-dev | |
version: 1.0 | |
execute_install_scripts: true | |
- name: HDF5 and OpenMPI Install on Ubuntu 22.04 | |
if: matrix.config.os == 'ubuntu-20.04' || matrix.config.os == 'ubuntu-22.04' | |
run: | | |
sudo apt-get -qq update | |
sudo apt -qq install libhdf5-openmpi-103 libhdf5-openmpi-dev | |
# libhdf5-openmpi-103 has been renamed in Ubuntu 24.04. | |
- name: HDF5 and OpenMPI Install on Ubuntu 24.04 | |
if: matrix.config.os == 'ubuntu-24.04' | |
run: | | |
sudo apt-get -qq update | |
sudo apt -qq install libhdf5-openmpi-103-1t64 libhdf5-openmpi-dev | |
- name: LLVM 18.X Install | |
if: matrix.config.cc == 'clang-18' | |
run: | | |
sudo apt -qq install clang-18 libomp-18-dev | |
- name: Python Package Install | |
if: matrix.config.python == 'true' | |
run: | | |
sudo apt-get -qq update | |
sudo apt -qq install python3 python3-venv | |
# Cache dependencies so don't have to rebuild on each test. | |
# Can flush caches by resetting the CACHE_VERSION secret on GitHub | |
# settings for the project (using date-timestamp for secret). | |
- name: Cache dependencies | |
uses: actions/cache@v4 | |
id: cache-parflow-dependencies | |
env: | |
cache-name: cache-parflow-dependencies | |
cache-parflow-hit: ${{steps.cache-parflow-dependencies.outputs.cache-hit}} | |
with: | |
path: "~/depend" | |
key: cache-${{ matrix.config.os }}-${{ matrix.config.backend }}-${{ secrets.CACHE_VERSION }} | |
- name: Directory Setup | |
run: | | |
mkdir -p $HOME/install | |
# Set necessary vars | |
PARFLOW_DIR="$HOME/install" | |
PARFLOW_DEP_DIR="$HOME/depend" | |
LD_LIBRARY_PATH=${PARFLOW_DEP_DIR}/lib64:${PARFLOW_DEP_DIR}/lib | |
# Create folders | |
mkdir -p ${PARFLOW_DIR} ${PARFLOW_DEP_DIR}/{include,lib} | |
# Verify if paths were correctly set | |
echo "PARFLOW_DIR=${PARFLOW_DIR}" | |
echo "PARFLOW_DEP_DIR=${PARFLOW_DEP_DIR}" | |
echo "LD_LIBRARY_PATH=${LD_LIBRARY_PATH}" | |
# Vars pushed to GITHUB_ENV take effect only on the next CI steps. | |
echo "PARFLOW_DIR=${PARFLOW_DIR}" >> $GITHUB_ENV | |
echo "PARFLOW_DEP_DIR=${PARFLOW_DEP_DIR}" >> $GITHUB_ENV | |
echo "LD_LIBRARY_PATH=${LD_LIBRARY_PATH}" >> $GITHUB_ENV | |
echo "$HOME/depend/bin" >> $GITHUB_PATH | |
echo "$PARFLOW_DIR/bin" >> $GITHUB_PATH | |
- name: Configure OpenMPI backend compiler | |
run: | | |
export OMPI_CC=${{ matrix.config.cc }} | |
export OMPI_CXX=${{ matrix.config.cxx }} | |
export OMPI_FC=${{ matrix.config.fc }} | |
echo "OMPI_CC=${{ matrix.config.cc }}" >> $GITHUB_ENV | |
echo "OMPI_CXX=${{ matrix.config.cxx }}" >> $GITHUB_ENV | |
echo "OMPI_FC=${{ matrix.config.fc }}" >> $GITHUB_ENV | |
echo " mpicc: $(mpicc --version | head -n 1)" | |
echo " mpicxx: $(mpicxx --version | head -n 1)" | |
echo "mpifort: $(mpifort --version | head -n 1)" | |
- name: CMake Install | |
env: | |
CACHE_HIT: ${{steps.cache-parflow-dependencies.outputs.cache-hit}} | |
run: | | |
if [[ "$CACHE_HIT" != 'true' ]]; then | |
echo "Installing CMake v3.26.5" | |
cd $HOME/depend | |
echo "cache-${{ matrix.config.os }}-${{ matrix.config.backend }}-${{ secrets.CACHE_VERSION }}" > $HOME/depend/cache-key | |
wget -nv --no-check-certificate https://github.com/Kitware/CMake/releases/download/v3.26.5/cmake-3.26.5-linux-x86_64.tar.gz | |
tar -xf cmake-3.26.5-linux-x86_64.tar.gz | |
$HOME/depend/cmake-3.26.5-linux-x86_64/bin/cmake --version | |
fi | |
echo "$HOME/depend/cmake-3.26.5-linux-x86_64/bin" >> $GITHUB_PATH | |
- name: NVidia Driver Install | |
if: matrix.config.backend == 'cuda' || matrix.config.backend == 'kokkos' | |
run: | | |
sudo add-apt-repository -y ppa:graphics-drivers | |
sudo apt-get update -qq | |
sudo apt-get install -y nvidia-driver-535 | |
- name: CUDA Install | |
if: matrix.config.backend == 'cuda' || matrix.config.backend == 'kokkos' | |
run: | | |
export CUDA_VERSION_MAJOR_MINOR=12.4.0 | |
export CUDA_SHORT=12.4 | |
export CUDA_OS=${{ matrix.config.cudaos }} | |
./bin/install-cuda.sh | |
export CUDA_HOME=/usr/local/cuda-${CUDA_SHORT} | |
echo "CUDA_HOME=${CUDA_HOME}" >> $GITHUB_ENV | |
export LD_LIBRARY_PATH=${CUDA_HOME}/lib64:${LD_LIBRARY_PATH} | |
echo "LD_LIBRARY_PATH=${LD_LIBRARY_PATH}" >> $GITHUB_ENV | |
export LIBRARY_PATH=${CUDA_HOME}/lib64/stubs | |
echo "LIBRARY_PATH=${LIBRARY_PATH}" >> $GITHUB_ENV | |
echo "${CUDA_HOME}/bin" >> $GITHUB_PATH | |
- name: UCX | |
if: matrix.config.backend == 'cuda' || matrix.config.backend == 'kokkos' | |
env: | |
CACHE_HIT: ${{steps.cache-parflow-dependencies.outputs.cache-hit}} | |
run: | | |
if [[ "$CACHE_HIT" != 'true' ]]; then | |
sudo apt install -qq -y autoconf automake libtool | |
URL=https://github.com/openucx/ucx/releases/download/v1.17.0/ucx-1.17.0.tar.gz | |
mkdir ucx | |
cd ucx | |
curl -L $URL | tar --strip-components=1 -xz | |
./contrib/configure-release --with-cuda=$CUDA_HOME --with-java=no --with-go=no --disable-numa --prefix=$PARFLOW_DEP_DIR | |
make -j 2 install | |
fi | |
- name: RMM Install | |
env: | |
CACHE_HIT: ${{steps.cache-parflow-dependencies.outputs.cache-hit}} | |
if: matrix.config.backend == 'cuda' || matrix.config.backend == 'kokkos' | |
run: | | |
if [[ "$CACHE_HIT" != 'true' ]]; then | |
git clone --branch main --single-branch --recurse-submodules https://github.com/rapidsai/rmm.git | |
cd rmm | |
mkdir build | |
cd build | |
cmake .. -DCMAKE_INSTALL_PREFIX=$PARFLOW_DEP_DIR/rmm | |
make -j | |
make install | |
fi | |
echo "RMM_FLAGS=-Drmm_ROOT=$PARFLOW_DEP_DIR/rmm" >> $GITHUB_ENV | |
- name: Kokkos Install | |
env: | |
CACHE_HIT: ${{steps.cache-parflow-dependencies.outputs.cache-hit}} | |
if: matrix.config.backend == 'kokkos' | |
run: | | |
if [[ "$CACHE_HIT" != 'true' ]]; then | |
URL=https://github.com/kokkos/kokkos/archive/refs/tags/4.2.01.tar.gz | |
mkdir kokkos | |
cd kokkos | |
curl -L $URL | tar --strip-components=1 -xz | |
mkdir build | |
cd build | |
cmake .. -DCMAKE_CXX_COMPILER=$(pwd)/../bin/nvcc_wrapper -DCMAKE_INSTALL_PREFIX=$PARFLOW_DEP_DIR -DKokkos_ENABLE_CUDA=On -DKokkos_ENABLE_CUDA_LAMBDA=On -DKokkos_ENABLE_CUDA_UVM=On -DKokkos_ARCH_VOLTA70=On | |
make -j 2 install | |
fi | |
echo "KOKKOS_FLAGS=-DKOKKOS_ROOT=$PARFLOW_DEP_DIR" >> $GITHUB_ENV | |
- name: OpenMPI Install for CUDA | |
env: | |
CACHE_HIT: ${{steps.cache-parflow-dependencies.outputs.cache-hit}} | |
if: matrix.config.backend == 'cuda' || matrix.config.backend == 'kokkos' | |
run: | | |
if [[ "$CACHE_HIT" != 'true' ]]; then | |
URL=https://download.open-mpi.org/release/open-mpi/v4.0/openmpi-4.0.3.tar.gz | |
mkdir openmpi | |
cd openmpi | |
curl -L $URL | tar --strip-components=1 -xz | |
./configure --with-cuda=$CUDA_HOME --with-ucx=$PARFLOW_DEP_DIR --prefix=$PARFLOW_DEP_DIR | |
sudo make -j 2 install | |
cd .. | |
fi | |
sudo ldconfig | |
# Package netcdf is missing features needed by the ParFlow writers, build from source | |
# netcdf is True when we want to build the PF NetCDF writer. OASIS is using the Fortran interface | |
# which is currently not built here. This is currently incompatible with the OASIS build which uses the NetCDF packages. | |
- name: NetCDF Install | |
env: | |
CACHE_HIT: ${{steps.cache-parflow-dependencies.outputs.cache-hit}} | |
if: matrix.config.netcdf == 'true' | |
run: | | |
if [[ "$CACHE_HIT" != 'true' ]]; then | |
URL=https://github.com/Unidata/netcdf-c/archive/v4.9.0.tar.gz | |
mkdir netcdf-c | |
cd netcdf-c | |
curl -L $URL | tar --strip-components=1 -xz | |
CC=mpicc CPPFLAGS=-I/usr/include/hdf5/openmpi LDFLAGS=-L/usr/lib/x86_64-linux-gnu/hdf5/openmpi ./configure --prefix=$PARFLOW_DEP_DIR | |
make | |
make install | |
cd .. | |
URL=https://github.com/Unidata/netcdf-fortran/archive/v4.5.4.tar.gz | |
mkdir netcdf-fortran | |
cd netcdf-fortran | |
curl -L $URL | tar --strip-components=1 -xz | |
CC=mpicc FC=mpifort CPPFLAGS=-I${PARFLOW_DEP_DIR}/include LDFLAGS=-L${PARFLOW_DEP_DIR}/lib ./configure --prefix=${PARFLOW_DEP_DIR} | |
make | |
make install | |
fi | |
echo "NETCDF_FLAGS=-DNETCDF_DIR=$PARFLOW_DEP_DIR -DNETCDF_Fortran_ROOT=$PARFLOW_DEP_DIR -DPARFLOW_ENABLE_HDF5=TRUE" >> $GITHUB_ENV | |
- name: OASIS3-MCT Install | |
env: | |
CACHE_HIT: ${{steps.cache-parflow-dependencies.outputs.cache-hit}} | |
if: matrix.config.amps_layer == 'oas3' | |
run: | | |
if [[ "$CACHE_HIT" != 'true' ]]; then | |
git clone --depth 1 --branch OASIS3-MCT_5.1 https://gitlab.com/cerfacs/oasis3-mct.git | |
cd oasis3-mct | |
export OASIS_ROOT=$(pwd) | |
cd util/make_dir | |
echo 'include $(GITHUB_WORKSPACE)/misc/build_scripts/build.oasis3.ubuntu22.04' > make.inc | |
make realclean static-libs -f TopMakefileOasis3 | |
mv -v ${OASIS_ROOT}/install/include/* ${PARFLOW_DEP_DIR}/include/ | |
mv -v ${OASIS_ROOT}/install/lib/* ${PARFLOW_DEP_DIR}/lib/ | |
fi | |
- name: SILO Install | |
env: | |
CACHE_HIT: ${{steps.cache-parflow-dependencies.outputs.cache-hit}} | |
run: | | |
if [[ "$CACHE_HIT" != 'true' ]]; then | |
URL=https://github.com/LLNL/Silo/archive/refs/tags/4.11.tar.gz | |
mkdir silo | |
cd silo | |
curl -L $URL | tar --strip-components=1 -xz | |
./configure --disable-silex --disable-hzip --disable-fpzip --prefix=$PARFLOW_DEP_DIR | |
make -j 2 install | |
fi | |
- name: HYPRE Install | |
env: | |
CACHE_HIT: ${{steps.cache-parflow-dependencies.outputs.cache-hit}} | |
run: | | |
if [[ "$CACHE_HIT" != 'true' ]]; then | |
URL=https://github.com/hypre-space/hypre/archive/v2.26.0.tar.gz | |
mkdir hypre | |
cd hypre | |
curl -L $URL | tar --strip-components=1 -xz | |
cd src | |
./configure --prefix=$PARFLOW_DEP_DIR | |
make -j 2 install | |
fi | |
- name: ParFlow CMake Configure | |
run: | | |
cat $HOME/depend/cache-key | |
export OMPI_MCA_rmaps_base_oversubscribe=1 | |
export OMP_NUM_THREADS=1 | |
${{ matrix.config.cc }} -v | |
mpicc -v | |
if [[ "${{ matrix.config.amps_layer }}" == "oas3" ]]; then HAVE_CLM="OFF"; else HAVE_CLM="ON"; fi | |
CFLAGS="-Wall -Werror -Wno-unused-result -Wno-unused-function -Wno-stringop-overread" | |
if [[ "${{ matrix.config.cc }}" == "gcc" ]]; then CFLAGS="${CFLAGS} -Wno-stringop-overread"; fi | |
export CC=mpicc CXX=mpicxx F77=mpif77 FC=mpif90 CUDAHOSTCXX=mpicxx | |
cmake -Bbuild \ | |
-DCMAKE_BUILD_TYPE=Release \ | |
-DCMAKE_C_FLAGS=$CFLAGS \ | |
-DPARFLOW_ENABLE_TIMING=TRUE \ | |
-DPARFLOW_AMPS_LAYER=${{ matrix.config.amps_layer }} \ | |
-DMPIEXEC_POSTFLAGS='--oversubscribe' \ | |
-DPARFLOW_ACCELERATOR_BACKEND=${{ matrix.config.backend }} \ | |
-DPARFLOW_AMPS_SEQUENTIAL_IO=true \ | |
-DPARFLOW_HAVE_CLM=${HAVE_CLM} \ | |
-DHYPRE_ROOT=$PARFLOW_DEP_DIR \ | |
-DOAS3_ROOT=$PARFLOW_DEP_DIR \ | |
-DSILO_ROOT=$PARFLOW_DEP_DIR \ | |
-DPARFLOW_ENABLE_PYTHON=${{ matrix.config.python }} \ | |
-DCMAKE_INSTALL_PREFIX=$PARFLOW_DIR \ | |
$NETCDF_FLAGS $KOKKOS_FLAGS $RMM_FLAGS | |
- name: ParFlow CMake Build | |
run: (cd build; make -j 2 install) | |
# Can't test with GPU since have no GPU hardware on testing nodes, GPU test is build only | |
- name: ParFlow CTest | |
if: matrix.config.backend != 'cuda' && matrix.config.backend != 'kokkos' | |
run: | | |
export OMPI_MCA_rmaps_base_oversubscribe=1 | |
export OMP_NUM_THREADS=1 | |
(cd build; ctest --output-on-failure) |