Skip to content

Commit

Permalink
separate horovod ds installation script into two files
Browse files Browse the repository at this point in the history
  • Loading branch information
jarlsondre committed Nov 28, 2024
1 parent 69e1dd2 commit bb815e6
Show file tree
Hide file tree
Showing 2 changed files with 21 additions and 20 deletions.
20 changes: 20 additions & 0 deletions env-files/torch/horovod-deepspeed.slurm
Original file line number Diff line number Diff line change
@@ -0,0 +1,20 @@
#!/bin/bash
#
# Slurm batch job that installs Horovod and DeepSpeed into an existing Python
# virtual environment by running install-horovod-deepspeed-cuda.sh.
#
# Both .venv and install-horovod-deepspeed-cuda.sh are referenced by relative
# path, so the job's working directory (by default the directory sbatch was
# invoked from) must contain both of them.
#
# NOTE: every #SBATCH directive has to stay above the first executable command;
# Slurm stops parsing directives once it reaches one.

# Job configuration
#SBATCH --job-name=setup_venv
#SBATCH --account=intertwin
#SBATCH --output=horovod_ds_installation.out
#SBATCH --error=horovod_ds_installation.err
#SBATCH --time=00:30:00

# Resources allocation
#SBATCH --partition=develbooster
#SBATCH --nodes=1
#SBATCH --gres=gpu

# Start from a clean module environment, then load the toolchain and libraries
# required by the installation.
ml --force purge
ml Stages/2024 GCC OpenMPI CUDA/12 cuDNN MPI-settings/CUDA
ml Python/3.11.3 CMake HDF5 PnetCDF libaio mpi4py git Clang

# Abort if the virtual environment cannot be activated. Without this guard the
# installer would still run and pip would install into whichever Python the
# modules above provide instead of into .venv.
if ! source .venv/bin/activate; then
  printf 'ERROR: could not activate virtual environment %s/.venv\n' "$PWD" >&2
  exit 1
fi

# Last command of the script: its exit status becomes the job's exit status.
bash install-horovod-deepspeed-cuda.sh
21 changes: 1 addition & 20 deletions env-files/torch/install-horovod-deepspeed-cuda.sh
Original file line number Diff line number Diff line change
@@ -1,23 +1,3 @@
#!/bin/bash

# Job configuration
#SBATCH --job-name=setup_venv
#SBATCH --account=intertwin
#SBATCH --output=horovod_ds_installation.out
#SBATCH --error=horovod_ds_installation.err
#SBATCH --time=00:30:00

# Resources allocation
#SBATCH --partition=develbooster
#SBATCH --nodes=1
#SBATCH --gres=gpu

ml --force purge
ml Stages/2024 GCC OpenMPI CUDA/12 cuDNN MPI-settings/CUDA
ml Python/3.11.3 CMake HDF5 PnetCDF libaio mpi4py git Clang

source .venv/bin/activate

# DeepSpeed variables
export DS_BUILD_CCL_COMM=1
export DS_BUILD_UTILS=1
Expand All @@ -28,6 +8,7 @@ export DS_BUILD_TRANSFORMER=1
export DS_BUILD_STOCHASTIC_TRANSFORMER=1
export DS_BUILD_TRANSFORMER_INFERENCE=1

# Use --no-cache-dir: pip's download/build cache would otherwise count against our HPC storage quota.
pip install --no-cache-dir --no-build-isolation "deepspeed==0.15.*"

# Horovod variables
Expand Down

0 comments on commit bb815e6

Please sign in to comment.