Skip to content

Commit

Permalink
Intel/CI: Add OneCCL CPU tests with DSA + shm to the CI
Browse files Browse the repository at this point in the history
- Add OneCCL DSA stage.
- Fix a mismatch where libfabric was built with ze while oneccl was built without it.
This led to a failure, and the CCL transport was switched to MPI, because oneccl looked for the library.
To avoid this, build.py now adds an else case that passes --with-ze=no when gpu is not set.

Signed-off-by: Juee Himalbhai Desai <[email protected]>
  • Loading branch information
Juee14Desai authored and zachdworkin committed Mar 20, 2024
1 parent 5e11910 commit cc1c950
Show file tree
Hide file tree
Showing 2 changed files with 14 additions and 8 deletions.
20 changes: 12 additions & 8 deletions contrib/intel/jenkins/Jenkinsfile
Original file line number Diff line number Diff line change
Expand Up @@ -694,18 +694,22 @@ pipeline {
}
}
}
stage ('oneCCL') {
stage ('oneCCL') {
steps {
script {
dir (RUN_LOCATION) {
run_middleware([["verbs", null]], "oneCCL",
run_middleware([["verbs", null]], "oneCCL",
"oneccl", "water", "squirtle,totodile", "2")
run_middleware([["shm", null]], "oneCCL",
"oneccl", "grass", "bulbasaur", "1")
run_middleware([["psm3", null]], "oneCCL",
"oneccl", "water", "squirtle", "2")
run_middleware([["tcp", null]], "oneCCL",
"oneccl", "grass", "bulbasaur", "2")
run_middleware([["shm", null]], "oneCCL",
"oneccl", "grass", "bulbasaur", "1")
run_middleware([["psm3", null]], "oneCCL",
"oneccl", "water", "squirtle", "2")
run_middleware([["tcp", null]], "oneCCL",
"oneccl", "grass", "bulbasaur", "2")
run_middleware([["shm", null]], "oneCCL_DSA",
"oneccl", "electric", "pikachu", "1", null, null,
"""CCL_ATL_SHM=1 FI_SHM_DISABLE_CMA=1 \
FI_SHM_USE_DSA_SAR=1 FI_LOG_LEVEL=warn""")
}
}
}
Expand Down
2 changes: 2 additions & 0 deletions contrib/intel/jenkins/build.py
Original file line number Diff line number Diff line change
Expand Up @@ -36,6 +36,8 @@ def build_libfabric(libfab_install_path, mode, hw_type, gpu=False, cuda=False):

if (gpu):
config_cmd.append('--enable-ze-dlopen')
else:
config_cmd.append('--with-ze=no')

if (cuda):
config_cmd.append(f'--with-cuda={os.environ["CUDA_INSTALL"]}')
Expand Down

0 comments on commit cc1c950

Please sign in to comment.