Skip to content

Commit

Permalink
Update default CUDA Toolkit version to 12.5.1
Browse files Browse the repository at this point in the history
This updates CUDA for both TF and XLA. It also enables the CUDA driver forward
compatibility mode for XLA since XLA's CUDA graph integration needs a newer
driver version.

PiperOrigin-RevId: 673974335
  • Loading branch information
beckerhe authored and Google-ML-Automation committed Sep 12, 2024
1 parent 0116756 commit 29048bb
Show file tree
Hide file tree
Showing 4 changed files with 9 additions and 10 deletions.
2 changes: 1 addition & 1 deletion .bazelrc
Original file line number Diff line number Diff line change
Expand Up @@ -219,7 +219,7 @@ build:cuda --repo_env TF_NEED_CUDA=1
build:cuda --crosstool_top=@local_config_cuda//crosstool:toolchain
build:cuda --@local_config_cuda//:enable_cuda
# Default CUDA and CUDNN versions.
-build:cuda --repo_env=HERMETIC_CUDA_VERSION="12.3.2"
+build:cuda --repo_env=HERMETIC_CUDA_VERSION="12.5.1"
build:cuda --repo_env=HERMETIC_CUDNN_VERSION="9.3.0"
# This flag is needed to include CUDA libraries.
build:cuda --@local_config_cuda//cuda:include_cuda_libs=true
Expand Down
13 changes: 6 additions & 7 deletions build_tools/ci/build.py
Original file line number Diff line number Diff line change
Expand Up @@ -216,14 +216,13 @@ def nvidia_gpu_build_with_compute_capability(
test_tag_filters=("-no_oss", "requires-gpu-nvidia", "gpu")
+ extra_gpu_tags,
build_tag_filters=("-no_oss", "requires-gpu-nvidia", "gpu"),
-options=dict(
-run_under="//tools/ci_build/gpu_build:parallel_gpu_execute",
-repo_env=f"TF_CUDA_COMPUTE_CAPABILITIES={compute_capability/10}",
+options={
+"run_under": "//tools/ci_build/gpu_build:parallel_gpu_execute",
+"repo_env": f"TF_CUDA_COMPUTE_CAPABILITIES={compute_capability/10}",
+"@cuda_driver//:enable_forward_compatibility": "true",
 **_DEFAULT_BAZEL_OPTIONS,
-),
-extra_setup_commands=(
-["nvidia-smi"],
-),
+},
+extra_setup_commands=(["nvidia-smi"],),
)


Expand Down
2 changes: 1 addition & 1 deletion build_tools/ci/golden_commands.txt
Original file line number Diff line number Diff line change
Expand Up @@ -19,7 +19,7 @@ $KOKORO_ARTIFACTS_DIR/github/xla/.kokoro/generate_index_html.sh index.html
nvidia-smi
parallel --ungroup --retries 3 --delay 15 docker pull ::: gcr.io/tensorflow-sigs/build:latest-python3.11
docker run --detach --name=xla_ci --rm --interactive --tty --volume=./github:/github --workdir=/github/xla gcr.io/tensorflow-sigs/build:latest-python3.11 bash
-docker exec xla_ci bazel test --build_tag_filters=-no_oss,requires-gpu-nvidia,gpu --test_tag_filters=-no_oss,requires-gpu-nvidia,gpu,requires-gpu-sm75-only,requires-gpu-sm60,requires-gpu-sm70,-requires-gpu-sm80,-requires-gpu-sm80-only,-requires-gpu-sm90,-requires-gpu-sm90-only,-requires-gpu-amd --config=warnings --config=rbe_linux_cuda_nvcc --run_under=//tools/ci_build/gpu_build:parallel_gpu_execute --repo_env=TF_CUDA_COMPUTE_CAPABILITIES=7.5 --test_output=errors --verbose_failures --keep_going --nobuild_tests_only --profile=profile.json.gz --flaky_test_attempts=3 --jobs=150 --bes_upload_mode=fully_async -- //xla/... //build_tools/... @tsl//tsl/...
+docker exec xla_ci bazel test --build_tag_filters=-no_oss,requires-gpu-nvidia,gpu --test_tag_filters=-no_oss,requires-gpu-nvidia,gpu,requires-gpu-sm75-only,requires-gpu-sm60,requires-gpu-sm70,-requires-gpu-sm80,-requires-gpu-sm80-only,-requires-gpu-sm90,-requires-gpu-sm90-only,-requires-gpu-amd --config=warnings --config=rbe_linux_cuda_nvcc --run_under=//tools/ci_build/gpu_build:parallel_gpu_execute --repo_env=TF_CUDA_COMPUTE_CAPABILITIES=7.5 --@cuda_driver//:enable_forward_compatibility=true --test_output=errors --verbose_failures --keep_going --nobuild_tests_only --profile=profile.json.gz --flaky_test_attempts=3 --jobs=150 --bes_upload_mode=fully_async -- //xla/... //build_tools/... @tsl//tsl/...
docker exec xla_ci bazel analyze-profile profile.json.gz
docker stop xla_ci
# END BuildType.GPU
Expand Down
2 changes: 1 addition & 1 deletion third_party/tsl/.bazelrc
Original file line number Diff line number Diff line change
Expand Up @@ -219,7 +219,7 @@ build:cuda --repo_env TF_NEED_CUDA=1
build:cuda --crosstool_top=@local_config_cuda//crosstool:toolchain
build:cuda --@local_config_cuda//:enable_cuda
# Default CUDA and CUDNN versions.
-build:cuda --repo_env=HERMETIC_CUDA_VERSION="12.3.2"
+build:cuda --repo_env=HERMETIC_CUDA_VERSION="12.5.1"
build:cuda --repo_env=HERMETIC_CUDNN_VERSION="9.3.0"
# This flag is needed to include CUDA libraries.
build:cuda --@local_config_cuda//cuda:include_cuda_libs=true
Expand Down

0 comments on commit 29048bb

Please sign in to comment.