diff --git a/.ci/docker/conda/build.sh b/.ci/docker/conda/build.sh index 6e8a1c37ff9fb..b613e195ade0d 100755 --- a/.ci/docker/conda/build.sh +++ b/.ci/docker/conda/build.sh @@ -37,6 +37,12 @@ esac ( set -x + # TODO: Remove LimitNOFILE=1048576 patch once https://github.com/pytorch/test-infra/issues/5712 + # is resolved. This patch is required in order to fix timing out of Docker build on Amazon Linux 2023. + sudo sed -i s/LimitNOFILE=infinity/LimitNOFILE=1048576/ /usr/lib/systemd/system/docker.service + sudo systemctl daemon-reload + sudo systemctl restart docker + docker build \ --target final \ --progress plain \ diff --git a/.ci/docker/manywheel/Dockerfile b/.ci/docker/manywheel/Dockerfile index 39b5d04b4d20a..a4fb127d178e2 100644 --- a/.ci/docker/manywheel/Dockerfile +++ b/.ci/docker/manywheel/Dockerfile @@ -10,6 +10,7 @@ ENV LANG en_US.UTF-8 ENV LANGUAGE en_US.UTF-8 ARG DEVTOOLSET_VERSION=9 + # Note: This is required patch since CentOS have reached EOL # otherwise any yum install setp will fail RUN sed -i s/mirror.centos.org/vault.centos.org/g /etc/yum.repos.d/*.repo diff --git a/.ci/docker/manywheel/build.sh b/.ci/docker/manywheel/build.sh index 0cfb88ef72fb6..2ea02c4eb1d00 100755 --- a/.ci/docker/manywheel/build.sh +++ b/.ci/docker/manywheel/build.sh @@ -124,7 +124,14 @@ if [[ -n ${MANY_LINUX_VERSION} && -z ${DOCKERFILE_SUFFIX} ]]; then fi ( set -x - DOCKER_BUILDKIT=1 docker build \ + + # TODO: Remove LimitNOFILE=1048576 patch once https://github.com/pytorch/test-infra/issues/5712 + # is resolved. This patch is required in order to fix timing out of Docker build on Amazon Linux 2023. + sudo sed -i s/LimitNOFILE=infinity/LimitNOFILE=1048576/ /usr/lib/systemd/system/docker.service + sudo systemctl daemon-reload + sudo systemctl restart docker + + DOCKER_BUILDKIT=1 docker build \ ${DOCKER_GPU_BUILD_ARG} \ --build-arg "GPU_IMAGE=${GPU_IMAGE}" \ --target "${TARGET}" \ diff --git a/.github/workflows/build-conda-images.yml b/.github/workflows/build-conda-images.yml index 4962276321cc6..4d2f146a7577d 100644 --- a/.github/workflows/build-conda-images.yml +++ b/.github/workflows/build-conda-images.yml @@ -32,7 +32,7 @@ concurrency: jobs: build-docker: environment: ${{ (github.ref == 'refs/heads/main' || startsWith(github.event.ref, 'refs/tags/v')) && 'docker-build' || '' }} - runs-on: am2.linux.9xlarge.ephemeral + runs-on: linux.9xlarge.ephemeral strategy: matrix: cuda_version: ["11.8", "12.1", "12.4", "cpu"] diff --git a/.github/workflows/build-manywheel-images.yml b/.github/workflows/build-manywheel-images.yml index 750ee99d52e38..7ecf278c58575 100644 --- a/.github/workflows/build-manywheel-images.yml +++ b/.github/workflows/build-manywheel-images.yml @@ -45,7 +45,7 @@ jobs: build-docker-cuda: environment: ${{ (github.ref == 'refs/heads/main' || startsWith(github.event.ref, 'refs/tags/v')) && 'docker-build' || '' }} needs: get-label-type - runs-on: "${{ needs.get-label-type.outputs.label-type }}am2.linux.9xlarge.ephemeral" + runs-on: "${{ needs.get-label-type.outputs.label-type }}linux.9xlarge.ephemeral" strategy: matrix: cuda_version: ["12.4", "12.1", "11.8"] @@ -156,7 +156,7 @@ jobs: build-docker-rocm: environment: ${{ (github.ref == 'refs/heads/main' || startsWith(github.event.ref, 'refs/tags/v')) && 'docker-build' || '' }} needs: get-label-type - runs-on: "${{ needs.get-label-type.outputs.label-type }}am2.linux.9xlarge.ephemeral" + runs-on: "${{ needs.get-label-type.outputs.label-type }}linux.9xlarge.ephemeral" strategy: matrix: rocm_version: ["6.1", "6.2"] @@ -192,7 +192,7 @@ jobs: build-docker-cpu: environment: ${{ (github.ref == 'refs/heads/main' || startsWith(github.event.ref, 'refs/tags/v')) && 'docker-build' || '' }} needs: get-label-type - runs-on: "${{ needs.get-label-type.outputs.label-type }}am2.linux.9xlarge.ephemeral" + runs-on: "${{ needs.get-label-type.outputs.label-type }}linux.9xlarge.ephemeral" steps: - name: Checkout PyTorch uses: pytorch/pytorch/.github/actions/checkout-pytorch@main