From a4987ba326949b230c05368c0095ff8a1198098f Mon Sep 17 00:00:00 2001 From: Jean-Baptiste Dalido Date: Thu, 12 Sep 2024 15:05:10 +0000 Subject: [PATCH] build/ci: enable bazel remote caching --- .github/runs-on.yml | 11 +++++++++++ .github/workflows/build.yaml | 15 +++++++++------ 2 files changed, 20 insertions(+), 6 deletions(-) create mode 100644 .github/runs-on.yml diff --git a/.github/runs-on.yml b/.github/runs-on.yml new file mode 100644 index 0000000..179a167 --- /dev/null +++ b/.github/runs-on.yml @@ -0,0 +1,11 @@ +images: + ubuntu24-amd64: + platform: "linux" + arch: "amd64" + ami: "ami-04a92520784b93e73" + preinstall: | + #!/bin/bash + wget https://github.com/jbdalido/bazel-remote/releases/download/test/bazel-remote -O /usr/local/bin/bzlcache + chmod +x /usr/local/bin/bzlcache + echo "Run bazel cache" + systemd-run --property=Restart=always /usr/local/bin/bzlcache --max_size=1000 --grpc_address 127.0.0.1:15501 --dir=/tmp/cache --s3.region eu-west-3 --s3.bucket runs-on-s3bucketcache-jycgicewbssh --s3.auth_method iam_role --s3.prefix cache --s3.endpoint=s3.eu-west-3.amazonaws.com --storage_mode uncompressed \ No newline at end of file diff --git a/.github/workflows/build.yaml b/.github/workflows/build.yaml index 3217fb3..4d3b305 100644 --- a/.github/workflows/build.yaml +++ b/.github/workflows/build.yaml @@ -74,21 +74,21 @@ jobs: config: "--config=cuda" artifact: libpjrt_c_api_gpu_plugin.so renamed_artifact: libpjrt_cuda.so - runs_on: ['runs-on','runner=32cpu-linux-x64'] + runs_on: ['runs-on','runner=32cpu-linux-x64', 'image=ubuntu24-amd64'] platform: linux-amd64 bazel_target: //xla/pjrt/c:pjrt_c_api_gpu_plugin - target: rocm config: "--config=rocm" artifact: libpjrt_c_api_gpu_plugin.so renamed_artifact: libpjrt_rocm.so - runs_on: ['runs-on','runner=32cpu-linux-x64'] + runs_on: ['runs-on','runner=32cpu-linux-x64', 'image=ubuntu24-amd64'] platform: linux-amd64 bazel_target: //xla/pjrt/c:pjrt_c_api_gpu_plugin - target: cpu config: "" artifact: libpjrt_c_api_cpu_plugin.so renamed_artifact: libpjrt_cpu.so - runs_on: ['runs-on','runner=32cpu-linux-x64'] + runs_on: ['runs-on','runner=32cpu-linux-x64', 'image=ubuntu24-amd64'] platform: linux-amd64 bazel_target: //xla/pjrt/c:pjrt_c_api_cpu_plugin @@ -99,25 +99,28 @@ jobs: - name: Setup Bazel run: | - wget https://github.com/bazelbuild/bazelisk/releases/download/v1.20.0/bazelisk-linux-amd64 -O /usr/local/bin/bazel - chmod +x /usr/local/bin/bazel + wget https://github.com/bazelbuild/bazelisk/releases/download/v1.20.0/bazelisk-linux-amd64 -O ~/bin/bazel + chmod +x ~/bin/bazel - name: Force remove container run: | docker rm -f pjrt-${{ matrix.pjrt.target }} - name: "Build ${{ matrix.pjrt.target }} ${{ matrix.pjrt.platform }} image" - run: bazel run //${{ matrix.pjrt.target }}:${{ matrix.pjrt.target }}_stripped_tarball + run: | + ~/bin/bazel run //${{ matrix.pjrt.target }}:${{ matrix.pjrt.target }}_stripped_tarball - name: "Run ${{ matrix.pjrt.target }} ${{ matrix.pjrt.platform }} image" run: | docker run \ --name=pjrt-${{ matrix.pjrt.target }} \ -w=/xla \ + --net=host \ -v=/tmp/cache:/tmp/cache \ distroless/${{ matrix.pjrt.target }}_builder:latest \ bazelisk \ build \ + --remote_cache=grpc://127.0.0.1:15501 \ --disk_cache=/tmp/cache \ ${{ matrix.pjrt.config }} --repo_env=HERMETIC_PYTHON_VERSION=3.11 \ ${{ matrix.pjrt.bazel_target }}