Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
28 changes: 12 additions & 16 deletions .github/workflows/nightly_tests.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -24,6 +24,7 @@ permissions:

env:
  # Network/subnetwork flags assembled from repository secrets.
  CLUSTER_NETWORK_ARGUMENTS: >-
    --network=${{secrets.NETWORK_NAME}}
    --subnetwork=${{secrets.SUBNETWORK_NAME}}
  # Same network, but with the DWS-specific subnetwork secret; passed to the
  # DWS flex cluster-create step through --custom-cluster-arguments.
  CLUSTER_NETWORK_ARGUMENTS_DWS: >-
    --network=${{secrets.NETWORK_NAME}}
    --subnetwork=${{secrets.SUBNETWORK_NAME_DWS}}

jobs:
build_wheel:
Expand All @@ -39,7 +40,8 @@ jobs:
env:
  # Cluster and workload names shared by the steps of this job.
  EMPTY_CLUSTER_NAME: nightly-xpk-zero-nodepools
  PRIVATE_CLUSTER_NAME: nightly-xpk-private-2-v4-8-nodepools
  # NOTE(review): this name says "v4-8" but the DWS flex steps request
  # --tpu-type=v5p-8 — confirm whether the name should be updated.
  DWS_FLEX_CLUSTER_NAME: xpk-dws-nightly-test-2-v4-8
  # Defined exactly once: a second TPU_CLUSTER_NAME entry would be a duplicate
  # mapping key, which is invalid YAML.
  TPU_CLUSTER_NAME: nightly-xpk-2-v5p-8-nodepools
  # run_attempt keeps the workload name distinct across re-runs of the same run.
  WORKLOAD_NAME: xpktest-nightly-${{ github.run_attempt }}
steps:
- uses: actions/download-artifact@v4
Expand Down Expand Up @@ -140,6 +142,14 @@ jobs:
# Teardown of the TPU cluster; `always()` makes the step run even when an
# earlier step in the job has failed.
- name: Delete the cluster created
  if: always()
  run: >-
    xpk cluster delete
    --cluster $TPU_CLUSTER_NAME
    --zone=us-central2-b
    --force
# Creates a single-slice v5p-8 cluster in us-east5-a with the --flex option,
# using the DWS network arguments from the workflow-level env.
- name: Create a DWS flex queued xpk cluster
  run: >-
    xpk cluster create
    --cluster ${DWS_FLEX_CLUSTER_NAME}
    --tpu-type=v5p-8
    --num-slices=1
    --zone=us-east5-a
    --default-pool-cpu-num-nodes=2
    --flex
    --custom-cluster-arguments="${CLUSTER_NETWORK_ARGUMENTS_DWS}"
# Submits a trivial `echo foo` workload to the DWS flex cluster; the workload
# name embeds the run attempt and a "-dws" suffix.
- name: Run dws flex queued TPU workload
  run: >-
    xpk workload create
    --workload xpktest-build-${{ github.run_attempt }}-dws
    --cluster ${DWS_FLEX_CLUSTER_NAME}
    --zone=us-east5-a
    --tpu-type=v5p-8
    --flex
    --command "echo foo"
    --num-slices=1
# Waits on the DWS workload submitted under the same name, with --timeout 1000.
- name: Wait for workload completion and confirm it succeeded
  run: >-
    xpk workload list
    --cluster ${DWS_FLEX_CLUSTER_NAME}
    --zone=us-east5-a
    --wait-for-job-completion xpktest-build-${{ github.run_attempt }}-dws
    --timeout 1000
# Teardown of the DWS flex cluster.
# - `if: always()` runs the delete even when cluster creation or the workload
#   steps failed, so a failed nightly run does not leave the cluster behind.
# - --zone matches the zone the cluster was created in (us-east5-a), and
#   --force is passed as in the TPU cluster teardown step of this job
#   (presumably to skip the interactive confirmation — verify against xpk docs).
- name: Delete the DWS flex queued cluster
  if: always()
  run: xpk cluster delete --cluster ${DWS_FLEX_CLUSTER_NAME} --zone=us-east5-a --force
- name: Upload cluster nodepool creation log
if: always()
uses: actions/upload-artifact@v4
Expand Down Expand Up @@ -343,22 +353,8 @@ jobs:
location: '${{needs.set-variables.outputs.location}}'
run-id: '${{needs.set-variables.outputs.run-id}}'
secrets: inherit
# Calls the reusable workload-test workflow after cluster-create and
# set-variables, forwarding the values computed by set-variables.
workloads-tests:
  needs:
    - cluster-create
    - set-variables
  uses: ./.github/workflows/reusable_workload_tests.yaml
  # We support one build or nightly test to run at a time currently.
  concurrency:
    group: 'workload-tests-${{needs.set-variables.outputs.run-id}}'
    cancel-in-progress: true
  with:
    cluster-name: '${{needs.set-variables.outputs.cluster-name}}'
    cluster-name-dws: '${{needs.set-variables.outputs.cluster-name-dws}}'
    tpu-type: '${{needs.set-variables.outputs.tpu-type}}'
    tpu-type-topology: '${{needs.set-variables.outputs.tpu-type-topology}}'
    zone: '${{needs.set-variables.outputs.zone}}'
    run-id: '${{needs.set-variables.outputs.run-id}}'
  secrets: inherit
storage-tests:
needs: [cluster-create, set-variables, workloads-tests]
needs: [cluster-create, set-variables]
uses: ./.github/workflows/reusable_storage_tests.yaml
concurrency: # We support one build or nightly test to run at a time currently.
group: storage-tests-${{needs.set-variables.outputs.run-id}}
Expand Down
127 changes: 0 additions & 127 deletions .github/workflows/reusable_workload_tests.yaml

This file was deleted.

Loading