Skip to content

Commit

Permalink
Merge pull request #325 from chaitanya1731/gaudi_networking
Browse files (browse the repository at this point in the history)
tests: Gaudi L2 Tests updated for v1.18.0-524
  • Loading branch information
uMartinXu authored Oct 16, 2024
2 parents 4011c07 + 5343099 commit f412cd1
Show file tree
Hide file tree
Showing 3 changed files with 4 additions and 13 deletions.
13 changes: 2 additions & 11 deletions tests/gaudi/l2/hccl_build.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -13,29 +13,20 @@ spec:
output:
to:
kind: ImageStreamTag
name: 'hccl-demo-workload:latest'
name: 'hccl-demo-workload:1.18.0-524'
strategy:
type: Docker
source:
type: Dockerfile
dockerfile: |
ARG BUILDER=vault.habana.ai/gaudi-docker/1.17.1/rhel9.4/habanalabs/pytorch-installer-2.3.1:1.17.1-40
ARG BUILDER=vault.habana.ai/gaudi-docker/1.18.0/rhel9.4/habanalabs/pytorch-installer-2.4.0:1.18.0-524
FROM ${BUILDER} AS builder
WORKDIR /
RUN git clone https://github.com/HabanaAI/hccl_demo.git \
&& cd hccl_demo \
&& make
WORKDIR /
RUN git clone https://github.com/HabanaAI/hccl_ofi_wrapper.git \
&& export LIBFABRIC_ROOT=/opt/habanalabs/libfabric-1.20.0 \
&& cd hccl_ofi_wrapper \
&& make \
&& cp libhccl_ofi_wrapper.so /usr/lib/habanalabs/libhccl_ofi_wrapper.so \
&& ldconfig \
&& export LD_LIBRARY_PATH=$LD_LIBRARY_PATH:/usr/lib/habanalabs/
WORKDIR /hccl_demo
triggers:
- type: ConfigChange
Expand Down
2 changes: 1 addition & 1 deletion tests/gaudi/l2/hccl_job.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -11,7 +11,7 @@ spec:
serviceAccountName: hccl-demo-anyuid-sa
containers:
- name: hccl-demo-workload
-image: image-registry.openshift-image-registry.svc:5000/hccl-demo/hccl-demo-workload:latest
+image: image-registry.openshift-image-registry.svc:5000/hccl-demo/hccl-demo-workload:1.18.0-524
workingDir: "/hccl_demo"
command: ["/bin/bash", "-c", "--"]
## sleep for 20 seconds to avoid race condition
Expand Down
2 changes: 1 addition & 1 deletion tests/gaudi/l2/hl-smi_job.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -10,7 +10,7 @@ spec:
restartPolicy: Never
containers:
- name: hl-smi-workload
-image: vault.habana.ai/gaudi-docker/1.17.1/rhel9.4/habanalabs/pytorch-installer-2.3.1:1.17.1-40
+image: vault.habana.ai/gaudi-docker/1.18.0/rhel9.4/habanalabs/pytorch-installer-2.4.0:1.18.0-524
command: ["hl-smi"]
resources:
limits:
Expand Down

0 comments on commit f412cd1

Please sign in to comment.