forked from NVIDIA/cutlass
-
Notifications
You must be signed in to change notification settings - Fork 21
83 lines (75 loc) · 2.83 KB
/
test.yml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
name: "Test"
on:
push:
branches: [ "sycl-develop" ]
pull_request:
branches: [ "sycl-develop" ]
workflow_dispatch:
inputs:
DPCPP_VERSION:
description: "DPCPP version to use"
type: string
permissions: {}
jobs:
run-tests:
name: Run tests
runs-on: cp-nvidia-gpu
timeout-minutes: 30
steps:
- name: Checkout repository
uses: actions/checkout@a5ac7e51b41094c92402da3b24376905380afc29 # v4.1.6
- name: Install dependencies
shell: bash
run: |
nvidia-smi
mkdir ~/dpcpp
pushd ~/dpcpp
echo "Will use DPCPP ${{ inputs.DPCPP_VERSION }}."
if [[ "${{ inputs.DPCPP_VERSION }}" != "" ]]; then \
echo "Downloading DPCPP from https://github.com/intel/llvm/releases/download/${{ inputs.DPCPP_VERSION }}/sycl_linux.tar.gz"; \
wget -q https://github.com/intel/llvm/releases/download/${{ inputs.DPCPP_VERSION }}/sycl_linux.tar.gz; \
else
latest=$(curl -sS https://api.github.com/repos/intel/llvm/releases | jq -r '[.[].tag_name|select(match("nightly-[0-9]{4}-[0-9]{2}-[0-9]{2}"))][0]') && \
echo "Downloading DPCPP from https://github.com/intel/llvm/releases/download/${latest}/sycl_linux.tar.gz"; \
wget -q https://github.com/intel/llvm/releases/download/${latest}/sycl_linux.tar.gz; \
fi
tar -xf sycl_linux.tar.gz
rm sycl_linux.tar.gz
popd
# For a specific DPC++ nightly build define the repository variable DPCPP_VERSION
# for example using the tag: 'nightly-2024-04-22'
- name: Build
shell: bash
run: |
export PATH=~/dpcpp/bin/:$PATH
export C_INCLUDE_PATH=~/dpcpp/include/:$C_INCLUDE_PATH
export CPLUS_INCLUDE_PATH=~/dpcpp/include/:$CPLUS_INCLUDE_PATH
export LD_LIBRARY_PATH=~/dpcpp/lib/:$LD_LIBRARY_PATH
export CC=clang
export CXX=clang++
clang++ --version
cmake -G Ninja \
-DCMAKE_CUDA_HOST_COMPILER=clang++ \
-DCUTLASS_ENABLE_SYCL=ON \
-DDPCPP_SYCL_TARGET=nvptx64-nvidia-cuda \
-DDPCPP_SYCL_ARCH=sm_80
cmake --build .
- name: Unit test
shell: bash
run: |
export LD_LIBRARY_PATH=~/dpcpp/lib/:$LD_LIBRARY_PATH
cmake --build . --target test_unit -j 24
- name: Examples
shell: bash
run: |
export LD_LIBRARY_PATH=~/dpcpp/lib/:$LD_LIBRARY_PATH
echo Run sgemm_1
./examples/cute/tutorial/sgemm_1
echo Run sgemm_2
./examples/cute/tutorial/sgemm_2
echo Run sgemm_sm70
./examples/cute/tutorial/sgemm_sm70
echo Run sgemm_sm80
./examples/cute/tutorial/sgemm_sm80
echo Run tiled_copy
./examples/cute/tutorial/tiled_copy