Skip to content

Commit

Permalink
Add Ampere GEMM example in Cute and CUTLASS 3.x
Browse files (browse the repository at this point in the history)
  • Loading branch information
aacostadiaz committed Aug 2, 2024
1 parent 8c5841c commit 4c0c974
Show file tree
Hide file tree
Showing 2 changed files with 428 additions and 256 deletions.
13 changes: 5 additions & 8 deletions examples/14_ampere_tf32_tensorop_gemm/CMakeLists.txt
Original file line number Diff line number Diff line change
Expand Up @@ -27,22 +27,19 @@
# OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
# OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.


# Registers the Ampere TF32 tensor-op GEMM example executables, selecting the
# targets according to CUTLASS_ENABLE_SYCL and SYCL_NVIDIA_TARGET.
# cutlass_example_add_executable is defined elsewhere in the project; each call
# here passes a target name followed by one source file.
#
# NOTE(review): this span is a rendered diff (5 additions, 8 deletions) whose
# +/- markers were lost, so removed and added lines are interleaved. As shown
# it contains four opening and five closing parentheses and is not valid CMake;
# check it against the real CMakeLists.txt before relying on it.
if (CUTLASS_ENABLE_SYCL)
if (SYCL_NVIDIA_TARGET)
# NOTE(review): the two calls below name the same target with a .cpp and a .cu
# source and share one closing parenthesis; presumably one is the removed side
# and the other the added side of the diff. TODO confirm which one survives.
cutlass_example_add_executable(
14_ampere_tf32_tensorop_gemm_cute
ampere_tf32_tensorop_gemm_cute.cpp
cutlass_example_add_executable(
14_ampere_tf32_tensorop_gemm_cute
ampere_tf32_tensorop_gemm_cute.cu
)
endif()
else()
# Branch taken when CUTLASS_ENABLE_SYCL is false: adds both the
# 14_ampere_tf32_tensorop_gemm and 14_ampere_tf32_tensorop_gemm_cute targets.
cutlass_example_add_executable(
14_ampere_tf32_tensorop_gemm
ampere_tf32_tensorop_gemm.cu
)
# NOTE(review): the doubled ")" here and after the next call looks like the old
# and new copy of the same line (e.g. a whitespace-only change); TODO confirm.
)

cutlass_example_add_executable(
14_ampere_tf32_tensorop_gemm_cute
ampere_tf32_tensorop_gemm_cute.cu
)
)
endif()
Loading

0 comments on commit 4c0c974

Please sign in to comment.