bugfix: gemm_sm90 compilation error (#589)

The pre-commit hook (#584) reordered the headers, which caused `group_gemm_sm90.cuh` to fail to compile. This PR adds a `// clang-format off` / `// clang-format on` section to preserve the required include order. Related: NVIDIA/cutlass#1827
flashinfer-ai · Nov 6, 2024 · 1328693 · 1328693
1 parent 2332e8a
commit 1328693
Showing 1 changed file with 6 additions and 1 deletion.
diff --git a/include/flashinfer/gemm/group_gemm_sm90.cuh b/include/flashinfer/gemm/group_gemm_sm90.cuh
@@ -16,6 +16,12 @@
 #ifndef FLASHINFER_GEMM_GROUP_GEMM_SM90_CUH_
 #define FLASHINFER_GEMM_GROUP_GEMM_SM90_CUH_
 
+// clang-format off
+// NOTE: This header needs to be included before cutlass headers.
+// See: https://github.com/NVIDIA/cutlass/issues/1827
+#include "group_gemm_cutlass.cuh"
+// clang-format on
+
 #include <sstream>
 
 #include "../allocator.h"
@@ -39,7 +45,6 @@
 #include "cutlass/util/reference/device/tensor_compare.h"
 #include "cutlass/util/reference/device/tensor_fill.h"
 #include "cutlass/util/tensor_view_io.h"
-#include "group_gemm_cutlass.cuh"
 
 namespace flashinfer {