Skip to content

Commit

Permalink
Use syclcompat::dp4a
Browse files Browse the repository at this point in the history
  • Loading branch information
aacostadiaz committed Dec 5, 2024
1 parent e322028 commit ce8d683
Showing 1 changed file with 3 additions and 3 deletions.
6 changes: 3 additions & 3 deletions include/cutlass/numeric_conversion.h
Original file line number Diff line number Diff line change
Expand Up @@ -3664,10 +3664,10 @@ struct NumericArrayConverter<float, int8_t, N, Round> {

 CUTLASS_PRAGMA_UNROLL
 for (int ii = 0; ii < PackedResultType::kElements; ++ii) {
-#if defined(__CUDA_ARCH__)
-t[ii] = __dp4a(x, mask[ii], 0);
+#if defined(CUTLASS_ENABLE_SYCL)
+t[ii] = syclcompat::dp4a(x, mask[ii], 0);
 #else
-t[ii] = x * mask[ii];
+t[ii] = __dp4a(x, mask[ii], 0);
 #endif
 r[ii] = static_cast<float>(t[ii]);
 }
Expand Down

0 comments on commit ce8d683

Please sign in to comment.