Skip to content

Commit

Permalink
Add a workaround for LLVM fpext bug causing test failure on Skylake CPU.
Browse files Browse the repository at this point in the history
Signed-off-by: Ilya Enkovich <[email protected]>
  • Loading branch information
ienkovich committed Jun 17, 2024
1 parent e9c0801 commit 02db84c
Showing 1 changed file with 6 additions and 0 deletions.
6 changes: 6 additions & 0 deletions python/test/unit/language/test_core.py
Original file line number Diff line number Diff line change
Expand Up @@ -2147,6 +2147,12 @@ def kernel(X, Z, BLOCK: tl.constexpr):
def test_reduce(op, dtype_str, shape, axis, keep_dims, num_ctas, device):
check_type_supported(dtype_str, device) # bfloat16 on cc < 80 will not be tested

# fpext fp16->fp32 is broken in LLVM for large vectors:
# https://github.com/llvm/llvm-project/issues/95278
# TODO: remove the change after the bug is fixed.
if is_cpu() and dtype_str == "float16":
shape = (min(shape[0], 512), min(shape[1], 512))

@triton.jit
def kernel(X, Z, BLOCK_M: tl.constexpr, BLOCK_N: tl.constexpr, BLOCK_K: tl.constexpr, IS_3D: tl.constexpr,
AXIS: tl.constexpr, KEEP_DIMS: tl.constexpr):
Expand Down

0 comments on commit 02db84c

Please sign in to comment.