Skip to content

Commit 703e23b

Browse files
committed
Added UTs for different datatype in epilogue
Signed-off-by: Chawla, Amit K <[email protected]>
1 parent db77438 commit 703e23b

File tree

2 files changed

+7
-4
lines changed

2 files changed

+7
-4
lines changed

include/cutlass/epilogue/collective/xe_array_epilogue.hpp

Lines changed: 5 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -132,19 +132,22 @@ class CollectiveEpilogue<
132132
using CopyThreadShape = Shape<_1, Int<SubgroupSize>>;
133133

134134
using Trait_D = Copy_Traits<GmemTiledCopyD, InternalStrideD>;
135+
using val_layout_store_D = decltype(make_layout(shape_div(typename Trait_D::BlockShape{}, CopyThreadShape{})));
135136
using XE_Copy_D = decltype(make_tiled_copy(Copy_Atom<Trait_D, ElementD>{},
136137
Layout<CopyThreadShape>{},
137-
make_layout(shape_div(typename Trait_D::BlockShape{}, CopyThreadShape{}))));
138+
val_layout_store_D{}));
138139
private:
139140
constexpr static bool is_source_supported = not cute::is_void_v<ElementC>;
140141
constexpr static bool is_destination_supported = not cute::is_void_v<ElementD> && not cute::is_void_v<CopyOpR2G>;
141142

142143
using NonVoidElementC = conditional_t<is_source_supported, ElementC, ElementD>;
143144
using Trait_C = Copy_Traits<GmemTiledCopyC, InternalStrideC>;
144145
using NonVoidTrait_C = conditional_t<is_source_supported, Trait_C, Trait_D>;
146+
using val_layout_load_C = decltype(make_layout(shape_div(typename NonVoidTrait_C::BlockShape{}, CopyThreadShape{})));
147+
using NonVoidValLayoutLoad_C = conditional_t<is_source_supported, val_layout_load_C, val_layout_store_D>;
145148
using XE_Copy_C = decltype(make_tiled_copy(Copy_Atom<NonVoidTrait_C, NonVoidElementC>{},
146149
Layout<CopyThreadShape>{},
147-
make_layout(shape_div(typename NonVoidTrait_C::BlockShape{}, CopyThreadShape{}))));
150+
NonVoidValLayoutLoad_C{}));
148151
public:
149152

150153
using EmptyType = cute::tuple<>;

test/unit/gemm/device/xe_gemm_bf16_bf16_fp32_tensor_op_bf16.cpp

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,5 @@
11
/***************************************************************************************************
2-
* Copyright (c) 2025 - 2025 Codeplay Software Ltd. All rights reserved.
2+
* Copyright (C) 2025 Intel Corporation, All rights reserved.
33
* SPDX-License-Identifier: BSD-3-Clause
44
*
55
* Redistribution and use in source and binary forms, with or without
@@ -27,7 +27,7 @@
2727
* OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
2828
* OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
2929
*
30-
**************************************************************************************************/
30+
***************************************************************************************************/
3131

3232
/*! \file
3333
\brief Tests for Xe bf16_bf16_fp32 and C is bf16

0 commit comments

Comments
 (0)