@@ -1269,9 +1269,10 @@ void reduCGFuncImpl(handler &CGH, KernelType KernelFunc,
1269
1269
auto IdentitiesTuple = getReduIdentities (ReduTuple, ReduIndices);
1270
1270
auto BOPsTuple = getReduBOPs (ReduTuple, ReduIndices);
1271
1271
1272
- using Name = typename get_reduction_main_kernel_name_t <
1273
- KernelName, KernelType, UniformPow2WG, IsOneWG,
1274
- std::tuple<Reductions...>>::name;
1272
+ using Name =
1273
+ typename get_reduction_main_kernel_name_t <KernelName, KernelType,
1274
+ UniformPow2WG, IsOneWG,
1275
+ decltype (OutAccsTuple)>::name;
1275
1276
CGH.parallel_for <Name>(Range, [=](nd_item<Dims> NDIt) {
1276
1277
auto ReduIndices = std::index_sequence_for<Reductions...>();
1277
1278
auto ReducersTuple =
@@ -1403,7 +1404,7 @@ void reduAuxCGFuncImpl(handler &CGH, size_t NWorkItems, size_t NWorkGroups,
1403
1404
using Name =
1404
1405
typename get_reduction_aux_kernel_name_t <KernelName, KernelType,
1405
1406
UniformPow2WG, IsOneWG,
1406
- std::tuple<Reductions...> >::name;
1407
+ decltype (OutAccsTuple) >::name;
1407
1408
range<1 > GlobalRange = {UniformPow2WG ? NWorkItems : NWorkGroups * WGSize};
1408
1409
nd_range<1 > Range{GlobalRange, range<1 >(WGSize)};
1409
1410
CGH.parallel_for <Name>(Range, [=](nd_item<1 > NDIt) {
0 commit comments