@@ -1015,7 +1015,7 @@ struct subgroup_radix_sort
1015
1015
template <typename ValueT, typename OutputT, typename ProjT>
1016
1016
sycl::event operator ()(sycl::queue &exec_q,
1017
1017
size_t n_iters,
1018
- size_t n_values ,
1018
+ size_t n_to_sort ,
1019
1019
ValueT *input_ptr,
1020
1020
OutputT *output_ptr,
1021
1021
ProjT proj_op,
@@ -1038,7 +1038,8 @@ struct subgroup_radix_sort
1038
1038
std::min<std::size_t >(n_iters, max_concurrent_work_groups);
1039
1039
1040
1040
// determine which temporary allocation can be accommodated in SLM
1041
- const auto &SLM_availability = check_slm_size<ValueT>(exec_q, n_values);
1041
+ const auto &SLM_availability =
1042
+ check_slm_size<ValueT>(exec_q, n_to_sort);
1042
1043
1043
1044
const std::size_t n_batch_size = n_work_groups;
1044
1045
@@ -1049,7 +1050,7 @@ struct subgroup_radix_sort
1049
1050
constexpr auto storage_for_counters = use_slm_tag{};
1050
1051
1051
1052
return one_group_submitter<_SortKernelLoc>()(
1052
- exec_q, n_iters, n_iters, n_values , input_ptr, output_ptr,
1053
+ exec_q, n_iters, n_iters, n_to_sort , input_ptr, output_ptr,
1053
1054
proj_op, is_ascending, storage_for_values, storage_for_counters,
1054
1055
depends);
1055
1056
}
@@ -1059,7 +1060,7 @@ struct subgroup_radix_sort
1059
1060
constexpr auto storage_for_counters = use_slm_tag{};
1060
1061
1061
1062
return one_group_submitter<_SortKernelPartGlob>()(
1062
- exec_q, n_iters, n_batch_size, n_values , input_ptr, output_ptr,
1063
+ exec_q, n_iters, n_batch_size, n_to_sort , input_ptr, output_ptr,
1063
1064
proj_op, is_ascending, storage_for_values, storage_for_counters,
1064
1065
depends);
1065
1066
}
@@ -1069,7 +1070,7 @@ struct subgroup_radix_sort
1069
1070
constexpr auto storage_for_counters = use_global_mem_tag{};
1070
1071
1071
1072
return one_group_submitter<_SortKernelGlob>()(
1072
- exec_q, n_iters, n_batch_size, n_values , input_ptr, output_ptr,
1073
+ exec_q, n_iters, n_batch_size, n_to_sort , input_ptr, output_ptr,
1073
1074
proj_op, is_ascending, storage_for_values, storage_for_counters,
1074
1075
depends);
1075
1076
}
0 commit comments