We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 323a791, commit 2ea75e0 (Copy full SHA for 2ea75e0)
dpctl/tensor/libtensor/include/kernels/reductions.hpp
@@ -977,7 +977,10 @@ sycl::event reduction_over_group_temps_strided_impl(
977
size_t wg = choose_workgroup_size<4>(reduction_nelems, sg_sizes);
978
979
constexpr size_t preferrered_reductions_per_wi = 4;
980
- size_t max_wg = d.get_info<sycl::info::device::max_work_group_size>();
+ // max_max_wg caps the device-reported maximum work-group size to prevent running out of resources on CPU
981
+ constexpr size_t max_max_wg = 2048;
982
+ size_t max_wg = std::min(
983
+ max_max_wg, d.get_info<sycl::info::device::max_work_group_size>());
984
985
size_t reductions_per_wi(preferrered_reductions_per_wi);
986
if (reduction_nelems <= preferrered_reductions_per_wi * max_wg) {
0 commit comments