Skip to content

Commit f25053f

Browse files
Make binary_contig_impl use template params to set vec_sz and n_vecs, as unary_contig_impl does
1 parent 94d2159 commit f25053f

File tree

1 file changed

+3
-3
lines changed
  • dpctl/tensor/libtensor/include/kernels/elementwise_functions

1 file changed

+3
-3
lines changed

dpctl/tensor/libtensor/include/kernels/elementwise_functions/common.hpp

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -705,7 +705,9 @@ template <typename argTy1,
705705
typename T3,
706706
unsigned int vs,
707707
unsigned int nv>
708-
class kernel_name>
708+
class kernel_name,
709+
unsigned int vec_sz = 4,
710+
unsigned int n_vecs = 2>
709711
sycl::event binary_contig_impl(sycl::queue exec_q,
710712
size_t nelems,
711713
const char *arg1_p,
@@ -720,8 +722,6 @@ sycl::event binary_contig_impl(sycl::queue exec_q,
720722
cgh.depends_on(depends);
721723

722724
size_t lws = 64;
723-
constexpr unsigned int vec_sz = 4;
724-
constexpr unsigned int n_vecs = 2;
725725
const size_t n_groups =
726726
((nelems + lws * n_vecs * vec_sz - 1) / (lws * n_vecs * vec_sz));
727727
const auto gws_range = sycl::range<1>(n_groups * lws);

0 commit comments

Comments
 (0)