|
43 | 43 | _DataType_output* result = reinterpret_cast<_DataType_output*>(result1); \
|
44 | 44 | \
|
45 | 45 | cl::sycl::range<1> gws(size); \
|
46 |
| - event = DPNP_QUEUE.submit([&](cl::sycl::handler& cgh) { \ |
47 |
| - cgh.parallel_for<class custom_elemwise_##__name__##_c_kernel<_DataType_input> >( \ |
48 |
| - gws, \ |
49 |
| - [=](cl::sycl::id<1> global_id) \ |
| 46 | + auto kernel_parallel_for_func = [=](cl::sycl::id<1> global_id) { \ |
| 47 | + size_t i = global_id[0]; /*for (size_t i = 0; i < size; ++i)*/ \ |
50 | 48 | { \
|
51 |
| - size_t i = global_id[0]; /*for (size_t i = 0; i < size; ++i)*/ \ |
52 |
| - { \ |
53 |
| - _DataType_output input_elem = array1[i]; \ |
54 |
| - result[i] = __operation__; \ |
55 |
| - } \ |
56 |
| - }); /* parallel_for */ \ |
57 |
| - }); /* queue.submit */ \ |
| 49 | + _DataType_output input_elem = array1[i]; \ |
| 50 | + result[i] = __operation__; \ |
| 51 | + } \ |
| 52 | + }; \ |
| 53 | + \ |
| 54 | + auto kernel_func = [&](cl::sycl::handler& cgh) { \ |
| 55 | + cgh.parallel_for<class custom_elemwise_##__name__##_c_kernel<_DataType_input> >( \ |
| 56 | + gws, kernel_parallel_for_func); \ |
| 57 | + }; \ |
| 58 | + \ |
| 59 | + event = DPNP_QUEUE.submit(kernel_func); \ |
58 | 60 | \
|
59 | 61 | event.wait(); \
|
60 | 62 | } \
|
|
79 | 81 | _DataType* result = reinterpret_cast<_DataType*>(result1); \
|
80 | 82 | \
|
81 | 83 | cl::sycl::range<1> gws(size); \
|
82 |
| - event = DPNP_QUEUE.submit([&](cl::sycl::handler& cgh) { \ |
83 |
| - cgh.parallel_for<class custom_elemwise_##__name__##_c_kernel<_DataType> >( \ |
84 |
| - gws, \ |
85 |
| - [=](cl::sycl::id<1> global_id) \ |
| 84 | + auto kernel_parallel_for_func = [=](cl::sycl::id<1> global_id) { \ |
| 85 | + size_t i = global_id[0]; /*for (size_t i = 0; i < size; ++i)*/ \ |
86 | 86 | { \
|
87 |
| - size_t i = global_id[0]; /*for (size_t i = 0; i < size; ++i)*/ \ |
88 |
| - { \ |
89 |
| - _DataType input_elem = array1[i]; \ |
90 |
| - result[i] = __operation__; \ |
91 |
| - } \ |
92 |
| - }); /* parallel_for */ \ |
93 |
| - }); /* queue.submit */ \ |
| 87 | + _DataType input_elem = array1[i]; \ |
| 88 | + result[i] = __operation__; \ |
| 89 | + } \ |
| 90 | + }; \ |
| 91 | + \ |
| 92 | + auto kernel_func = [&](cl::sycl::handler& cgh) { \ |
| 93 | + cgh.parallel_for<class custom_elemwise_##__name__##_c_kernel<_DataType> >(gws, kernel_parallel_for_func); \ |
| 94 | + }; \ |
| 95 | + \ |
| 96 | + event = DPNP_QUEUE.submit(kernel_func); \ |
94 | 97 | \
|
95 | 98 | event.wait(); \
|
96 | 99 | } \
|
|
118 | 121 | _DataType_output* result = reinterpret_cast<_DataType_output*>(result1); \
|
119 | 122 | \
|
120 | 123 | cl::sycl::range<1> gws(size); \
|
121 |
| - event = DPNP_QUEUE.submit([&](cl::sycl::handler& cgh) { \ |
122 |
| - cgh.parallel_for<class custom_elemwise_##__name__##_c_kernel<_DataType_input1, _DataType_input2, _DataType_output> >( \ |
123 |
| - gws, \ |
124 |
| - [=](cl::sycl::id<1> global_id) \ |
| 124 | + auto kernel_parallel_for_func = [=](cl::sycl::id<1> global_id) { \ |
| 125 | + size_t i = global_id[0]; /*for (size_t i = 0; i < size; ++i)*/ \ |
125 | 126 | { \
|
126 |
| - size_t i = global_id[0]; /*for (size_t i = 0; i < size; ++i)*/ \ |
127 |
| - { \ |
128 |
| - _DataType_output input_elem1 = array1[i]; \ |
129 |
| - _DataType_output input_elem2 = array2[i]; \ |
130 |
| - result[i] = __operation__; \ |
131 |
| - } \ |
132 |
| - }); /* parallel_for */ \ |
133 |
| - }); /* queue.submit */ \ |
| 127 | + _DataType_output input_elem1 = array1[i]; \ |
| 128 | + _DataType_output input_elem2 = array2[i]; \ |
| 129 | + result[i] = __operation__; \ |
| 130 | + } \ |
| 131 | + }; \ |
| 132 | + \ |
| 133 | + auto kernel_func = [&](cl::sycl::handler& cgh) { \ |
| 134 | + cgh.parallel_for<class custom_elemwise_##__name__##_c_kernel<_DataType_input1, _DataType_input2, _DataType_output> >( \ |
| 135 | + gws, kernel_parallel_for_func); \ |
| 136 | + }; \ |
| 137 | + \ |
| 138 | + event = DPNP_QUEUE.submit(kernel_func); \ |
134 | 139 | \
|
135 | 140 | event.wait(); \
|
136 | 141 | } \
|
|
0 commit comments