|
21 | 21 | using namespace cl::sycl;
|
22 | 22 |
|
23 | 23 | int main(void) {
|
| 24 | + constexpr unsigned Size = 1024 * 128; |
| 25 | + constexpr unsigned VL = 16; |
| 26 | + |
| 27 | + float *A = new float[Size]; |
| 28 | + float *B = new float[Size]; |
| 29 | + float *C = new float[Size]; |
| 30 | + |
| 31 | + for (unsigned i = 0; i < Size; ++i) { |
| 32 | + A[i] = B[i] = i; |
| 33 | + C[i] = 0.0f; |
| 34 | + } |
| 35 | + |
24 | 36 | try {
|
25 |
| - int data = 0; |
| 37 | + buffer<float, 1> bufa(A, range<1>(Size)); |
| 38 | + buffer<float, 1> bufb(B, range<1>(Size)); |
| 39 | + buffer<float, 1> bufc(C, range<1>(Size)); |
| 40 | + |
| 41 | + // We need that many workgroups |
| 42 | + range<1> GlobalRange{Size / VL}; |
| 43 | + |
| 44 | + // We need that many threads in each group |
| 45 | + range<1> LocalRange{1}; |
| 46 | + |
26 | 47 | queue q(esimd_test::ESIMDSelector{}, esimd_test::createExceptionHandler());
|
27 | 48 |
|
28 | 49 | auto dev = q.get_device();
|
29 | 50 | std::cout << "Running on " << dev.get_info<info::device::name>() << "\n";
|
30 | 51 |
|
31 |
| - cl::sycl::buffer<int, 1> buf(&data, cl::sycl::range<1>(1)); |
32 | 52 | auto e = q.submit([&](handler &cgh) {
|
33 |
| - auto acc = buf.get_access<cl::sycl::access::mode::read_write>(cgh); |
34 |
| - cgh.single_task<class Test>([=] { acc[0] += 1; }); |
| 53 | + auto PA = bufa.get_access<access::mode::read>(cgh); |
| 54 | + auto PB = bufb.get_access<access::mode::read>(cgh); |
| 55 | + auto PC = bufc.get_access<access::mode::write>(cgh); |
| 56 | + cgh.parallel_for<class Test>( |
| 57 | + GlobalRange * LocalRange, [=](id<1> i) SYCL_ESIMD_KERNEL { |
| 58 | + using namespace sycl::ext::intel::experimental::esimd; |
| 59 | + unsigned int offset = i * VL * sizeof(float); |
| 60 | + simd<float, VL> va; |
| 61 | + va.copy_from(PA, offset); |
| 62 | + simd<float, VL> vb; |
| 63 | + vb.copy_from(PB, offset); |
| 64 | + simd<float, VL> vc = va + vb; |
| 65 | + vc.copy_to(PC, offset); |
| 66 | + }); |
35 | 67 | });
|
36 | 68 | e.wait();
|
37 | 69 | } catch (sycl::exception const &e) {
|
38 | 70 | std::cout << "SYCL exception caught: " << e.what() << '\n';
|
| 71 | + |
| 72 | + delete[] A; |
| 73 | + delete[] B; |
| 74 | + delete[] C; |
39 | 75 | return 1;
|
40 | 76 | }
|
41 |
| - return 0; |
| 77 | + |
| 78 | + int err_cnt = 0; |
| 79 | + |
| 80 | + for (unsigned i = 0; i < Size; ++i) { |
| 81 | + if (A[i] + B[i] != C[i]) { |
| 82 | + if (++err_cnt < 10) { |
| 83 | + std::cout << "failed at index " << i << ", " << C[i] << " != " << A[i] |
| 84 | + << " + " << B[i] << "\n"; |
| 85 | + } |
| 86 | + } |
| 87 | + } |
| 88 | + if (err_cnt > 0) { |
| 89 | + std::cout << " pass rate: " |
| 90 | + << ((float)(Size - err_cnt) / (float)Size) * 100.0f << "% (" |
| 91 | + << (Size - err_cnt) << "/" << Size << ")\n"; |
| 92 | + } |
| 93 | + |
| 94 | + delete[] A; |
| 95 | + delete[] B; |
| 96 | + delete[] C; |
| 97 | + |
| 98 | + std::cout << (err_cnt > 0 ? "FAILED\n" : "Passed\n"); |
| 99 | + return err_cnt > 0 ? 1 : 0; |
42 | 100 | }
|
43 | 101 |
|
// CHECK: ---> piProgramBuild(
|
|
0 commit comments