Skip to content

Commit 4e0f032

Browse files
vladimirlaz authored and bb-sycl committed
[SYCL] Speed up atomic_ref tests (intel#879)
1 parent 8908920 commit 4e0f032

Some content is hidden

Large commits have some content hidden by default. Use the search box below for content that may be hidden.

63 files changed

+719
-265
lines changed

SYCL/AtomicRef/add.cpp

Lines changed: 7 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -1,4 +1,5 @@
11
<<<<<<< HEAD
2+
<<<<<<< HEAD
23
// See https://github.com/intel/llvm-test-suite/issues/867 for detailed status
34
// UNSUPPORTED: hip
45

@@ -152,6 +153,12 @@
152153

153154
// RUN: %clangxx -fsycl -fsycl-unnamed-lambda -fsycl-targets=%sycl_triple %s -o %t.out -Xsycl-target-backend=nvptx64-nvidia-cuda --cuda-gpu-arch=sm_70 -DACQ_REL -DSYSTEM -DATOMIC64
154155
>>>>>>> 88ee9d1a0 ([SYCL] Add tests for atomics with various memory orders and scopes (#534))
156+
=======
157+
// See https://github.com/intel/llvm-test-suite/issues/867 for detailed status
158+
// UNSUPPORTED: hip
159+
160+
// RUN: %clangxx -fsycl -fsycl-unnamed-lambda -fsycl-device-code-split=per_kernel -fsycl-targets=%sycl_triple %s -o %t.out -Xsycl-target-backend=nvptx64-nvidia-cuda --cuda-gpu-arch=sm_70
161+
>>>>>>> a5f90c0cd ([SYCL] Speed up atomic_ref tests (#879))
155162
// RUN: %HOST_RUN_PLACEHOLDER %t.out
156163
// RUN: %GPU_RUN_PLACEHOLDER %t.out
157164
// RUN: %CPU_RUN_PLACEHOLDER %t.out

SYCL/AtomicRef/add.h

Lines changed: 58 additions & 28 deletions
Original file line number | Diff line number | Diff line change
@@ -244,14 +244,19 @@ void add_test(queue q, size_t N) {
244244
constexpr bool do_ext_tests = space != access::address_space::generic_space;
245245
if constexpr (do_local_tests) {
246246
<<<<<<< HEAD
247+
<<<<<<< HEAD
247248
#ifdef RUN_DEPRECATED
248249
=======
249250
>>>>>>> 88ee9d1a0 ([SYCL] Add tests for atomics with various memory orders and scopes (#534))
251+
=======
252+
#ifdef RUN_DEPRECATED
253+
>>>>>>> a5f90c0cd ([SYCL] Speed up atomic_ref tests (#879))
250254
if constexpr (do_ext_tests) {
251255
add_fetch_local_test<::sycl::ext::oneapi::atomic_ref, space, T,
252256
Difference, order, scope>(q, N);
253257
}
254258
<<<<<<< HEAD
259+
<<<<<<< HEAD
255260
#else
256261
add_fetch_local_test<::sycl::atomic_ref, space, T, Difference, order,
257262
scope>(q, N);
@@ -260,11 +265,19 @@ void add_test(queue q, size_t N) {
260265
if constexpr (do_global_tests) {
261266
#ifdef RUN_DEPRECATED
262267
=======
268+
=======
269+
#else
270+
>>>>>>> a5f90c0cd ([SYCL] Speed up atomic_ref tests (#879))
263271
add_fetch_local_test<::sycl::atomic_ref, space, T, Difference, order,
264272
scope>(q, N);
273+
#endif
265274
}
266275
if constexpr (do_global_tests) {
276+
<<<<<<< HEAD
267277
>>>>>>> 88ee9d1a0 ([SYCL] Add tests for atomics with various memory orders and scopes (#534))
278+
=======
279+
#ifdef RUN_DEPRECATED
280+
>>>>>>> a5f90c0cd ([SYCL] Speed up atomic_ref tests (#879))
268281
if constexpr (do_ext_tests) {
269282
add_fetch_test<::sycl::ext::oneapi::atomic_ref, space, T, Difference,
270283
order, scope>(q, N);
@@ -278,9 +291,13 @@ void add_test(queue q, size_t N) {
278291
}
279292
}
280293
<<<<<<< HEAD
294+
<<<<<<< HEAD
281295
#else
282296
=======
283297
>>>>>>> 88ee9d1a0 ([SYCL] Add tests for atomics with various memory orders and scopes (#534))
298+
=======
299+
#else
300+
>>>>>>> a5f90c0cd ([SYCL] Speed up atomic_ref tests (#879))
284301
add_fetch_test<::sycl::atomic_ref, space, T, Difference, order, scope>(q,
285302
N);
286303
add_plus_equal_test<::sycl::atomic_ref, space, T, Difference, order, scope>(
@@ -292,9 +309,13 @@ void add_test(queue q, size_t N) {
292309
q, N);
293310
}
294311
<<<<<<< HEAD
312+
<<<<<<< HEAD
295313
#endif
296314
=======
297315
>>>>>>> 88ee9d1a0 ([SYCL] Add tests for atomics with various memory orders and scopes (#534))
316+
=======
317+
#endif
318+
>>>>>>> a5f90c0cd ([SYCL] Speed up atomic_ref tests (#879))
298319
}
299320
}
300321

@@ -303,6 +324,7 @@ template <access::address_space space, typename T, typename Difference = T,
303324
void add_test_scopes(queue q, size_t N) {
304325
std::vector<memory_scope> scopes =
305326
q.get_device().get_info<info::device::atomic_memory_scope_capabilities>();
327+
<<<<<<< HEAD
306328
<<<<<<< HEAD
307329
if (std::find(scopes.begin(), scopes.end(), memory_scope::system) !=
308330
scopes.end()) {
@@ -320,35 +342,33 @@ void add_test_scopes(queue q, size_t N) {
320342
=======
321343
#if defined(SYSTEM)
322344
if (std::find(scopes.begin(), scopes.end(), memory_scope::system) ==
345+
=======
346+
if (std::find(scopes.begin(), scopes.end(), memory_scope::system) !=
347+
>>>>>>> a5f90c0cd ([SYCL] Speed up atomic_ref tests (#879))
323348
scopes.end()) {
324-
std::cout << "Skipping test\n";
325-
return;
349+
add_test<space, T, Difference, order, memory_scope::system>(q, N);
326350
}
327-
add_test<space, T, Difference, order, memory_scope::system>(q, N);
328-
#elif defined(WORK_GROUP)
329-
if (std::find(scopes.begin(), scopes.end(), memory_scope::system) ==
351+
if (std::find(scopes.begin(), scopes.end(), memory_scope::work_group) !=
330352
scopes.end()) {
331-
std::cout << "Skipping test\n";
332-
return;
353+
add_test<space, T, Difference, order, memory_scope::work_group>(q, N);
333354
}
334-
add_test<space, T, Difference, order, memory_scope::work_group>(q, N);
335-
#elif defined(SUB_GROUP)
336-
if (std::find(scopes.begin(), scopes.end(), memory_scope::system) ==
355+
if (std::find(scopes.begin(), scopes.end(), memory_scope::sub_group) !=
337356
scopes.end()) {
338-
std::cout << "Skipping test\n";
339-
return;
357+
add_test<space, T, Difference, order, memory_scope::sub_group>(q, N);
340358
}
341-
add_test<space, T, Difference, order, memory_scope::sub_group>(q, N);
342-
#else
343359
add_test<space, T, Difference, order, memory_scope::device>(q, N);
360+
<<<<<<< HEAD
344361
#endif
345362
>>>>>>> 88ee9d1a0 ([SYCL] Add tests for atomics with various memory orders and scopes (#534))
363+
=======
364+
>>>>>>> a5f90c0cd ([SYCL] Speed up atomic_ref tests (#879))
346365
}
347366

348367
template <access::address_space space, typename T, typename Difference = T>
349368
void add_test_orders_scopes(queue q, size_t N) {
350369
std::vector<memory_order> orders =
351370
q.get_device().get_info<info::device::atomic_memory_order_capabilities>();
371+
<<<<<<< HEAD
352372
<<<<<<< HEAD
353373
if (std::find(orders.begin(), orders.end(), memory_order::acq_rel) !=
354374
orders.end()) {
@@ -366,36 +386,34 @@ void add_test_orders_scopes(queue q, size_t N) {
366386
=======
367387
#if defined(ACQ_REL)
368388
if (std::find(orders.begin(), orders.end(), memory_order::acq_rel) ==
389+
=======
390+
if (std::find(orders.begin(), orders.end(), memory_order::acq_rel) !=
391+
>>>>>>> a5f90c0cd ([SYCL] Speed up atomic_ref tests (#879))
369392
orders.end()) {
370-
std::cout << "Skipping test\n";
371-
return;
393+
add_test_scopes<space, T, Difference, memory_order::acq_rel>(q, N);
372394
}
373-
add_test_scopes<space, T, Difference, memory_order::acq_rel>(q, N);
374-
#elif defined(ACQUIRE)
375-
if (std::find(orders.begin(), orders.end(), memory_order::acquire) ==
395+
if (std::find(orders.begin(), orders.end(), memory_order::acquire) !=
376396
orders.end()) {
377-
std::cout << "Skipping test\n";
378-
return;
397+
add_test_scopes<space, T, Difference, memory_order::acquire>(q, N);
379398
}
380-
add_test_scopes<space, T, Difference, memory_order::acquire>(q, N);
381-
#elif defined(RELEASE)
382-
if (std::find(orders.begin(), orders.end(), memory_order::release) ==
399+
if (std::find(orders.begin(), orders.end(), memory_order::release) !=
383400
orders.end()) {
384-
std::cout << "Skipping test\n";
385-
return;
401+
add_test_scopes<space, T, Difference, memory_order::release>(q, N);
386402
}
387-
add_test_scopes<space, T, Difference, memory_order::release>(q, N);
388-
#else
389403
add_test_scopes<space, T, Difference, memory_order::relaxed>(q, N);
404+
<<<<<<< HEAD
390405
#endif
391406
>>>>>>> 88ee9d1a0 ([SYCL] Add tests for atomics with various memory orders and scopes (#534))
407+
=======
408+
>>>>>>> a5f90c0cd ([SYCL] Speed up atomic_ref tests (#879))
392409
}
393410

394411
template <access::address_space space> void add_test_all() {
395412
queue q;
396413

397414
constexpr int N = 32;
398415
<<<<<<< HEAD
416+
<<<<<<< HEAD
399417
#ifdef FULL_ATOMIC64_COVERAGE
400418
add_test_orders_scopes<space, double>(q, N);
401419
=======
@@ -408,6 +426,10 @@ template <access::address_space space> void add_test_all() {
408426
add_test_orders_scopes<space, double>(q, N);
409427
#ifndef FP_TESTS_ONLY
410428
>>>>>>> 88ee9d1a0 ([SYCL] Add tests for atomics with various memory orders and scopes (#534))
429+
=======
430+
#ifdef FULL_ATOMIC64_COVERAGE
431+
add_test_orders_scopes<space, double>(q, N);
432+
>>>>>>> a5f90c0cd ([SYCL] Speed up atomic_ref tests (#879))
411433
if constexpr (sizeof(long) == 8) {
412434
add_test_orders_scopes<space, long>(q, N);
413435
add_test_orders_scopes<space, unsigned long>(q, N);
@@ -420,6 +442,7 @@ template <access::address_space space> void add_test_all() {
420442
add_test_orders_scopes<space, char *, ptrdiff_t>(q, N);
421443
}
422444
#endif
445+
<<<<<<< HEAD
423446
<<<<<<< HEAD
424447
add_test_orders_scopes<space, float>(q, N);
425448
#ifdef FULL_ATOMIC32_COVERAGE
@@ -428,6 +451,10 @@ template <access::address_space space> void add_test_all() {
428451
add_test_orders_scopes<space, float>(q, N);
429452
#ifndef FP_TESTS_ONLY
430453
>>>>>>> 88ee9d1a0 ([SYCL] Add tests for atomics with various memory orders and scopes (#534))
454+
=======
455+
add_test_orders_scopes<space, float>(q, N);
456+
#ifdef FULL_ATOMIC32_COVERAGE
457+
>>>>>>> a5f90c0cd ([SYCL] Speed up atomic_ref tests (#879))
431458
add_test_orders_scopes<space, int>(q, N);
432459
add_test_orders_scopes<space, unsigned int>(q, N);
433460
if constexpr (sizeof(long) == 4) {
@@ -439,9 +466,12 @@ template <access::address_space space> void add_test_all() {
439466
}
440467
#endif
441468
<<<<<<< HEAD
469+
<<<<<<< HEAD
442470
=======
443471
#endif
444472

445473
>>>>>>> 88ee9d1a0 ([SYCL] Add tests for atomics with various memory orders and scopes (#534))
474+
=======
475+
>>>>>>> a5f90c0cd ([SYCL] Speed up atomic_ref tests (#879))
446476
std::cout << "Test passed." << std::endl;
447477
}

SYCL/AtomicRef/add_generic.cpp

Lines changed: 4 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -1,4 +1,5 @@
11
<<<<<<< HEAD
2+
<<<<<<< HEAD
23
// RUN: %clangxx -fsycl -fsycl-unnamed-lambda -fsycl-targets=%sycl_triple %s -o %t.out -Xsycl-target-backend=nvptx64-nvidia-cuda --cuda-gpu-arch=sm_70
34
=======
45
// Each combination of 64/32 bit atomic, relaxed/acquire/release/acq_rel
@@ -148,6 +149,9 @@
148149
// RUN: %ACC_RUN_PLACEHOLDER %t.out
149150

150151
// RUN: %clangxx -fsycl -fsycl-unnamed-lambda -fsycl-targets=%sycl_triple %s -o %t.out -Xsycl-target-backend=nvptx64-nvidia-cuda --cuda-gpu-arch=sm_70 -DACQ_REL -DSYSTEM -DATOMIC64
152+
=======
153+
// RUN: %clangxx -fsycl -fsycl-unnamed-lambda -fsycl-targets=%sycl_triple %s -o %t.out -Xsycl-target-backend=nvptx64-nvidia-cuda --cuda-gpu-arch=sm_70
154+
>>>>>>> a5f90c0cd ([SYCL] Speed up atomic_ref tests (#879))
151155
// RUN: %HOST_RUN_PLACEHOLDER %t.out
152156
// RUN: %GPU_RUN_PLACEHOLDER %t.out
153157
// RUN: %CPU_RUN_PLACEHOLDER %t.out

SYCL/AtomicRef/add_generic_local.cpp

Lines changed: 4 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -1,4 +1,5 @@
11
<<<<<<< HEAD
2+
<<<<<<< HEAD
23
// RUN: %clangxx -fsycl -fsycl-unnamed-lambda -fsycl-targets=%sycl_triple %s -o %t.out -Xsycl-target-backend=nvptx64-nvidia-cuda --cuda-gpu-arch=sm_70
34
=======
45
// Each combination of 64/32 bit atomic, relaxed/acquire/release/acq_rel
@@ -146,6 +147,9 @@
146147

147148
// RUN: %clangxx -fsycl -fsycl-unnamed-lambda -fsycl-targets=%sycl_triple %s -o %t.out -Xsycl-target-backend=nvptx64-nvidia-cuda --cuda-gpu-arch=sm_70 -DACQ_REL -DSYSTEM -DATOMIC64
148149
>>>>>>> 88ee9d1a0 ([SYCL] Add tests for atomics with various memory orders and scopes (#534))
150+
=======
151+
// RUN: %clangxx -fsycl -fsycl-unnamed-lambda -fsycl-targets=%sycl_triple %s -o %t.out -Xsycl-target-backend=nvptx64-nvidia-cuda --cuda-gpu-arch=sm_70
152+
>>>>>>> a5f90c0cd ([SYCL] Speed up atomic_ref tests (#879))
149153
// RUN: %HOST_RUN_PLACEHOLDER %t.out
150154
// RUN: %GPU_RUN_PLACEHOLDER %t.out
151155
// RUN: %CPU_RUN_PLACEHOLDER %t.out

SYCL/AtomicRef/add_generic_local_native_fp.cpp

Lines changed: 4 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -1,4 +1,5 @@
11
<<<<<<< HEAD
2+
<<<<<<< HEAD
23
// RUN: %clangxx -fsycl -fsycl-unnamed-lambda -fsycl-targets=%sycl_triple %s -o %t.out -Xsycl-target-backend=nvptx64-nvidia-cuda --cuda-gpu-arch=sm_70
34
=======
45
// Each combination of 64/32 bit atomic, relaxed/acquire/release/acq_rel
@@ -146,6 +147,9 @@
146147

147148
// RUN: %clangxx -fsycl -fsycl-unnamed-lambda -fsycl-targets=%sycl_triple %s -o %t.out -Xsycl-target-backend=nvptx64-nvidia-cuda --cuda-gpu-arch=sm_70 -DACQ_REL -DSYSTEM -DATOMIC64
148149
>>>>>>> 88ee9d1a0 ([SYCL] Add tests for atomics with various memory orders and scopes (#534))
150+
=======
151+
// RUN: %clangxx -fsycl -fsycl-unnamed-lambda -fsycl-targets=%sycl_triple %s -o %t.out -Xsycl-target-backend=nvptx64-nvidia-cuda --cuda-gpu-arch=sm_70
152+
>>>>>>> a5f90c0cd ([SYCL] Speed up atomic_ref tests (#879))
149153
// RUN: %HOST_RUN_PLACEHOLDER %t.out
150154
// RUN: %GPU_RUN_PLACEHOLDER %t.out
151155
// RUN: %CPU_RUN_PLACEHOLDER %t.out

SYCL/AtomicRef/add_generic_native_fp.cpp

Lines changed: 4 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -1,4 +1,5 @@
11
<<<<<<< HEAD
2+
<<<<<<< HEAD
23
// RUN: %clangxx -fsycl -fsycl-unnamed-lambda -fsycl-targets=%sycl_triple %s -o %t.out -Xsycl-target-backend=nvptx64-nvidia-cuda --cuda-gpu-arch=sm_70
34
=======
45
// Each combination of 64/32 bit atomic, relaxed/acquire/release/acq_rel
@@ -146,6 +147,9 @@
146147

147148
// RUN: %clangxx -fsycl -fsycl-unnamed-lambda -fsycl-targets=%sycl_triple %s -o %t.out -Xsycl-target-backend=nvptx64-nvidia-cuda --cuda-gpu-arch=sm_70 -DACQ_REL -DSYSTEM -DATOMIC64
148149
>>>>>>> 88ee9d1a0 ([SYCL] Add tests for atomics with various memory orders and scopes (#534))
150+
=======
151+
// RUN: %clangxx -fsycl -fsycl-unnamed-lambda -fsycl-targets=%sycl_triple %s -o %t.out -Xsycl-target-backend=nvptx64-nvidia-cuda --cuda-gpu-arch=sm_70
152+
>>>>>>> a5f90c0cd ([SYCL] Speed up atomic_ref tests (#879))
149153
// RUN: %HOST_RUN_PLACEHOLDER %t.out
150154
// RUN: %GPU_RUN_PLACEHOLDER %t.out
151155
// RUN: %CPU_RUN_PLACEHOLDER %t.out

SYCL/AtomicRef/add_local.cpp

Lines changed: 10 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -1,4 +1,5 @@
11
<<<<<<< HEAD
2+
<<<<<<< HEAD
23
// RUN: %clangxx -fsycl -fsycl-unnamed-lambda -fsycl-targets=%sycl_triple %s -o %t.out -Xsycl-target-backend=nvptx64-nvidia-cuda --cuda-gpu-arch=sm_70
34
=======
45
// Each combination of 64/32 bit atomic, relaxed/acquire/release/acq_rel
@@ -146,11 +147,15 @@
146147

147148
// RUN: %clangxx -fsycl -fsycl-unnamed-lambda -fsycl-targets=%sycl_triple %s -o %t.out -Xsycl-target-backend=nvptx64-nvidia-cuda --cuda-gpu-arch=sm_70 -DACQ_REL -DSYSTEM -DATOMIC64
148149
>>>>>>> 88ee9d1a0 ([SYCL] Add tests for atomics with various memory orders and scopes (#534))
150+
=======
151+
// RUN: %clangxx -fsycl -fsycl-unnamed-lambda -fsycl-targets=%sycl_triple %s -o %t.out -Xsycl-target-backend=nvptx64-nvidia-cuda --cuda-gpu-arch=sm_70
152+
>>>>>>> a5f90c0cd ([SYCL] Speed up atomic_ref tests (#879))
149153
// RUN: %HOST_RUN_PLACEHOLDER %t.out
150154
// RUN: %GPU_RUN_PLACEHOLDER %t.out
151155
// RUN: %CPU_RUN_PLACEHOLDER %t.out
152156
// RUN: %ACC_RUN_PLACEHOLDER %t.out
153157

158+
<<<<<<< HEAD
154159
<<<<<<< HEAD
155160
// Barrier is not supported on host. HIP and ACC do not support floating
156161
// point atomics.
@@ -160,6 +165,11 @@
160165
// point atomics.
161166
// XFAIL: host, hip, opencl
162167
>>>>>>> 88ee9d1a0 ([SYCL] Add tests for atomics with various memory orders and scopes (#534))
168+
=======
169+
// Barrier is not supported on host. HIP and ACC do not support floating
170+
// point atomics.
171+
// XFAIL: host, hip, acc
172+
>>>>>>> a5f90c0cd ([SYCL] Speed up atomic_ref tests (#879))
163173

164174
#include "add.h"
165175

SYCL/AtomicRef/add_local_native_fp.cpp

Lines changed: 4 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -1,4 +1,5 @@
11
<<<<<<< HEAD
2+
<<<<<<< HEAD
23
// RUN: %clangxx -fsycl -fsycl-unnamed-lambda -fsycl-targets=%sycl_triple %s -o %t.out -Xsycl-target-backend=nvptx64-nvidia-cuda --cuda-gpu-arch=sm_70
34
=======
45
// Each combination of 64/32 bit atomic, relaxed/acquire/release/acq_rel
@@ -146,6 +147,9 @@
146147

147148
// RUN: %clangxx -fsycl -fsycl-unnamed-lambda -fsycl-targets=%sycl_triple %s -o %t.out -Xsycl-target-backend=nvptx64-nvidia-cuda --cuda-gpu-arch=sm_70 -DACQ_REL -DSYSTEM -DATOMIC64
148149
>>>>>>> 88ee9d1a0 ([SYCL] Add tests for atomics with various memory orders and scopes (#534))
150+
=======
151+
// RUN: %clangxx -fsycl -fsycl-unnamed-lambda -fsycl-targets=%sycl_triple %s -o %t.out -Xsycl-target-backend=nvptx64-nvidia-cuda --cuda-gpu-arch=sm_70
152+
>>>>>>> a5f90c0cd ([SYCL] Speed up atomic_ref tests (#879))
149153
// RUN: %HOST_RUN_PLACEHOLDER %t.out
150154
// RUN: %GPU_RUN_PLACEHOLDER %t.out
151155
// RUN: %CPU_RUN_PLACEHOLDER %t.out

SYCL/AtomicRef/add_native_fp.cpp

Lines changed: 4 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -1,4 +1,5 @@
11
<<<<<<< HEAD
2+
<<<<<<< HEAD
23
// RUN: %clangxx -fsycl -fsycl-unnamed-lambda -fsycl-targets=%sycl_triple %s -o %t.out -Xsycl-target-backend=nvptx64-nvidia-cuda --cuda-gpu-arch=sm_70
34
=======
45
// Each combination of 64/32 bit atomic, relaxed/acquire/release/acq_rel
@@ -146,6 +147,9 @@
146147

147148
// RUN: %clangxx -fsycl -fsycl-unnamed-lambda -fsycl-targets=%sycl_triple %s -o %t.out -Xsycl-target-backend=nvptx64-nvidia-cuda --cuda-gpu-arch=sm_70 -DACQ_REL -DSYSTEM -DATOMIC64
148149
>>>>>>> 88ee9d1a0 ([SYCL] Add tests for atomics with various memory orders and scopes (#534))
150+
=======
151+
// RUN: %clangxx -fsycl -fsycl-unnamed-lambda -fsycl-targets=%sycl_triple %s -o %t.out -Xsycl-target-backend=nvptx64-nvidia-cuda --cuda-gpu-arch=sm_70
152+
>>>>>>> a5f90c0cd ([SYCL] Speed up atomic_ref tests (#879))
149153
// RUN: %HOST_RUN_PLACEHOLDER %t.out
150154
// RUN: %GPU_RUN_PLACEHOLDER %t.out
151155
// RUN: %CPU_RUN_PLACEHOLDER %t.out

SYCL/AtomicRef/and.cpp

Lines changed: 4 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -1,4 +1,5 @@
11
<<<<<<< HEAD
2+
<<<<<<< HEAD
23
// RUN: %clangxx -fsycl -fsycl-unnamed-lambda -fsycl-targets=%sycl_triple %s -o %t.out -Xsycl-target-backend=nvptx64-nvidia-cuda --cuda-gpu-arch=sm_70
34
=======
45
// Each combination of 64/32 bit atomic, relaxed/acquire/release/acq_rel
@@ -146,6 +147,9 @@
146147

147148
// RUN: %clangxx -fsycl -fsycl-unnamed-lambda -fsycl-targets=%sycl_triple %s -o %t.out -Xsycl-target-backend=nvptx64-nvidia-cuda --cuda-gpu-arch=sm_70 -DACQ_REL -DSYSTEM -DATOMIC64
148149
>>>>>>> 88ee9d1a0 ([SYCL] Add tests for atomics with various memory orders and scopes (#534))
150+
=======
151+
// RUN: %clangxx -fsycl -fsycl-unnamed-lambda -fsycl-targets=%sycl_triple %s -o %t.out -Xsycl-target-backend=nvptx64-nvidia-cuda --cuda-gpu-arch=sm_70
152+
>>>>>>> a5f90c0cd ([SYCL] Speed up atomic_ref tests (#879))
149153
// RUN: %HOST_RUN_PLACEHOLDER %t.out
150154
// RUN: %GPU_RUN_PLACEHOLDER %t.out
151155
// RUN: %CPU_RUN_PLACEHOLDER %t.out

0 commit comments

Comments
 (0)