Skip to content
This repository was archived by the owner on Mar 28, 2023. It is now read-only.

Commit 5d4c073

Browse files
authored
Merge branch 'intel' into private/MrSidims/UpdateCODEOWNERS
2 parents 1c1d166 + 0f3052b commit 5d4c073

File tree

480 files changed

+14865
-3846
lines changed

Some content is hidden

Large Commits have some content hidden by default. Use the searchbox below for content that may be hidden.

480 files changed

+14865
-3846
lines changed

.github/CODEOWNERS

Lines changed: 20 additions & 71 deletions
Original file line numberDiff line numberDiff line change
@@ -1,86 +1,35 @@
11
* @vladimirlaz @romanovvlad @bader
22

3-
# AOT compilation
4-
SYCL/AOT @AGindinson @dm-vodopyanov @AlexeySachkov @romanovvlad
3+
# Use runtime team as the umbrella for most of the tests
4+
/SYCL/ @intel/llvm-reviewers-runtime
55

6-
# Atomics
7-
SYCL/AtomicRef @AGindinson
86

9-
# SYCL RT specific tests
10-
SYCL/Assert @intel/llvm-reviewers-runtime
11-
SYCL/Basic @intel/llvm-reviewers-runtime
12-
SYCL/Config @intel/llvm-reviewers-runtime
13-
SYCL/DiscardEvents @intel/llvm-reviewers-runtime
14-
SYCL/FilterSelector @intel/llvm-reviewers-runtime
15-
SYCL/HostInteropTask @intel/llvm-reviewers-runtime
16-
SYCL/InorderQueue @intel/llvm-reviewers-runtime
17-
SYCL/KernelAndProgram @intel/llvm-reviewers-runtime
18-
SYCL/KernelParams @intel/llvm-reviewers-runtime
19-
SYCL/Scheduler @intel/llvm-reviewers-runtime
20-
SYCL/Tracing @intel/llvm-reviewers-runtime
21-
22-
# Device code split
23-
SYCL/DeviceCodeSplit @AlexeySachkov @Fznamznon
24-
25-
# Device library
26-
SYCL/DeviceLib @vzakhari
27-
SYCL/DeviceLib/ITTAnnotations @vzakhari @MrSidims @AGindinson
28-
29-
# dot_product API
30-
SYCL/DotProduct @rdeodhar
31-
32-
# Explicit SIMD
33-
SYCL/ESIMD @kbobrovs @v-klochkov @sndmitriev
34-
35-
# Functor
36-
SYCL/Functor @AlexeySachkov
7+
# SYCL sub-directory matchers are grouped by code owner first, followed by
8+
# alphabetical order within the group. Please, keep this ordering.
379

3810
# Group algorithms
39-
SYCL/GroupAlgorithm @Pennycook @AlexeySachkov
40-
SYCL/SubGroup @Pennycook @AlexeySachkov
41-
SYCL/SubGroupMask @Pennycook @vladimirlaz
4211

43-
# Group local memory
44-
SYCL/GroupLocalMemory @sergey-semenov @Pennycook
12+
/SYCL/GroupAlgorithm/ @Pennycook @intel/llvm-reviewers-runtime
13+
/SYCL/GroupLocalMemory/ @Pennycook @intel/llvm-reviewers-runtime
14+
/SYCL/SubGroup/ @Pennycook @intel/llvm-reviewers-runtime
15+
/SYCL/SubGroupMask/ @Pennycook @intel/llvm-reviewers-runtime
4516

46-
# Hierarchical parallelism
47-
SYCL/HierPar @kbobrovs
17+
# Plugin interface for Level Zero
18+
/SYCL/Plugin/*level[-_]zero* @intel/dpcpp-l0-pi-reviewers
4819

49-
# Inline assembler
50-
SYCL/InlineAsm @AlexeySachkov
20+
# Explicit SIMD
21+
/SYCL/ESIMD/ @intel/dpcpp-esimd-reviewers
5122

52-
# Online compiler
53-
SYCL/OnlineCompiler @v-klochkov
23+
# BFloat16 conversion
24+
/SYCL/BFloat16/ @AlexeySotkin @intel/dpcpp-tools-reviewers
5425

55-
# Plugin interface
56-
SYCL/Plugin @smaslov-intel
26+
# Compiler tests
27+
/SYCL/AOT/ @intel/dpcpp-tools-reviewers
28+
/SYCL/DeviceCodeSplit/ @intel/dpcpp-tools-reviewers
29+
/SYCL/SeparateCompile/ @intel/dpcpp-tools-reviewers
5730

5831
# Printf
59-
SYCL/Printf @AlexeySachkov @AGindinson @mlychkov
60-
61-
# Reduction algorithms
62-
SYCL/Reduction @v-klochkov
63-
64-
# Image sampler
65-
SYCL/Sampler @cperkinsintel
66-
67-
# Separate compilation
68-
SYCL/SeparateCompile @AlexeySachkov @Fznamznon
32+
/SYCL/Printf/ @intel/dpcpp-tools-reviewers
6933

7034
# Specialization constant
71-
SYCL/SpecConstants @kbobrovs
72-
73-
# Unified Shared Memory (USM)
74-
SYCL/USM @jbrodman @sergey-semenov
75-
76-
# Stream
77-
SYCL/Basic/stream @againull
78-
79-
#BFloat16 conversion
80-
SYCL/BFloat16 @MrSidims
81-
82-
# Deprecated features
83-
SYCL/DeprecatedFeatures @intel/llvm-reviewers-runtime
84-
85-
# XPTI and XPTI Framework
86-
SYCL/XPTI @intel/llvm-reviewers-runtime
35+
/SYCL/SpecConstants/ @intel/dpcpp-tools-reviewers

.github/workflows/clang-format.yml

Lines changed: 8 additions & 9 deletions
Original file line numberDiff line numberDiff line change
@@ -8,22 +8,21 @@ on:
88
jobs:
99
build:
1010
runs-on: ubuntu-latest
11-
steps:
12-
- name: Get clang-format first
13-
run: sudo apt-get install -yqq clang-format-9
1411

12+
container:
13+
image: ghcr.io/intel/llvm/sycl_ubuntu2004_nightly:no-drivers
14+
15+
steps:
1516
- uses: actions/checkout@v2
1617
with:
1718
fetch-depth: 2
18-
19-
- name: Get clang-format-diff.py tool
20-
run: |
21-
wget https://raw.githubusercontent.com/intel/llvm/sycl/clang/tools/clang-format/clang-format-diff.py
22-
chmod u+x clang-format-diff.py
2319

2420
- name: Run clang-format for the patch
21+
shell: bash {0}
2522
run: |
26-
git diff -U0 --no-color ${GITHUB_SHA}^1 ${GITHUB_SHA} -- | python clang-format-diff.py -p1 -binary clang-format-9 > ./clang-format.patch
23+
git clang-format ${GITHUB_SHA}^1
24+
git diff > ./clang-format.patch
25+
2726
# Add patch with formatting fixes to CI job artifacts
2827
- uses: actions/upload-artifact@v1
2928
with:

.gitignore

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -2,3 +2,4 @@
22
# External/*
33
/test-suite-externals
44
*.pyc
5+
/build*

SYCL/AOT/accelerator.cpp

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1,12 +1,12 @@
1-
//==--- accelerator.cpp - AOT compilation for fpga devices using aoc ------==//
1+
//=-- accelerator.cpp - compilation for fpga emulator dev using opencl-aot --=//
22
//
33
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
44
// See https://llvm.org/LICENSE.txt for license information.
55
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
66
//
77
//===---------------------------------------------------------------------===//
88

9-
// REQUIRES: aoc, accelerator
9+
// REQUIRES: opencl-aot, accelerator
1010

1111
// RUN: %clangxx -fsycl -fsycl-targets=spir64_fpga %S/Inputs/aot.cpp -o %t.out
1212
// RUN: %ACC_RUN_PLACEHOLDER %t.out

SYCL/AOT/multiple-devices.cpp

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -6,7 +6,7 @@
66
//
77
//===----------------------------------------------------------------------===//
88

9-
// REQUIRES: opencl-aot, ocloc, aoc, cpu, gpu, accelerator
9+
// REQUIRES: opencl-aot, ocloc, cpu, gpu, accelerator
1010
// UNSUPPORTED: cuda
1111
// CUDA is not compatible with SPIR.
1212

SYCL/Assert/assert_in_kernels.cpp

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,7 +1,7 @@
11
// REQUIRES: linux
22
// FIXME unsupported on CUDA and HIP until fallback libdevice becomes available
33
// UNSUPPORTED: cuda || hip
4-
// RUN: %clangxx -DSYCL_ENABLE_FALLBACK_ASSERT -fsycl -fsycl-targets=%sycl_triple %s -o %t.out
4+
// RUN: %clangxx -DSYCL_FALLBACK_ASSERT=1 -fsycl -fsycl-targets=%sycl_triple %s -o %t.out
55
// RUN: %CPU_RUN_PLACEHOLDER %t.out &> %t.txt || true
66
// RUN: %CPU_RUN_PLACEHOLDER FileCheck %s --input-file %t.txt
77
// RUN: %GPU_RUN_PLACEHOLDER %t.out &> %t.txt || true

SYCL/Assert/assert_in_kernels_win.cpp

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,6 @@
11
// REQUIRES: windows
22
// UNSUPPORTED: cuda || hip
3-
// RUN: %clangxx -DSYCL_ENABLE_FALLBACK_ASSERT -fsycl -fsycl-targets=%sycl_triple %s -o %t.out
3+
// RUN: %clangxx -DSYCL_FALLBACK_ASSERT=1 -fsycl -fsycl-targets=%sycl_triple %s -o %t.out
44
// RUN: %CPU_RUN_PLACEHOLDER %t.out &> %t.txt || true
55
// RUN: %CPU_RUN_PLACEHOLDER FileCheck %s --input-file %t.txt
66
// RUN: %GPU_RUN_PLACEHOLDER %t.out &> %t.txt || true

SYCL/Assert/assert_in_multiple_tus.cpp

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,7 +1,7 @@
11
// REQUIRES: linux
22
// FIXME unsupported on CUDA and HIP until fallback libdevice becomes available
33
// UNSUPPORTED: cuda || hip
4-
// RUN: %clangxx -DSYCL_ENABLE_FALLBACK_ASSERT -fsycl -fsycl-targets=%sycl_triple -I %S/Inputs %s %S/Inputs/kernels_in_file2.cpp -o %t.out
4+
// RUN: %clangxx -DSYCL_FALLBACK_ASSERT=1 -fsycl -fsycl-targets=%sycl_triple -I %S/Inputs %s %S/Inputs/kernels_in_file2.cpp -o %t.out
55
// RUN: %CPU_RUN_PLACEHOLDER %t.out &> %t.txt || true
66
// RUN: %CPU_RUN_PLACEHOLDER FileCheck %s --input-file %t.txt
77
// RUN: %GPU_RUN_PLACEHOLDER %t.out &> %t.txt || true

SYCL/Assert/assert_in_multiple_tus_one_ndebug.cpp

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,7 +1,7 @@
11
// REQUIRES: linux
22
// FIXME unsupported on CUDA and HIP until fallback libdevice becomes available
33
// UNSUPPORTED: cuda || hip
4-
// RUN: %clangxx -DSYCL_ENABLE_FALLBACK_ASSERT -fsycl -fsycl-targets=%sycl_triple -DDEFINE_NDEBUG_INFILE2 -I %S/Inputs %S/assert_in_multiple_tus.cpp %S/Inputs/kernels_in_file2.cpp -o %t.out
4+
// RUN: %clangxx -DSYCL_FALLBACK_ASSERT=1 -fsycl -fsycl-targets=%sycl_triple -DDEFINE_NDEBUG_INFILE2 -I %S/Inputs %S/assert_in_multiple_tus.cpp %S/Inputs/kernels_in_file2.cpp -o %t.out
55
// RUN: %CPU_RUN_PLACEHOLDER %t.out &> %t.txt || true
66
// RUN: %CPU_RUN_PLACEHOLDER FileCheck %s --input-file %t.txt
77
// RUN: %GPU_RUN_PLACEHOLDER %t.out &> %t.txt || true

SYCL/Assert/assert_in_multiple_tus_one_ndebug_win.cpp

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,6 @@
11
// REQUIRES: windows
22
// UNSUPPORTED: cuda || hip
3-
// RUN: %clangxx -DSYCL_ENABLE_FALLBACK_ASSERT -fsycl -fsycl-targets=%sycl_triple -DDEFINE_NDEBUG_INFILE2 -I %S/Inputs %S/assert_in_multiple_tus.cpp %S/Inputs/kernels_in_file2.cpp -o %t.out
3+
// RUN: %clangxx -DSYCL_FALLBACK_ASSERT=1 -fsycl -fsycl-targets=%sycl_triple -DDEFINE_NDEBUG_INFILE2 -I %S/Inputs %S/assert_in_multiple_tus.cpp %S/Inputs/kernels_in_file2.cpp -o %t.out
44
// RUN: %CPU_RUN_PLACEHOLDER %t.out &> %t.txt || true
55
// RUN: %CPU_RUN_PLACEHOLDER FileCheck %s --input-file %t.txt
66
// RUN: %GPU_RUN_PLACEHOLDER %t.out &> %t.txt || true

SYCL/Assert/assert_in_multiple_tus_win.cpp

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,6 @@
11
// REQUIRES: windows
22
// UNSUPPORTED: cuda || hip
3-
// RUN: %clangxx -DSYCL_ENABLE_FALLBACK_ASSERT -fsycl -fsycl-targets=%sycl_triple -I %S/Inputs %s %S/Inputs/kernels_in_file2.cpp -o %t.out
3+
// RUN: %clangxx -DSYCL_FALLBACK_ASSERT=1 -fsycl -fsycl-targets=%sycl_triple -I %S/Inputs %s %S/Inputs/kernels_in_file2.cpp -o %t.out
44
// RUN: %CPU_RUN_PLACEHOLDER %t.out &> %t.txt || true
55
// RUN: %CPU_RUN_PLACEHOLDER FileCheck %s --input-file %t.txt
66
// RUN: %GPU_RUN_PLACEHOLDER %t.out &> %t.txt || true

SYCL/Assert/assert_in_one_kernel.cpp

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,7 +1,7 @@
11
// REQUIRES: linux
22
// FIXME unsupported on CUDA and HIP until fallback libdevice becomes available
33
// UNSUPPORTED: cuda || hip
4-
// RUN: %clangxx -DSYCL_ENABLE_FALLBACK_ASSERT -fsycl -fsycl-targets=%sycl_triple %s -o %t.out
4+
// RUN: %clangxx -DSYCL_FALLBACK_ASSERT=1 -fsycl -fsycl-targets=%sycl_triple %s -o %t.out
55
// RUN: %CPU_RUN_PLACEHOLDER %t.out &> %t.txt || true
66
// RUN: %CPU_RUN_PLACEHOLDER FileCheck %s --input-file %t.txt
77
// RUN: %GPU_RUN_PLACEHOLDER %t.out &> %t.txt || true

SYCL/Assert/assert_in_one_kernel_win.cpp

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,6 @@
11
// REQUIRES: windows
22
// UNSUPPORTED: cuda || hip
3-
// RUN: %clangxx -DSYCL_ENABLE_FALLBACK_ASSERT -fsycl -fsycl-targets=%sycl_triple %s -o %t.out
3+
// RUN: %clangxx -DSYCL_FALLBACK_ASSERT=1 -fsycl -fsycl-targets=%sycl_triple %s -o %t.out
44
// RUN: %CPU_RUN_PLACEHOLDER %t.out &> %t.txt || true
55
// RUN: %CPU_RUN_PLACEHOLDER FileCheck %s --input-file %t.txt
66
// RUN: %GPU_RUN_PLACEHOLDER %t.out &> %t.txt || true

SYCL/Assert/assert_in_simultaneous_kernels.cpp

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,7 +1,7 @@
11
// REQUIRES: linux
22
// FIXME unsupported on CUDA and HIP until fallback libdevice becomes available
33
// UNSUPPORTED: cuda || hip
4-
// RUN: %clangxx -DSYCL_ENABLE_FALLBACK_ASSERT -fsycl -fsycl-targets=%sycl_triple %s -o %t.out %threads_lib
4+
// RUN: %clangxx -DSYCL_FALLBACK_ASSERT=1 -fsycl -fsycl-targets=%sycl_triple %s -o %t.out %threads_lib
55
// RUN: %CPU_RUN_PLACEHOLDER %t.out &> %t.txt || true
66
// RUN: %CPU_RUN_PLACEHOLDER FileCheck %s --input-file %t.txt
77
//

SYCL/Assert/assert_in_simultaneous_kernels_win.cpp

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,6 @@
11
// REQUIRES: windows
22
// UNSUPPORTED: cuda || hip
3-
// RUN: %clangxx -DSYCL_ENABLE_FALLBACK_ASSERT -fsycl -fsycl-targets=%sycl_triple %s -o %t.out %threads_lib
3+
// RUN: %clangxx -DSYCL_FALLBACK_ASSERT=1 -fsycl -fsycl-targets=%sycl_triple %s -o %t.out %threads_lib
44
// RUN: %CPU_RUN_PLACEHOLDER %t.out &> %t.txt || true
55
// RUN: %CPU_RUN_PLACEHOLDER FileCheck %s --input-file %t.txt
66
//

SYCL/Assert/assert_in_simultaneously_multiple_tus.cpp

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,6 @@
11
// FIXME unsupported on CUDA and HIP until fallback libdevice becomes available
22
// UNSUPPORTED: cuda || hip
3-
// RUN: %clangxx -DSYCL_ENABLE_FALLBACK_ASSERT -fsycl -fsycl-targets=%sycl_triple -I %S/Inputs %s %S/Inputs/kernels_in_file2.cpp -o %t.out %threads_lib
3+
// RUN: %clangxx -DSYCL_FALLBACK_ASSERT=1 -fsycl -fsycl-targets=%sycl_triple -I %S/Inputs %s %S/Inputs/kernels_in_file2.cpp -o %t.out %threads_lib
44
// RUN: %CPU_RUN_PLACEHOLDER %t.out &> %t.txt || true
55
// RUN: %CPU_RUN_PLACEHOLDER FileCheck %s --input-file %t.txt
66
//

SYCL/Assert/assert_in_simultaneously_multiple_tus_one_ndebug.cpp

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,6 @@
11
// FIXME unsupported on CUDA and HIP until fallback libdevice becomes available
22
// UNSUPPORTED: cuda || hip
3-
// RUN: %clangxx -DSYCL_ENABLE_FALLBACK_ASSERT -fsycl -fsycl-targets=%sycl_triple -DDEFINE_NDEBUG_INFILE2 -I %S/Inputs %S/assert_in_simultaneously_multiple_tus.cpp %S/Inputs/kernels_in_file2.cpp -o %t.out %threads_lib
3+
// RUN: %clangxx -DSYCL_FALLBACK_ASSERT=1 -fsycl -fsycl-targets=%sycl_triple -DDEFINE_NDEBUG_INFILE2 -I %S/Inputs %S/assert_in_simultaneously_multiple_tus.cpp %S/Inputs/kernels_in_file2.cpp -o %t.out %threads_lib
44
// RUN: %CPU_RUN_PLACEHOLDER %t.out &> %t.txt || true
55
// RUN: %CPU_RUN_PLACEHOLDER FileCheck %s --input-file %t.txt
66
//

SYCL/AtomicRef/add.cpp

Lines changed: 5 additions & 37 deletions
Original file line numberDiff line numberDiff line change
@@ -1,44 +1,12 @@
1-
// RUN: %clangxx -fsycl -fsycl-unnamed-lambda -fsycl-targets=%sycl_triple %s -o %t.out \
2-
// RUN: -Xsycl-target-backend=nvptx64-nvidia-cuda --cuda-gpu-arch=sm_60
1+
// See https://github.com/intel/llvm-test-suite/issues/867 for detailed status
2+
// UNSUPPORTED: hip
3+
4+
// RUN: %clangxx -fsycl -fsycl-unnamed-lambda -fsycl-device-code-split=per_kernel -fsycl-targets=%sycl_triple %s -o %t.out -Xsycl-target-backend=nvptx64-nvidia-cuda --cuda-gpu-arch=sm_70
35
// RUN: %HOST_RUN_PLACEHOLDER %t.out
46
// RUN: %GPU_RUN_PLACEHOLDER %t.out
57
// RUN: %CPU_RUN_PLACEHOLDER %t.out
68
// RUN: %ACC_RUN_PLACEHOLDER %t.out
79

810
#include "add.h"
9-
#include <iostream>
10-
using namespace sycl;
11-
12-
// Floating-point types do not support pre- or post-increment
13-
template <> void add_test<float>(queue q, size_t N) {
14-
add_fetch_test<::sycl::ext::oneapi::atomic_ref,
15-
access::address_space::global_space, float>(q, N);
16-
add_fetch_test<::sycl::atomic_ref, access::address_space::global_space,
17-
float>(q, N);
18-
add_plus_equal_test<::sycl::ext::oneapi::atomic_ref,
19-
access::address_space::global_space, float>(q, N);
20-
add_plus_equal_test<::sycl::atomic_ref, access::address_space::global_space,
21-
float>(q, N);
22-
}
23-
24-
int main() {
25-
queue q;
26-
27-
constexpr int N = 32;
28-
add_test<int>(q, N);
29-
add_test<unsigned int>(q, N);
30-
add_test<float>(q, N);
31-
32-
// Include long tests if they are 32 bits wide
33-
if constexpr (sizeof(long) == 4) {
34-
add_test<long>(q, N);
35-
add_test<unsigned long>(q, N);
36-
}
37-
38-
// Include pointer tests if they are 32 bits wide
39-
if constexpr (sizeof(char *) == 4) {
40-
add_test<char *, ptrdiff_t>(q, N);
41-
}
4211

43-
std::cout << "Test passed." << std::endl;
44-
}
12+
int main() { add_test_all<access::address_space::global_space>(); }

0 commit comments

Comments
 (0)