Skip to content
This repository was archived by the owner on Mar 28, 2023. It is now read-only.

Commit 0ede881

Browse files
committed
format
Signed-off-by: JackAKirk <[email protected]>
1 parent 5ea081a commit 0ede881

File tree

3 files changed

+6
-6
lines changed

3 files changed

+6
-6
lines changed

SYCL/Matrix/element_wise_all_ops_cuda.cpp

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -6,6 +6,7 @@
66
//
77
//===----------------------------------------------------------------------===//
88
// REQUIRES: cuda
9+
910
// RUN: %clangxx -fsycl -fsycl-targets=%sycl_triple -Xsycl-target-backend --cuda-gpu-arch=sm_80 -DSYCL_EXT_ONEAPI_MATRIX=3 %s -o %t.out
1011
// RUN: %t.out
1112

SYCL/Matrix/element_wise_wi_marray.cpp

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -6,6 +6,7 @@
66
//
77
//===----------------------------------------------------------------------===//
88
// REQUIRES: cuda
9+
910
// RUN: %clangxx -fsycl -fsycl-targets=%sycl_triple -Xsycl-target-backend --cuda-gpu-arch=sm_80 -DSYCL_EXT_ONEAPI_MATRIX=3 %s -o %t.out
1011
// RUN: %t.out
1112

@@ -26,7 +27,7 @@ template <typename T, size_t M, size_t K> void verify_wi_marray(queue q) {
2627

2728
cgh.parallel_for<class marray_kernel>(
2829
nd_range<2>({1, 1 * SG_SZ}, {1, 1 * SG_SZ}),
29-
[ERR](nd_item<2> spmd_item)[[sycl::reqd_sub_group_size(SG_SZ)]] {
30+
[ERR](nd_item<2> spmd_item) [[sycl::reqd_sub_group_size(SG_SZ)]] {
3031
auto sg = spmd_item.get_sub_group();
3132

3233
joint_matrix<T, matrix_use::a, M, K> sub_a;
@@ -47,8 +48,7 @@ template <typename T, size_t M, size_t K> void verify_wi_marray(queue q) {
4748
}
4849
}
4950
}); // parallel for
50-
})
51-
.wait();
51+
}).wait();
5252
}
5353
assert(err == 0);
5454
}

SYCL/Matrix/joint_matrix_tensorcore.cpp

Lines changed: 2 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,4 @@
11
// REQUIRES: cuda
2-
32
// RUN: %clangxx -fsycl -fsycl-targets=%sycl_triple -Xsycl-target-backend --cuda-gpu-arch=sm_80 -DSYCL_EXT_ONEAPI_MATRIX=3 %s -o %t.out
43
// RUN: %t.out
54
//
@@ -68,8 +67,8 @@ T2 matrix_ref_mn(const int &m, const int &n, T1 *A, T1 *B, T2 *C) {
6867
res += make_fp32(A[m * Big_K + k]) * make_fp32(B[k * Big_N + n]);
6968
} else if constexpr (std::is_same<T1, bfloat16>::value) {
7069
for (int k = 0; k < Big_K; k++)
71-
res += make_fp32(A[m * Big_K + k].raw()) *
72-
make_fp32(B[k * Big_N + n].raw());
70+
res +=
71+
make_fp32(A[m * Big_K + k].raw()) * make_fp32(B[k * Big_N + n].raw());
7372
} else {
7473
for (int k = 0; k < Big_K; k++)
7574

0 commit comments

Comments
 (0)