@@ -62,8 +62,6 @@ class __copyAcc2Acc;
62
62
namespace cl {
63
63
namespace sycl {
64
64
65
- namespace csd = cl::sycl::detail;
66
-
67
65
// Forward declaration
68
66
69
67
template <typename T, int Dimensions, typename AllocatorT> class buffer ;
@@ -106,7 +104,7 @@ template <typename Name, typename Type> struct get_kernel_name_t {
106
104
};
107
105
108
106
/// Specialization for the case when \c Name is left unspecified (auto_name): the kernel type itself is used as the name.
109
- template <typename Type> struct get_kernel_name_t <csd ::auto_name, Type> {
107
+ template <typename Type> struct get_kernel_name_t <detail ::auto_name, Type> {
110
108
using name = Type;
111
109
};
112
110
@@ -409,9 +407,9 @@ class handler {
409
407
break ;
410
408
case detail::CG::PREFETCH_USM:
411
409
CommandGroup.reset (new detail::CGPrefetchUSM (
412
- MDstPtr, MLength, std::move (MArgsStorage),
413
- std::move (MAccStorage ), std::move (MSharedPtrStorage ),
414
- std::move (MRequirements), std::move ( MEvents)));
410
+ MDstPtr, MLength, std::move (MArgsStorage), std::move (MAccStorage),
411
+ std::move (MSharedPtrStorage ), std::move (MRequirements ),
412
+ std::move (MEvents)));
415
413
break ;
416
414
case detail::CG::NONE:
417
415
throw runtime_error (" Command group submitted without a kernel or a "
@@ -666,7 +664,7 @@ class handler {
666
664
extractArgsAndReqsFromLambda (MHostKernel->getPtr (), KI::getNumParams (),
667
665
&KI::getParamDesc (0 ));
668
666
MKernelName = KI::getName ();
669
- MOSModuleHandle = csd ::OSUtil::getOSModuleHandle (KI::getName ());
667
+ MOSModuleHandle = detail ::OSUtil::getOSModuleHandle (KI::getName ());
670
668
} else {
671
669
// Without the integration header it is necessary to process the
672
670
// accessors from the list (which are associated with this handler) as
@@ -676,9 +674,10 @@ class handler {
676
674
}
677
675
678
676
// single_task version with a kernel represented as a lambda.
679
- template <typename KernelName = csd ::auto_name, typename KernelType>
677
+ template <typename KernelName = detail ::auto_name, typename KernelType>
680
678
void single_task (KernelType KernelFunc) {
681
- using NameT = typename csd::get_kernel_name_t <KernelName, KernelType>::name;
679
+ using NameT =
680
+ typename detail::get_kernel_name_t <KernelName, KernelType>::name;
682
681
#ifdef __SYCL_DEVICE_ONLY__
683
682
kernel_single_task<NameT>(KernelFunc);
684
683
#else
@@ -691,9 +690,11 @@ class handler {
691
690
692
691
// parallel_for version with a kernel represented as a lambda + range that
693
692
// specifies global size only.
694
- template <typename KernelName = csd::auto_name, typename KernelType, int Dims>
693
+ template <typename KernelName = detail::auto_name, typename KernelType,
694
+ int Dims>
695
695
void parallel_for (range<Dims> NumWorkItems, KernelType KernelFunc) {
696
- using NameT = typename csd::get_kernel_name_t <KernelName, KernelType>::name;
696
+ using NameT =
697
+ typename detail::get_kernel_name_t <KernelName, KernelType>::name;
697
698
#ifdef __SYCL_DEVICE_ONLY__
698
699
kernel_parallel_for<NameT, KernelType, Dims>(KernelFunc);
699
700
#else
@@ -708,17 +709,18 @@ class handler {
708
709
MNDRDesc.set (range<1 >{1 });
709
710
710
711
MArgs = std::move (MAssociatedAccesors);
711
- MHostKernel.reset (
712
- new detail::HostKernel<FuncT, void , 1 >(std::move (Func)));
712
+ MHostKernel.reset (new detail::HostKernel<FuncT, void , 1 >(std::move (Func)));
713
713
MCGType = detail::CG::RUN_ON_HOST_INTEL;
714
714
}
715
715
716
716
// parallel_for version with a kernel represented as a lambda + range and
717
717
// offset that specify global size and global offset respectively.
718
- template <typename KernelName = csd::auto_name, typename KernelType, int Dims>
718
+ template <typename KernelName = detail::auto_name, typename KernelType,
719
+ int Dims>
719
720
void parallel_for (range<Dims> NumWorkItems, id<Dims> WorkItemOffset,
720
721
KernelType KernelFunc) {
721
- using NameT = typename csd::get_kernel_name_t <KernelName, KernelType>::name;
722
+ using NameT =
723
+ typename detail::get_kernel_name_t <KernelName, KernelType>::name;
722
724
#ifdef __SYCL_DEVICE_ONLY__
723
725
kernel_parallel_for<NameT, KernelType, Dims>(KernelFunc);
724
726
#else
@@ -730,9 +732,11 @@ class handler {
730
732
731
733
// parallel_for version with a kernel represented as a lambda + nd_range that
732
734
// specifies global, local sizes and offset.
733
- template <typename KernelName = csd::auto_name, typename KernelType, int Dims>
735
+ template <typename KernelName = detail::auto_name, typename KernelType,
736
+ int Dims>
734
737
void parallel_for (nd_range<Dims> ExecutionRange, KernelType KernelFunc) {
735
- using NameT = typename csd::get_kernel_name_t <KernelName, KernelType>::name;
738
+ using NameT =
739
+ typename detail::get_kernel_name_t <KernelName, KernelType>::name;
736
740
#ifdef __SYCL_DEVICE_ONLY__
737
741
kernel_parallel_for<NameT, KernelType, Dims>(KernelFunc);
738
742
#else
@@ -742,10 +746,12 @@ class handler {
742
746
#endif
743
747
}
744
748
745
- template <typename KernelName = csd::auto_name, typename KernelType, int Dims>
749
+ template <typename KernelName = detail::auto_name, typename KernelType,
750
+ int Dims>
746
751
void parallel_for_work_group (range<Dims> NumWorkGroups,
747
752
KernelType KernelFunc) {
748
- using NameT = typename csd::get_kernel_name_t <KernelName, KernelType>::name;
753
+ using NameT =
754
+ typename detail::get_kernel_name_t <KernelName, KernelType>::name;
749
755
#ifdef __SYCL_DEVICE_ONLY__
750
756
kernel_parallel_for_work_group<NameT, KernelType, Dims>(KernelFunc);
751
757
#else
@@ -755,11 +761,13 @@ class handler {
755
761
#endif // __SYCL_DEVICE_ONLY__
756
762
}
757
763
758
- template <typename KernelName = csd::auto_name, typename KernelType, int Dims>
764
+ template <typename KernelName = detail::auto_name, typename KernelType,
765
+ int Dims>
759
766
void parallel_for_work_group (range<Dims> NumWorkGroups,
760
767
range<Dims> WorkGroupSize,
761
768
KernelType KernelFunc) {
762
- using NameT = typename csd::get_kernel_name_t <KernelName, KernelType>::name;
769
+ using NameT =
770
+ typename detail::get_kernel_name_t <KernelName, KernelType>::name;
763
771
#ifdef __SYCL_DEVICE_ONLY__
764
772
kernel_parallel_for_work_group<NameT, KernelType, Dims>(KernelFunc);
765
773
#else
@@ -823,9 +831,10 @@ class handler {
823
831
// single_task version which takes two "kernels". One is a lambda, which is
824
832
// used if the device the queue is bound to is the host device. The second is a
825
833
// sycl::kernel, which is used otherwise.
826
- template <typename KernelName = csd ::auto_name, typename KernelType>
834
+ template <typename KernelName = detail ::auto_name, typename KernelType>
827
835
void single_task (kernel SyclKernel, KernelType KernelFunc) {
828
- using NameT = typename csd::get_kernel_name_t <KernelName, KernelType>::name;
836
+ using NameT =
837
+ typename detail::get_kernel_name_t <KernelName, KernelType>::name;
829
838
#ifdef __SYCL_DEVICE_ONLY__
830
839
kernel_single_task<NameT>(KernelFunc);
831
840
#else
@@ -842,10 +851,12 @@ class handler {
842
851
// parallel_for version which takes two "kernels". One is a lambda, which is
843
852
// used if the device the queue is bound to is the host device. The second is a
844
853
// sycl::kernel, used otherwise. The range argument specifies the global size.
845
- template <typename KernelName = csd::auto_name, typename KernelType, int Dims>
854
+ template <typename KernelName = detail::auto_name, typename KernelType,
855
+ int Dims>
846
856
void parallel_for (kernel SyclKernel, range<Dims> NumWorkItems,
847
857
KernelType KernelFunc) {
848
- using NameT = typename csd::get_kernel_name_t <KernelName, KernelType>::name;
858
+ using NameT =
859
+ typename detail::get_kernel_name_t <KernelName, KernelType>::name;
849
860
#ifdef __SYCL_DEVICE_ONLY__
850
861
kernel_parallel_for<NameT, KernelType, Dims>(KernelFunc);
851
862
#else
@@ -862,10 +873,12 @@ class handler {
862
873
// parallel_for version which takes two "kernels". One is a lambda, which is
863
874
// used if the device the queue is bound to is the host device. The second is a
864
875
// sycl::kernel, used otherwise. range and id specify global size and offset.
865
- template <typename KernelName = csd::auto_name, typename KernelType, int Dims>
876
+ template <typename KernelName = detail::auto_name, typename KernelType,
877
+ int Dims>
866
878
void parallel_for (kernel SyclKernel, range<Dims> NumWorkItems,
867
879
id<Dims> WorkItemOffset, KernelType KernelFunc) {
868
- using NameT = typename csd::get_kernel_name_t <KernelName, KernelType>::name;
880
+ using NameT =
881
+ typename detail::get_kernel_name_t <KernelName, KernelType>::name;
869
882
#ifdef __SYCL_DEVICE_ONLY__
870
883
kernel_parallel_for<NameT, KernelType, Dims>(KernelFunc);
871
884
#else
@@ -882,10 +895,12 @@ class handler {
882
895
// parallel_for version which takes two "kernels". One is a lambda, which is
883
896
// used if the device the queue is bound to is the host device. The second is a
884
897
// sycl::kernel, used otherwise. nd_range specifies global/local sizes and offset.
885
- template <typename KernelName = csd::auto_name, typename KernelType, int Dims>
898
+ template <typename KernelName = detail::auto_name, typename KernelType,
899
+ int Dims>
886
900
void parallel_for (kernel SyclKernel, nd_range<Dims> NDRange,
887
901
KernelType KernelFunc) {
888
- using NameT = typename csd::get_kernel_name_t <KernelName, KernelType>::name;
902
+ using NameT =
903
+ typename detail::get_kernel_name_t <KernelName, KernelType>::name;
889
904
#ifdef __SYCL_DEVICE_ONLY__
890
905
kernel_parallel_for<NameT, KernelType, Dims>(KernelFunc);
891
906
#else
@@ -905,10 +920,12 @@ class handler {
905
920
/// of the kernel. The same source kernel can be compiled multiple times,
906
921
/// yielding multiple kernel class objects accessible via the \c program class
907
922
/// interface.
908
- template <typename KernelName = csd::auto_name, typename KernelType, int Dims>
923
+ template <typename KernelName = detail::auto_name, typename KernelType,
924
+ int Dims>
909
925
void parallel_for_work_group (kernel SyclKernel, range<Dims> NumWorkGroups,
910
926
KernelType KernelFunc) {
911
- using NameT = typename csd::get_kernel_name_t <KernelName, KernelType>::name;
927
+ using NameT =
928
+ typename detail::get_kernel_name_t <KernelName, KernelType>::name;
912
929
#ifdef __SYCL_DEVICE_ONLY__
913
930
kernel_parallel_for_work_group<NameT, KernelType, Dims>(KernelFunc);
914
931
#else
@@ -921,11 +938,13 @@ class handler {
921
938
922
939
/// Two-kernel version of the \c parallel_for_work_group with group and local
923
940
/// range.
924
- template <typename KernelName = csd::auto_name, typename KernelType, int Dims>
941
+ template <typename KernelName = detail::auto_name, typename KernelType,
942
+ int Dims>
925
943
void parallel_for_work_group (kernel SyclKernel, range<Dims> NumWorkGroups,
926
944
range<Dims> WorkGroupSize,
927
945
KernelType KernelFunc) {
928
- using NameT = typename csd::get_kernel_name_t <KernelName, KernelType>::name;
946
+ using NameT =
947
+ typename detail::get_kernel_name_t <KernelName, KernelType>::name;
929
948
#ifdef __SYCL_DEVICE_ONLY__
930
949
kernel_parallel_for_work_group<NameT, KernelType, Dims>(KernelFunc);
931
950
#else
@@ -1083,7 +1102,7 @@ class handler {
1083
1102
// Shapes can be 1, 2 or 3 dimensional rectangles.
1084
1103
template <int Dims_Src, int Dims_Dst>
1085
1104
static bool IsCopyingRectRegionAvailable (const range<Dims_Src> Src,
1086
- const range<Dims_Dst> Dst) {
1105
+ const range<Dims_Dst> Dst) {
1087
1106
if (Dims_Src > Dims_Dst)
1088
1107
return false ;
1089
1108
for (size_t I = 0 ; I < Dims_Src; ++I)
@@ -1092,7 +1111,7 @@ class handler {
1092
1111
return true ;
1093
1112
}
1094
1113
1095
- // copy memory pointed by accessor to the memory pointed by another accessor
1114
+ // copy memory pointed by accessor to the memory pointed by another accessor
1096
1115
template <
1097
1116
typename T_Src, int Dims_Src, access::mode AccessMode_Src,
1098
1117
access::target AccessTarget_Src, typename T_Dst, int Dims_Dst,
@@ -1209,7 +1228,7 @@ class handler {
1209
1228
}
1210
1229
1211
1230
// Copy memory from the source to the destination.
1212
- void memcpy (void * Dest, const void * Src, size_t Count) {
1231
+ void memcpy (void * Dest, const void * Src, size_t Count) {
1213
1232
MSrcPtr = const_cast <void *>(Src);
1214
1233
MDstPtr = Dest;
1215
1234
MLength = Count;
0 commit comments