Moved full ctor to dedicated file

oleksandr-pavlyk · oleksandr-pavlyk · commit 40739b499bbc · 2022-10-07T12:49:44.000-05:00
diff --git a/dpctl/tensor/CMakeLists.txt b/dpctl/tensor/CMakeLists.txt
@@ -23,6 +23,7 @@ pybind11_add_module(${python_module_name} MODULE
     ${CMAKE_CURRENT_SOURCE_DIR}/libtensor/source/copy_numpy_ndarray_into_usm_ndarray.cpp
     ${CMAKE_CURRENT_SOURCE_DIR}/libtensor/source/copy_for_reshape.cpp
     ${CMAKE_CURRENT_SOURCE_DIR}/libtensor/source/linear_sequences.cpp
+    ${CMAKE_CURRENT_SOURCE_DIR}/libtensor/source/full_ctor.cpp
 )
 target_link_options(${python_module_name} PRIVATE -fsycl-device-code-split=per_kernel)
 target_include_directories(${python_module_name}
diff --git a/dpctl/tensor/libtensor/source/full_ctor.cpp b/dpctl/tensor/libtensor/source/full_ctor.cpp
@@ -0,0 +1,116 @@
+//===-- ------------ Implementation of _tensor_impl module  ----*-C++-*-/===//
+//
+//                      Data Parallel Control (dpctl)
+//
+// Copyright 2020-2022 Intel Corporation
+//
+// Licensed under the Apache License, Version 2.0 (the "License");
+// you may not use this file except in compliance with the License.
+// You may obtain a copy of the License at
+//
+//    http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing, software
+// distributed under the License is distributed on an "AS IS" BASIS,
+// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+// See the License for the specific language governing permissions and
+// limitations under the License.
+//
+//===--------------------------------------------------------------------===//
+///
+/// \file
+/// Defines usm_ndarray_full for the dpctl.tensor._tensor_impl extension
+//===--------------------------------------------------------------------===//
+
+#include "dpctl4pybind11.hpp"
+#include <CL/sycl.hpp>
+#include <complex>
+#include <pybind11/complex.h>
+#include <pybind11/pybind11.h>
+#include <utility>
+#include <vector>
+
+#include "kernels/constructors.hpp"
+#include "utils/strided_iters.hpp"
+#include "utils/type_dispatch.hpp"
+#include "utils/type_utils.hpp"
+
+#include "full_ctor.hpp"
+
+namespace py = pybind11;
+namespace _ns = dpctl::tensor::detail;
+
+namespace dpctl
+{
+namespace tensor
+{
+namespace py_internal
+{
+
+using dpctl::utils::keep_args_alive;
+
+using dpctl::tensor::kernels::constructors::full_contig_fn_ptr_t;
+
+// Fill routines indexed by type id; see init_full_ctor_dispatch_vectors().
+static full_contig_fn_ptr_t full_contig_dispatch_vector[_ns::num_types];
+
+// Fills `dst` with `py_value` using the routine selected by dst's type id,
+// which receives exec_q and depends. Returns {keep_args_alive event, fill
+// event}, or two default events if dst is empty. Throws py::value_error on
+// queue mismatch and std::runtime_error if dst is not contiguous.
+std::pair<sycl::event, sycl::event>
+usm_ndarray_full(py::object py_value,
+                 dpctl::tensor::usm_ndarray dst,
+                 sycl::queue exec_q,
+                 const std::vector<sycl::event> &depends)
+{
+    // py_value should be coercible into data type of dst
+    py::ssize_t dst_nelems = dst.get_size();
+
+    if (dst_nelems == 0) {
+        // nothing to do
+        return std::make_pair(sycl::event(), sycl::event());
+    }
+
+    sycl::queue dst_q = dst.get_queue();
+    if (!dpctl::utils::queues_are_compatible(exec_q, {dst_q})) {
+        throw py::value_error(
+            "Execution queue is not compatible with the allocation queue");
+    }
+
+    auto array_types = dpctl::tensor::detail::usm_ndarray_types();
+    int dst_typenum = dst.get_typenum();
+    int dst_typeid = array_types.typenum_to_lookup_id(dst_typenum);
+
+    char *dst_data = dst.get_data();
+
+    if (dst_nelems == 1 || dst.is_c_contiguous() || dst.is_f_contiguous()) {
+        auto fn = full_contig_dispatch_vector[dst_typeid];
+        sycl::event full_contig_event =
+            fn(exec_q, static_cast<size_t>(dst_nelems), py_value, dst_data,
+               depends);
+        return std::make_pair(
+            keep_args_alive(exec_q, {dst}, {full_contig_event}),
+            full_contig_event);
+    }
+    else {
+        throw std::runtime_error(
+            "Only population of contiguous usm_ndarray objects is supported.");
+    }
+}
+
+void init_full_ctor_dispatch_vectors(void)
+{
+    // Populate the table that usm_ndarray_full indexes by type id.
+    using namespace dpctl::tensor::detail;
+    using dpctl::tensor::kernels::constructors::FullContigFactory;
+    using table_builder_t =
+        DispatchVectorBuilder<full_contig_fn_ptr_t, FullContigFactory,
+                              num_types>;
+    table_builder_t table_builder;
+    table_builder.populate_dispatch_vector(full_contig_dispatch_vector);
+}
+
+} // namespace py_internal
+} // namespace tensor
+} // namespace dpctl
diff --git a/dpctl/tensor/libtensor/source/full_ctor.hpp b/dpctl/tensor/libtensor/source/full_ctor.hpp
@@ -0,0 +1,50 @@
+//===-- ------------ Implementation of _tensor_impl module  ----*-C++-*-/===//
+//
+//                      Data Parallel Control (dpctl)
+//
+// Copyright 2020-2022 Intel Corporation
+//
+// Licensed under the Apache License, Version 2.0 (the "License");
+// you may not use this file except in compliance with the License.
+// You may obtain a copy of the License at
+//
+//    http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing, software
+// distributed under the License is distributed on an "AS IS" BASIS,
+// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+// See the License for the specific language governing permissions and
+// limitations under the License.
+//
+//===--------------------------------------------------------------------===//
+///
+/// \file
+/// Declares usm_ndarray_full for the dpctl.tensor._tensor_impl extension
+//===--------------------------------------------------------------------===//
+
+#pragma once
+#include <CL/sycl.hpp>
+#include <utility>
+#include <vector>
+
+#include "dpctl4pybind11.hpp"
+#include <pybind11/pybind11.h>
+
+namespace dpctl
+{
+namespace tensor
+{
+namespace py_internal
+{
+
+// Fills `dst` with `py_value`; returns a pair of events (see full_ctor.cpp).
+std::pair<sycl::event, sycl::event> usm_ndarray_full(
+    py::object py_value, dpctl::tensor::usm_ndarray dst, sycl::queue exec_q,
+    const std::vector<sycl::event> &depends = {});
+
+// Populates the dispatch table that usm_ndarray_full indexes by type id.
+void init_full_ctor_dispatch_vectors(void);
+
+} // namespace py_internal
+} // namespace tensor
+} // namespace dpctl
diff --git a/dpctl/tensor/libtensor/source/tensor_py.cpp b/dpctl/tensor/libtensor/source/tensor_py.cpp
@@ -42,6 +42,7 @@
 #include "copy_and_cast_usm_to_usm.hpp"
 #include "copy_for_reshape.hpp"
 #include "copy_numpy_ndarray_into_usm_ndarray.hpp"
+#include "full_ctor.hpp"
 #include "linear_sequences.hpp"
 #include "simplify_iteration_space.hpp"
 
@@ -74,54 +75,7 @@ using dpctl::tensor::py_internal::usm_ndarray_linear_sequence_step;
 
 /* ================ Full ================== */
 
-using dpctl::tensor::kernels::constructors::full_contig_fn_ptr_t;
-
-static full_contig_fn_ptr_t full_contig_dispatch_vector[_ns::num_types];
-
-std::pair<sycl::event, sycl::event>
-usm_ndarray_full(py::object py_value,
-                 dpctl::tensor::usm_ndarray dst,
-                 sycl::queue exec_q,
-                 const std::vector<sycl::event> &depends = {})
-{
-    // start, end should be coercible into data type of dst
-
-    py::ssize_t dst_nelems = dst.get_size();
-
-    if (dst_nelems == 0) {
-        // nothing to do
-        return std::make_pair(sycl::event(), sycl::event());
-    }
-
-    sycl::queue dst_q = dst.get_queue();
-    if (!dpctl::utils::queues_are_compatible(exec_q, {dst_q})) {
-        throw py::value_error(
-            "Execution queue is not compatible with the allocation queue");
-    }
-
-    auto array_types = dpctl::tensor::detail::usm_ndarray_types();
-    int dst_typenum = dst.get_typenum();
-    int dst_typeid = array_types.typenum_to_lookup_id(dst_typenum);
-
-    char *dst_data = dst.get_data();
-    sycl::event full_event;
-
-    if (dst_nelems == 1 || dst.is_c_contiguous() || dst.is_f_contiguous()) {
-        auto fn = full_contig_dispatch_vector[dst_typeid];
-
-        sycl::event full_contig_event =
-            fn(exec_q, static_cast<size_t>(dst_nelems), py_value, dst_data,
-               depends);
-
-        return std::make_pair(
-            keep_args_alive(exec_q, {dst}, {full_contig_event}),
-            full_contig_event);
-    }
-    else {
-        throw std::runtime_error(
-            "Only population of contiguous usm_ndarray objects is supported.");
-    }
-}
+using dpctl::tensor::py_internal::usm_ndarray_full;
 
 /* ================ Eye ================== */
 
@@ -435,17 +389,13 @@ void init_dispatch_vectors(void)
 {
     dpctl::tensor::py_internal::init_copy_for_reshape_dispatch_vectors();
     dpctl::tensor::py_internal::init_linear_sequences_dispatch_vectors();
+    dpctl::tensor::py_internal::init_full_ctor_dispatch_vectors();
 
     using namespace dpctl::tensor::detail;
     using dpctl::tensor::kernels::constructors::EyeFactory;
-    using dpctl::tensor::kernels::constructors::FullContigFactory;
     using dpctl::tensor::kernels::constructors::TrilGenericFactory;
     using dpctl::tensor::kernels::constructors::TriuGenericFactory;
 
-    DispatchVectorBuilder<full_contig_fn_ptr_t, FullContigFactory, num_types>
-        dvb3;
-    dvb3.populate_dispatch_vector(full_contig_dispatch_vector);
-
     DispatchVectorBuilder<eye_fn_ptr_t, EyeFactory, num_types> dvb4;
     dvb4.populate_dispatch_vector(eye_dispatch_vector);
 

Original file line number	Diff line number	Diff line change
`@@ -23,6 +23,7 @@ pybind11_add_module(${python_module_name} MODULE`
`23`	`23`	`${CMAKE_CURRENT_SOURCE_DIR}/libtensor/source/copy_numpy_ndarray_into_usm_ndarray.cpp`
`24`	`24`	`${CMAKE_CURRENT_SOURCE_DIR}/libtensor/source/copy_for_reshape.cpp`
`25`	`25`	`${CMAKE_CURRENT_SOURCE_DIR}/libtensor/source/linear_sequences.cpp`
	`26`	`+ ${CMAKE_CURRENT_SOURCE_DIR}/libtensor/source/full_ctor.cpp`
`26`	`27`	`)`
`27`	`28`	`target_link_options(${python_module_name} PRIVATE -fsycl-device-code-split=per_kernel)`
`28`	`29`	`target_include_directories(${python_module_name}`