DPNP C++ backend kernel library 0.18.0dev1
Data Parallel Extension for NumPy*
Loading...
Searching...
No Matches
common.hpp
1//*****************************************************************************
2// Copyright (c) 2025, Intel Corporation
3// All rights reserved.
4//
5// Redistribution and use in source and binary forms, with or without
6// modification, are permitted provided that the following conditions are met:
7// - Redistributions of source code must retain the above copyright notice,
8// this list of conditions and the following disclaimer.
9// - Redistributions in binary form must reproduce the above copyright notice,
10// this list of conditions and the following disclaimer in the documentation
11// and/or other materials provided with the distribution.
12//
13// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
14// AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
15// IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
16// ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE
17// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
18// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
19// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
20// INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
21// CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
22// ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF
23// THE POSSIBILITY OF SUCH DAMAGE.
24//*****************************************************************************
25
26#pragma once
27
28#include <pybind11/pybind11.h>
29#include <pybind11/stl.h>
30#include <sycl/sycl.hpp>
31
32#include "dpctl4pybind11.hpp"
33#include "utils/output_validation.hpp"
34#include "utils/type_dispatch.hpp"
35#include "utils/type_utils.hpp"
36
37namespace dpnp::extensions::window
38{
39
40namespace dpctl_td_ns = dpctl::tensor::type_dispatch;
41
42namespace py = pybind11;
43
44typedef sycl::event (*window_fn_ptr_t)(sycl::queue &,
45 char *,
46 const std::size_t,
47 const std::vector<sycl::event> &);
48
49template <typename T, template <typename> class Functor>
50sycl::event window_impl(sycl::queue &q,
51 char *result,
52 const std::size_t nelems,
53 const std::vector<sycl::event> &depends)
54{
55 dpctl::tensor::type_utils::validate_type_for_device<T>(q);
56
57 T *res = reinterpret_cast<T *>(result);
58
59 sycl::event window_ev = q.submit([&](sycl::handler &cgh) {
60 cgh.depends_on(depends);
61
62 using WindowKernel = Functor<T>;
63 cgh.parallel_for<WindowKernel>(sycl::range<1>(nelems),
64 WindowKernel(res, nelems));
65 });
66
67 return window_ev;
68}
69
70template <typename funcPtrT>
71std::tuple<size_t, char *, funcPtrT>
72 window_fn(sycl::queue &exec_q,
73 const dpctl::tensor::usm_ndarray &result,
74 const funcPtrT *window_dispatch_vector)
75{
76 dpctl::tensor::validation::CheckWritable::throw_if_not_writable(result);
77
78 int nd = result.get_ndim();
79 if (nd != 1) {
80 throw py::value_error("Array should be 1d");
81 }
82
83 if (!dpctl::utils::queues_are_compatible(exec_q, {result.get_queue()})) {
84 throw py::value_error(
85 "Execution queue is not compatible with allocation queue.");
86 }
87
88 const bool is_result_c_contig = result.is_c_contiguous();
89 if (!is_result_c_contig) {
90 throw py::value_error("The result input array is not c-contiguous.");
91 }
92
93 size_t nelems = result.get_size();
94 if (nelems == 0) {
95 return std::make_tuple(nelems, nullptr, nullptr);
96 }
97
98 int result_typenum = result.get_typenum();
99 auto array_types = dpctl_td_ns::usm_ndarray_types();
100 int result_type_id = array_types.typenum_to_lookup_id(result_typenum);
101 funcPtrT fn = window_dispatch_vector[result_type_id];
102
103 if (fn == nullptr) {
104 throw std::runtime_error("Type of given array is not supported");
105 }
106
107 char *result_typeless_ptr = result.get_data();
108 return std::make_tuple(nelems, result_typeless_ptr, fn);
109}
110
111inline std::pair<sycl::event, sycl::event>
112 py_window(sycl::queue &exec_q,
113 const dpctl::tensor::usm_ndarray &result,
114 const std::vector<sycl::event> &depends,
115 const window_fn_ptr_t *window_dispatch_vector)
116{
117 auto [nelems, result_typeless_ptr, fn] =
118 window_fn<window_fn_ptr_t>(exec_q, result, window_dispatch_vector);
119
120 if (nelems == 0) {
121 return std::make_pair(sycl::event{}, sycl::event{});
122 }
123
124 sycl::event window_ev = fn(exec_q, result_typeless_ptr, nelems, depends);
125 sycl::event args_ev =
126 dpctl::utils::keep_args_alive(exec_q, {result}, {window_ev});
127
128 return std::make_pair(args_ev, window_ev);
129}
130
131template <typename funcPtrT,
132 template <typename fnT, typename T>
133 typename factoryT>
134void init_window_dispatch_vectors(funcPtrT window_dispatch_vector[])
135{
136 dpctl_td_ns::DispatchVectorBuilder<funcPtrT, factoryT,
137 dpctl_td_ns::num_types>
138 contig;
139 contig.populate_dispatch_vector(window_dispatch_vector);
140
141 return;
142}
143
144} // namespace dpnp::extensions::window