1 // This file is part of OpenCV project.
2 // It is subject to the license terms in the LICENSE file found in the top-level directory
3 // of this distribution and at http://opencv.org/license.html.
5 #ifndef OPENCV_DNN_SRC_CUDA4DNN_PRIMITIVES_PERMUTE_HPP
6 #define OPENCV_DNN_SRC_CUDA4DNN_PRIMITIVES_PERMUTE_HPP
8 #include "../../op_cuda.hpp"
10 #include "../csl/stream.hpp"
11 #include "../csl/tensor_ops.hpp"
13 #include "../kernels/permute.hpp"
15 #include <opencv2/core.hpp>
21 namespace cv { namespace dnn { namespace cuda4dnn {
// CUDA backend node that, for every input/output pair, either runs
// kernels::permute with the stored `order` or copies the input to the output.
// NOTE(review): `T` used below is not declared on any visible line; presumably
// it is a template parameter of this class -- confirm.
24 class PermuteOp final : public CUDABackendNode {
// Concrete wrapper type that the generic BackendWrapper pointers are cast to.
26 using wrapper_type = GetCUDABackendWrapperType<T>;
// Takes the stream and the order by value and moves both into the members.
28 PermuteOp(csl::Stream stream_, std::vector<std::size_t> order_)
29 : stream(std::move(stream_)), order(std::move(order_)) { }
// Parameters of an overriding member function (its name is not on a visible
// line). inputs[i] is processed together with outputs[i]; `workspace` is not
// referenced by any visible statement.
32 const std::vector<cv::Ptr<BackendWrapper>>& inputs,
33 const std::vector<cv::Ptr<BackendWrapper>>& outputs,
34 csl::Workspace& workspace) override
// Walk over all inputs by index so the same index can select the output.
// NOTE(review): `int i` is compared against the unsigned result of size();
// consider std::size_t for the index.
36 for (int i = 0; i < inputs.size(); i++)
// Downcast the generic wrapper and obtain the input's view.
38 auto input_wrapper = inputs[i].dynamicCast<wrapper_type>();
39 auto input = input_wrapper->getView();
// Same for the output, but obtain a span instead of a view.
41 auto output_wrapper = outputs[i].dynamicCast<wrapper_type>();
42 auto output = output_wrapper->getSpan();
// Lambda capturing by reference that scans `order`; the remainder of its body
// is not visible here. Presumably it reports whether `order` differs from the
// identity ordering -- TODO confirm.
44 auto needsPermute = [&] {
// NOTE(review): this `i` shadows the outer loop index `i`, and is again an
// int compared against an unsigned size().
45 for (int i = 0; i < order.size(); i++)
// Permute path: write `input` rearranged according to `order` into `output`
// on `stream`.
53 kernels::permute(stream, output, input, order);
// Copy path: the copy is skipped when input.get() and output.get() compare
// equal (presumably both then refer to the same memory -- confirm).
57 if (input.get() != output.get())
58 csl::tensor_ops::copy(stream, output, input);
// Ordering passed to kernels::permute; fixed at construction.
65 std::vector<std::size_t> order;
68 }}} /* namespace cv::dnn::cuda4dnn */
70 #endif /* OPENCV_DNN_SRC_CUDA4DNN_PRIMITIVES_PERMUTE_HPP */