Publishing 2019 R1 content
[platform/upstream/dldt.git] / inference-engine / thirdparty / clDNN / src / gpu / depth_to_space_gpu.cpp
1 /*
2 // Copyright (c) 2019 Intel Corporation
3 //
4 // Licensed under the Apache License, Version 2.0 (the "License");
5 // you may not use this file except in compliance with the License.
6 // You may obtain a copy of the License at
7 //
8 //      http://www.apache.org/licenses/LICENSE-2.0
9 //
10 // Unless required by applicable law or agreed to in writing, software
11 // distributed under the License is distributed on an "AS IS" BASIS,
12 // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13 // See the License for the specific language governing permissions and
14 // limitations under the License.
15 */
16
17 #include "depth_to_space_inst.h"
18 #include "primitive_gpu_base.h"
19 #include "implementation_map.h"
20 #include "kernel_selector_helper.h"
21 #include "depth_to_space/depth_to_space_kernel_selector.h"
22 #include "depth_to_space/depth_to_space_kernel_ref.h"
23 #include "error_handler.h"
24
25 using namespace cldnn;
26
27 namespace cldnn
28 {
29     namespace gpu
30     {
31         struct depth_to_space_gpu : typed_primitive_gpu_impl<depth_to_space>
32         {
33             using parent = typed_primitive_gpu_impl<depth_to_space>;
34             using parent::parent;
35
36         public:
37
38             static primitive_impl* create(const depth_to_space_node& arg)
39             {
40                 auto depth_to_space_params = get_default_params<kernel_selector::depth_to_space_params>(arg);
41                 auto depth_to_space_optional_params =
42                         get_default_optional_params<kernel_selector::depth_to_space_optional_params>(arg.get_program());
43
44                 depth_to_space_params.block_size = arg.get_primitive()->block_size;
45
46                 auto& kernel_selector = kernel_selector::depth_to_space_kernel_selector::Instance();
47                 auto best_kernels = kernel_selector.GetBestKernels(depth_to_space_params, depth_to_space_optional_params);
48
49                 CLDNN_ERROR_BOOL(arg.id(), "Best_kernel.empty()", best_kernels.empty(), "Cannot find a proper kernel with this arguments");
50
51                 auto depth_to_space = new depth_to_space_gpu(arg, best_kernels[0]);
52
53                 return depth_to_space;
54             }
55         };
56
57         namespace
58         {
59             struct attach
60             {
61                 attach()
62                 {
63                     auto val_fw = depth_to_space_gpu::create;
64                     implementation_map<depth_to_space>::add(std::make_tuple(engine_types::ocl, data_types::f32, format::bfyx), val_fw);
65                     implementation_map<depth_to_space>::add(std::make_tuple(engine_types::ocl, data_types::f16, format::bfyx), val_fw);
66                 }
67                 ~attach() = default;
68             };
69             attach attach_impl;
70         }
71     } //namespace gpu
72 } //namespace cldnn