2 // Copyright (c) 2019 Intel Corporation
4 // Licensed under the Apache License, Version 2.0 (the "License");
5 // you may not use this file except in compliance with the License.
6 // You may obtain a copy of the License at
8 // http://www.apache.org/licenses/LICENSE-2.0
10 // Unless required by applicable law or agreed to in writing, software
11 // distributed under the License is distributed on an "AS IS" BASIS,
12 // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13 // See the License for the specific language governing permissions and
14 // limitations under the License.
17 #include "reverse_sequence_inst.h"
18 #include "primitive_gpu_base.h"
19 #include "implementation_map.h"
20 #include "kernel_selector_helper.h"
21 #include "reverse_sequence/reverse_sequence_kernel_selector.h"
22 #include "reverse_sequence/reverse_sequence_kernel_ref.h"
23 #include "error_handler.h"
25 using namespace cldnn;
27 namespace cldnn { namespace gpu
29 struct reverse_sequence_gpu : typed_primitive_gpu_impl<reverse_sequence>
31 using parent = typed_primitive_gpu_impl<reverse_sequence>;
36 static primitive_impl* create(const reverse_sequence_node& arg)
38 auto reverse_sequence_params = get_default_params<kernel_selector::reverse_sequence_params>(arg);
39 auto reverse_sequence_optional_params = get_default_optional_params<kernel_selector::reverse_sequence_optional_params>(arg.get_program());
41 reverse_sequence_params.seq_axis = arg.get_primitive()->seq_axis;
42 reverse_sequence_params.batch_axis = arg.get_primitive()->batch_axis;
44 reverse_sequence_params.inputs.push_back(convert_data_tensor(arg.input(1).get_output_layout()));
46 auto& kernel_selector = kernel_selector::reverse_sequence_kernel_selector::Instance();
47 auto best_kernels = kernel_selector.GetBestKernels(reverse_sequence_params, reverse_sequence_optional_params);
49 CLDNN_ERROR_BOOL(arg.id(), "Best_kernel.empty()", best_kernels.empty(), "Cannot find a proper kernel with this arguments");
51 auto reverse_sequence = new reverse_sequence_gpu(arg, best_kernels[0]);
53 return reverse_sequence;
63 auto val_fw = reverse_sequence_gpu::create;
64 implementation_map<reverse_sequence>::add(std::make_tuple(engine_types::ocl, data_types::f32, format::bfyx), val_fw);
65 implementation_map<reverse_sequence>::add(std::make_tuple(engine_types::ocl, data_types::f16, format::bfyx), val_fw);