1 // Copyright (c) 2016 Intel Corporation
3 // Licensed under the Apache License, Version 2.0 (the "License");
4 // you may not use this file except in compliance with the License.
5 // You may obtain a copy of the License at
7 // http://www.apache.org/licenses/LICENSE-2.0
9 // Unless required by applicable law or agreed to in writing, software
10 // distributed under the License is distributed on an "AS IS" BASIS,
11 // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 // See the License for the specific language governing permissions and
13 // limitations under the License.
18 #include "fully_connected_kernel_base.h"
21 namespace kernel_selector {
// Fully connected kernel variant derived from FullyConnectedKernelBase.
// It overrides the base-class hooks declared below and adds a small
// tuning-data struct plus a helper that produces it.
23 class FullyConnectedKernelMMAD : public FullyConnectedKernelBase {
// Shorthand for the base class; used by the constructor below.
25 using Parent = FullyConnectedKernelBase;
// Forwards the string "fully_connected_gpu_MMAD" to the base-class constructor.
// NOTE(review): presumably this is the kernel name used to look up the
// kernel source - confirm against FullyConnectedKernelBase.
27 FullyConnectedKernelMMAD() : Parent("fully_connected_gpu_MMAD") {}
// Override: produces the KernelsData for the given params/options.
29 KernelsData GetKernelsData(const Params& params, const optional_params& options) const override;
// Override: returns the ParamsKey for this kernel.
// NOTE(review): presumably describes the supported configurations - confirm.
30 ParamsKey GetSupportedKey() const override;
// Tuning values for this kernel; returned by SetTuningParams().
32 struct FullyConnectedTuningData {
// Fixed at 8 (const member, cannot be reassigned after construction).
// NOTE(review): presumably the GPU sub-group width the kernel expects - confirm.
33 const size_t sub_group_size = 8;
// Defaults to 1.
// NOTE(review): presumably a divisor related to shared-local-memory use - TODO confirm.
34 size_t slm_div_factor = 1;
// Defaults to 1.
35 size_t work_group_size = 1;
// Override: builds the JIT constants from the kernel params and dispatch data.
39 JitConstants GetJitConstants(const fully_connected_params& params, const DispatchData& kd) const override;
// Override: computes the DispatchData for the given params.
// autoTuneIndex defaults to -1 here; its meaning is defined by the base class.
// NOTE(review): default arguments on virtual functions are selected by the
// static type at the call site, so keep this default in sync with the base
// declaration.
40 DispatchData SetDefault(const fully_connected_params& params, int autoTuneIndex = -1) const override;
// Override: reports the fused-operation types this kernel accepts.
// The returned list includes FusedOpType::QUANTIZE and FusedOpType::ACTIVATION.
41 std::vector<FusedOpType> GetSupportedFusedOps() const override {
42 return { FusedOpType::QUANTIZE,
44 FusedOpType::ACTIVATION };
// Override: returns whether the given params/options pass this kernel's validation.
46 bool Validate(const Params& params, const optional_params& options) const override;
// Non-virtual helper specific to this class: derives a FullyConnectedTuningData
// from the given fully connected params.
47 FullyConnectedTuningData SetTuningParams(const fully_connected_params& params) const;
49 } // namespace kernel_selector