Compute Library: arm_compute/runtime/NEON/functions/NEFullyConnectedLayer.h Source File

 /*

  * Copyright (c) 2017 ARM Limited.

  *

  * SPDX-License-Identifier: MIT

  *

  * Permission is hereby granted, free of charge, to any person obtaining a copy

  * of this software and associated documentation files (the "Software"), to

  * deal in the Software without restriction, including without limitation the

  * rights to use, copy, modify, merge, publish, distribute, sublicense, and/or

  * sell copies of the Software, and to permit persons to whom the Software is

  * furnished to do so, subject to the following conditions:

  *

  * The above copyright notice and this permission notice shall be included in all

  * copies or substantial portions of the Software.

  *

  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR

  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,

  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE

  * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER

  * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,

  * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE

  * SOFTWARE.

  */

 #ifndef __ARM_COMPUTE_NEFULLYCONNECTEDLAYER_H__

 #define __ARM_COMPUTE_NEFULLYCONNECTEDLAYER_H__


 #include "arm_compute/runtime/IFunction.h"


 #include "arm_compute/core/NEON/kernels/NEGEMMInterleave4x4Kernel.h"

 #include "arm_compute/core/NEON/kernels/NEGEMMMatrixAccumulateBiasesKernel.h"

 #include "arm_compute/core/NEON/kernels/NEGEMMMatrixMultiplyKernel.h"

 #include "arm_compute/core/NEON/kernels/NEGEMMTranspose1xWKernel.h"

 #include "arm_compute/core/NEON/kernels/NEIm2ColKernel.h"

 #include "arm_compute/core/NEON/kernels/NETransposeKernel.h"

 #include "arm_compute/runtime/MemoryGroup.h"

 #include "arm_compute/runtime/Tensor.h"


 namespace arm_compute

 {

 /** Basic function to reshape the weights of Fully Connected layer with NEON.
  *
  * The function holds one NETransposeKernel (transposes the elements of a matrix) and one
  * NEGEMMTranspose1xWKernel (transposes the elements of a matrix in chunks of 1xW).
  *
  * NOTE(review): which of the two kernels actually runs is presumably selected by the
  * @p transpose_weights and @p is_batched_fc_layer flags passed to configure() - confirm in the .cpp.
  */
 class NEFullyConnectedLayerReshapeWeights : public IFunction

 {

 public:

     /** Constructor.
      *
      * @param[in] memory_manager (Optional) Shared handle to a memory manager. Defaults to nullptr.
      *                           NOTE(review): presumably used to back _memory_group - confirm in the .cpp.
      */
     NEFullyConnectedLayerReshapeWeights(std::shared_ptr<IMemoryManager> memory_manager = nullptr);

     /** Set the input and output tensors.
      *
      * @param[in]  input               Source tensor (read-only); the weights to be reshaped.
      * @param[out] output              Destination tensor.
      * @param[in]  transpose_weights   NOTE(review): presumably true if the weights must be transposed - confirm.
      * @param[in]  is_batched_fc_layer NOTE(review): presumably true if the fully connected layer processes a batch of inputs - confirm.
      */
     void configure(const ITensor *input, ITensor *output, bool transpose_weights, bool is_batched_fc_layer);


     // Inherited methods overridden:

     /** Run the kernels contained in the function. */
     void run() override;


 private:

     MemoryGroup              _memory_group;        /**< Memory group owned by this function */

     NETransposeKernel        _transpose_kernel;    /**< NEON kernel which transposes the elements of a matrix */

     NEGEMMTranspose1xWKernel _transpose1xW_kernel; /**< NEON kernel which transposes a matrix in chunks of 1xW */

     Tensor                   _transpose_output;    /**< NOTE(review): presumably the intermediate result of _transpose_kernel - confirm */

     bool                     _transpose_weights;   /**< NOTE(review): presumably caches the configure() argument of the same name - confirm */

     bool                     _is_batched_fc_layer; /**< NOTE(review): presumably caches the configure() argument of the same name - confirm */

 };


 /** Basic function to compute a Fully Connected layer on NEON.
  *
  * The function holds the following building blocks as members:
  *  -# NEIm2ColKernel (im2col reshape kernel)
  *  -# NEFullyConnectedLayerReshapeWeights (reshapes the weights of the Fully Connected layer)
  *  -# NEGEMMInterleave4x4Kernel (interleaves the elements of a matrix)
  *  -# NEGEMMMatrixMultiplyKernel (multiplies two input matrices "A" and "B")
  *  -# NEGEMMMatrixAccumulateBiasesKernel (adds a bias to each row of the input tensor)
  *
  * NOTE(review): which of these are executed for a given configuration is decided in the .cpp,
  * presumably based on the boolean members below - confirm.
  */
 class NEFullyConnectedLayer : public IFunction

 {

 public:

     /** Constructor.
      *
      * @param[in] memory_manager (Optional) Shared handle to a memory manager. Defaults to nullptr.
      *                           NOTE(review): presumably used to back _memory_group - confirm in the .cpp.
      */
     NEFullyConnectedLayer(std::shared_ptr<IMemoryManager> memory_manager = nullptr);

     /** Set the input and output tensors.
      *
      * @param[in]  input                Source tensor (read-only).
      * @param[in]  weights              Weights tensor (read-only).
      * @param[in]  biases               Bias tensor (read-only). NOTE(review): whether nullptr is accepted is not visible here - confirm.
      * @param[out] output               Destination tensor.
      * @param[in]  transpose_weights    (Optional) Defaults to true. NOTE(review): presumably requests a transpose of @p weights - confirm.
      * @param[in]  are_weights_reshaped (Optional) Defaults to false. NOTE(review): presumably signals that @p weights were already reshaped by the caller - confirm.
      */
     void configure(const ITensor *input, const ITensor *weights, const ITensor *biases, ITensor *output, bool transpose_weights = true, bool are_weights_reshaped = false);


     // Inherited methods overridden:

     /** Run the kernels contained in the function. */
     void run() override;


 private:

     MemoryGroup                         _memory_group;             /**< Memory group owned by this function */

     NEIm2ColKernel                      _im2col_kernel;            /**< im2col reshape kernel */

     NEFullyConnectedLayerReshapeWeights _reshape_weights_kernel;   /**< Function (not a kernel, despite the name) that reshapes the weights */

     NEGEMMInterleave4x4Kernel           _interleave4x4_kernel;     /**< NEON kernel to interleave the elements of a matrix */

     NEGEMMMatrixMultiplyKernel          _mm_kernel;                /**< NEON kernel to multiply two input matrices */

     NEGEMMMatrixAccumulateBiasesKernel  _accumulate_biases_kernel; /**< NEON kernel to add a bias to each row of the input tensor */

     Tensor                              _im2col_output;            /**< NOTE(review): presumably the intermediate result of _im2col_kernel - confirm */

     Tensor                              _interleave4x4_output;     /**< NOTE(review): presumably the intermediate result of _interleave4x4_kernel - confirm */

     Tensor                              _reshape_weights_output;   /**< NOTE(review): presumably the intermediate result of _reshape_weights_kernel - confirm */

     bool                                _are_weights_reshaped;     /**< NOTE(review): presumably caches the configure() argument of the same name - confirm */

     bool                                _is_batched_fc_layer;      /**< NOTE(review): presumably set in configure() when the layer is batched - confirm */

     bool                                _linearize_input;          /**< NOTE(review): presumably set when the input must go through im2col first - confirm */

     bool                                _accumulate_biases;        /**< NOTE(review): presumably set when a bias tensor has to be added - confirm */

 };

 }

 #endif /* __ARM_COMPUTE_NEFULLYCONNECTEDLAYER_H__ */

NEGEMMInterleave4x4Kernel.h

NEGEMMMatrixMultiplyKernel.h

arm_compute::IFunction
Base class for all functions.
Definition: IFunction.h:30

arm_compute::NEFullyConnectedLayerReshapeWeights
Basic function to reshape the weights of Fully Connected layer with NEON.
Definition: NEFullyConnectedLayer.h:47

arm_compute::NEFullyConnectedLayerReshapeWeights::configure
void configure(const ITensor *input, ITensor *output, bool transpose_weights, bool is_batched_fc_layer)
Set the input and output tensors.

arm_compute::NEIm2ColKernel
Interface for the im2col reshape kernel.
Definition: NEIm2ColKernel.h:57

arm_compute::NEFullyConnectedLayer::NEFullyConnectedLayer
NEFullyConnectedLayer(std::shared_ptr< IMemoryManager > memory_manager=nullptr)
Constructor.

arm_compute::NEFullyConnectedLayer::configure
void configure(const ITensor *input, const ITensor *weights, const ITensor *biases, ITensor *output, bool transpose_weights=true, bool are_weights_reshaped=false)
Set the input and output tensors.

arm_compute::ITensor
Interface for NEON tensor.
Definition: ITensor.h:36

NEGEMMTranspose1xWKernel.h

arm_compute::NEGEMMInterleave4x4Kernel
NEON kernel to interleave the elements of a matrix.
Definition: NEGEMMInterleave4x4Kernel.h:52

arm_compute::NETransposeKernel
NEON kernel which transposes the elements of a matrix.
Definition: NETransposeKernel.h:38

arm_compute::NEGEMMMatrixAccumulateBiasesKernel
NEON kernel to add a bias to each row of the input tensor.
Definition: NEGEMMMatrixAccumulateBiasesKernel.h:33

NETransposeKernel.h

arm_compute::NEGEMMTranspose1xWKernel
NEON kernel which transposes the elements of a matrix in chunks of 1xW, where W is equal to (16 / element size of the tensor).
Definition: NEGEMMTranspose1xWKernel.h:68

arm_compute::Tensor
Basic implementation of the tensor interface.
Definition: Tensor.h:37

arm_compute::NEFullyConnectedLayerReshapeWeights::run
void run() override
Run the kernels contained in the function.

MemoryGroup.h

arm_compute::NEFullyConnectedLayer
Basic function to compute a Fully Connected layer on NEON.
Definition: NEFullyConnectedLayer.h:82

arm_compute::MemoryGroupBase< Tensor >

NEGEMMMatrixAccumulateBiasesKernel.h

arm_compute::NEFullyConnectedLayer::run
void run() override
Run the kernels contained in the function.

arm_compute::NEFullyConnectedLayerReshapeWeights::NEFullyConnectedLayerReshapeWeights
NEFullyConnectedLayerReshapeWeights(std::shared_ptr< IMemoryManager > memory_manager=nullptr)
Constructor.

IFunction.h

NEIm2ColKernel.h

Tensor.h

arm_compute::NEGEMMMatrixMultiplyKernel
NEON kernel to multiply two input matrices "A" and "B".
Definition: NEGEMMMatrixMultiplyKernel.h:39