blob: 9fd0b4aaef9925a648e9b47dc600be29f7d4bbca [file] [log] [blame]
/*
 * Copyright (c) 2017-2021, 2023 Arm Limited.
 *
 * SPDX-License-Identifier: MIT
 *
 * Permission is hereby granted, free of charge, to any person obtaining a copy
 * of this software and associated documentation files (the "Software"), to
 * deal in the Software without restriction, including without limitation the
 * rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
 * sell copies of the Software, and to permit persons to whom the Software is
 * furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in all
 * copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
 * SOFTWARE.
 */
Michalis Spyrouf4643372019-11-29 16:17:13 +000024#ifndef ARM_COMPUTE_CLFULLYCONNECTEDLAYER_H
25#define ARM_COMPUTE_CLFULLYCONNECTEDLAYER_H
Anthony Barbier6ff3b192017-09-04 18:44:23 +010026
SiCong Li91295492023-07-21 18:16:13 +010027#include "arm_compute/function_info/FullyConnectedLayerInfo.h"
Anthony Barbier6ff3b192017-09-04 18:44:23 +010028#include "arm_compute/runtime/CL/CLTensor.h"
Felix Thomasmathibalanafd38f02023-09-27 17:46:17 +010029#include "arm_compute/runtime/IFunction.h"
Michalis Spyrou1a569a32019-09-10 17:20:34 +010030#include "arm_compute/runtime/IWeightsManager.h"
Georgios Pinitas26014cf2019-09-09 19:00:57 +010031#include "arm_compute/runtime/MemoryGroup.h"
Anthony Barbier6ff3b192017-09-04 18:44:23 +010032
33namespace arm_compute
34{
Anthony Barbier6ff3b192017-09-04 18:44:23 +010035/** Basic function to compute a Fully Connected layer on OpenCL. This function calls the following OpenCL kernels:
36 *
Manuel Bottinid844c082021-07-14 12:58:54 +010037 * -# @ref opencl::kernels::ClIm2ColKernel (called when the input comes from a convolutional layer)
Teresa Charlin68508892021-04-07 19:18:08 +010038 * -# @ref CLTranspose (if @p are_weights_reshaped is set to false and transpose_weights is set to true ) (called once)
Gian Marco Iodicec9cecc02021-10-15 10:23:24 +010039 * -# @ref opencl::ClGemm or @ref CLGEMMLowpMatrixMultiplyCore (if quantized asymmetric)
Anthony Barbier6ff3b192017-09-04 18:44:23 +010040 *
41 * @note The fully connected layer accepts "weights" tensors only with 2 dimensions.
42 */
43class CLFullyConnectedLayer : public IFunction
44{
45public:
46 /** Constructor */
Felix Thomasmathibalanafd38f02023-09-27 17:46:17 +010047 CLFullyConnectedLayer(std::shared_ptr<IMemoryManager> memory_manager = nullptr,
48 IWeightsManager *weights_manager = nullptr);
Georgios Pinitas529b5a22021-07-27 15:55:30 +010049 /** Default destructor */
50 ~CLFullyConnectedLayer();
Georgios Pinitas1562be32018-03-08 19:09:19 +000051 /** Prevent instances of this class from being copied (As this class contains pointers) */
52 CLFullyConnectedLayer(const CLFullyConnectedLayer &) = delete;
53 /** Default move constructor */
54 CLFullyConnectedLayer(CLFullyConnectedLayer &&) = default;
55 /** Prevent instances of this class from being copied (As this class contains pointers) */
56 CLFullyConnectedLayer &operator=(const CLFullyConnectedLayer &) = delete;
57 /** Default move assignment operator */
58 CLFullyConnectedLayer &operator=(CLFullyConnectedLayer &&) = default;
Anthony Barbier6ff3b192017-09-04 18:44:23 +010059 /** Set the input and output tensors.
60 *
Teresa Charlin62687422021-04-28 10:58:49 +010061 * Valid data layouts:
62 * - NHWC
63 * - NCHW
64 *
65 * Valid data type configurations:
66 * |src0 |src1 |src2 |dst |
67 * |:--------------|:------------------|:------|:--------------|
68 * |F16 |F16 |F16 |F16 |
69 * |F32 |F32 |F32 |F32 |
70 * |QASYMM8 |QASYMM8 |S32 |QASYMM8 |
71 * |QASYMM8_SIGNED |QASYMM8_SIGNED |S32 |QASYMM8_SIGNED |
72 *
Manuel Bottini2b84be52020-04-08 10:15:51 +010073 * @param[in] compile_context The compile context to be used.
74 * @param[in] input Source tensor. Data type supported: QASYMM8/QASYMM8_SIGNED/F16/F32.
75 * @param[in] weights Weights tensor. The weights must be 2 dimensional.
76 * If this function is called after a Convolution Layer, the (transposed) weights will have as many rows as the product of the first 3 input's dimensions.
77 * If it is called after another FullyConnected Layer, the (transposed) weights will have as many rows as the input's first dimension.
78 * Data type supported: Same as @p input.
79 * @param[in] biases Bias tensor. Can be nullptr. Data type supported:Same as @p input.
80 * @param[out] output Destination tensor. Its shape should be equal to the output of a matrix multiplication between:
81 * - The output of im2col on the input and the (transposed) 2D weights, if the function is called after a Convolution Layer
82 * - The input tensor and the (transposed) 2D weights, if the function is called after another FullyConnected Layer.
83 * Data type supported: Same as @p input.
84 * @param[in] fc_info (Optional) Fully connected layer additional info
85 */
Felix Thomasmathibalanafd38f02023-09-27 17:46:17 +010086 void configure(const CLCompileContext &compile_context,
87 const ICLTensor *input,
88 const ICLTensor *weights,
89 const ICLTensor *biases,
90 ICLTensor *output,
Manuel Bottini2b84be52020-04-08 10:15:51 +010091 FullyConnectedLayerInfo fc_info = FullyConnectedLayerInfo());
Georgios Pinitas529b5a22021-07-27 15:55:30 +010092 /** Set the input and output tensors.
93 *
94 * Similar to @ref CLFullyConnectedLayer
95 */
Felix Thomasmathibalanafd38f02023-09-27 17:46:17 +010096 void configure(const ICLTensor *input,
97 const ICLTensor *weights,
98 const ICLTensor *biases,
99 ICLTensor *output,
Georgios Pinitas529b5a22021-07-27 15:55:30 +0100100 FullyConnectedLayerInfo fc_info = FullyConnectedLayerInfo());
Georgios Pinitas358ca202017-12-07 16:47:52 +0000101 /** Static function to check if given info will lead to a valid configuration of @ref CLFullyConnectedLayer
102 *
Georgios Pinitas529b5a22021-07-27 15:55:30 +0100103 * Similar to @ref CLFullyConnectedLayer
Georgios Pinitas358ca202017-12-07 16:47:52 +0000104 *
105 * @return a status
106 */
Felix Thomasmathibalanafd38f02023-09-27 17:46:17 +0100107 static Status validate(const ITensorInfo *input,
108 const ITensorInfo *weights,
109 const ITensorInfo *biases,
110 const ITensorInfo *output,
Georgios Pinitas7d66a8e2018-07-17 12:28:42 +0100111 FullyConnectedLayerInfo fc_info = FullyConnectedLayerInfo());
Anthony Barbier6ff3b192017-09-04 18:44:23 +0100112
113 //Inherited methods override
114 void run() override;
Georgios Pinitase0437672018-05-02 14:07:55 +0100115 void prepare() override;
Anthony Barbier6ff3b192017-09-04 18:44:23 +0100116
117private:
Georgios Pinitas529b5a22021-07-27 15:55:30 +0100118 struct Impl;
119 std::unique_ptr<Impl> _impl;
Anthony Barbier6ff3b192017-09-04 18:44:23 +0100120};
Georgios Pinitas26014cf2019-09-09 19:00:57 +0100121} // namespace arm_compute
Michalis Spyrouf4643372019-11-29 16:17:13 +0000122#endif /* ARM_COMPUTE_CLFULLYCONNECTEDLAYER_H */