/*
 * Copyright (c) 2017 ARM Limited.
 *
 * SPDX-License-Identifier: MIT
 *
 * Permission is hereby granted, free of charge, to any person obtaining a copy
 * of this software and associated documentation files (the "Software"), to
 * deal in the Software without restriction, including without limitation the
 * rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
 * sell copies of the Software, and to permit persons to whom the Software is
 * furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in all
 * copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
 * SOFTWARE.
 */
24#ifndef __ARM_COMPUTE_NEPOOLINGLAYERKERNEL_H__
25#define __ARM_COMPUTE_NEPOOLINGLAYERKERNEL_H__
26
27#include "arm_compute/core/NEON/INEKernel.h"
28
29namespace arm_compute
30{
31class ITensor;
32
33/** Interface for the pooling layer kernel */
34class NEPoolingLayerKernel : public INEKernel
35{
36public:
37 /** Default constructor */
38 NEPoolingLayerKernel();
39 /** Prevent instances of this class from being copied (As this class contains pointers) */
40 NEPoolingLayerKernel(const NEPoolingLayerKernel &) = delete;
41 /** Prevent instances of this class from being copied (As this class contains pointers) */
42 NEPoolingLayerKernel &operator=(const NEPoolingLayerKernel &) = delete;
43 /** Allow instances of this class to be moved */
44 NEPoolingLayerKernel(NEPoolingLayerKernel &&) = default;
45 /** Allow instances of this class to be moved */
46 NEPoolingLayerKernel &operator=(NEPoolingLayerKernel &&) = default;
47 /** Default destructor */
48 ~NEPoolingLayerKernel() = default;
49 /** Set the input and output tensors.
50 *
Gian Marco Iodice16824302017-09-28 15:41:37 +010051 * @note QS8, QS16 and F16 are supported for pool sizes 2 and 3 only
52 *
Michalis Spyroubbd9fb92017-06-22 12:57:51 +010053 * @param[in] input Source tensor. Data types supported: QS8/QS16/F16/F32.
Anthony Barbier6ff3b192017-09-04 18:44:23 +010054 * @param[out] output Destination tensor. Data types supported: Same as @p input.
55 * @param[in] pool_info Contains pooling operation information described in @ref PoolingLayerInfo.
56 */
57 void configure(const ITensor *input, ITensor *output, const PoolingLayerInfo &pool_info);
Michalis Spyrouafa5d812017-11-30 14:25:57 +000058 /** Static function to check if given info will lead to a valid configuration of @ref NEPoolingLayerKernel
59 *
60 * @note QS8, QS16 and F16 are supported for pool sizes 2 and 3 only
61 *
62 * @param[in] input Source tensor. Data types supported: QS8/QS16/F16/F32.
63 * @param[in] output Destination tensor. Data types supported: Same as @p input.
64 * @param[in] pool_info Contains pooling operation information described in @ref PoolingLayerInfo.
65 *
66 * @return a status
67 */
68 static Status validate(const ITensorInfo *input, const ITensorInfo *output, const PoolingLayerInfo &pool_info);
Anthony Barbier6ff3b192017-09-04 18:44:23 +010069
70 // Inherited methods overridden:
Moritz Pflanzerc186b572017-09-07 09:48:04 +010071 void run(const Window &window, const ThreadInfo &info) override;
Anthony Barbier6ff3b192017-09-04 18:44:23 +010072 BorderSize border_size() const override;
73
74private:
75 /** Function to perform 2x2 pooling.
76 *
77 * @param[in] window_input Input region on which to execute the kernel.
78 * @param[in] window Output region on which to execute the kernel.
79 */
Georgios Pinitasadaae7e2017-10-30 15:56:32 +000080 template <PoolingType pooling_type, bool exclude_padding = false>
Anthony Barbier6ff3b192017-09-04 18:44:23 +010081 void pooling2_f32(const Window &window_input, const Window &window);
Pablo Tello0c34fe22017-06-26 17:17:42 +010082 /** Function to perform 2x2 pooling for float16_t.
83 *
84 * @param[in] window_input Input region on which to execute the kernel.
85 * @param[in] window Output region on which to execute the kernel.
86 */
Georgios Pinitasadaae7e2017-10-30 15:56:32 +000087 template <PoolingType pooling_type, bool exclude_padding = false>
Pablo Tello0c34fe22017-06-26 17:17:42 +010088 void pooling2_f16(const Window &window_input, const Window &window);
89
Anthony Barbier6ff3b192017-09-04 18:44:23 +010090 /** Function to perform 2x2 pooling for 8bit fixed point.
91 *
92 * @param[in] window_input Input region on which to execute the kernel.
93 * @param[in] window Output region on which to execute the kernel.
94 */
95 template <PoolingType pooling_type>
96 void pooling2_q8(const Window &window_input, const Window &window);
Michalis Spyroubbd9fb92017-06-22 12:57:51 +010097 /** Function to perform 2x2 pooling for 16bit fixed point.
98 *
99 * @param[in] window_input Input region on which to execute the kernel.
100 * @param[in] window Output region on which to execute the kernel.
101 */
102 template <PoolingType pooling_type>
103 void pooling2_q16(const Window &window_input, const Window &window);
Anthony Barbier6ff3b192017-09-04 18:44:23 +0100104 /** Function to perform 3x3 pooling.
105 *
106 * @param[in] window_input Input region on which to execute the kernel.
107 * @param[in] window Output region on which to execute the kernel.
108 */
Georgios Pinitasadaae7e2017-10-30 15:56:32 +0000109 template <PoolingType pooling_type, bool exclude_padding = false>
Anthony Barbier6ff3b192017-09-04 18:44:23 +0100110 void pooling3_f32(const Window &window_input, const Window &window);
Pablo Tello0c34fe22017-06-26 17:17:42 +0100111 /** Function to perform 3x3 pooling.
112 *
113 * @param[in] window_input Input region on which to execute the kernel.
114 * @param[in] window Output region on which to execute the kernel.
115 */
Georgios Pinitasadaae7e2017-10-30 15:56:32 +0000116 template <PoolingType pooling_type, bool exclude_padding = false>
Pablo Tello0c34fe22017-06-26 17:17:42 +0100117 void pooling3_f16(const Window &window_input, const Window &window);
Anthony Barbier6ff3b192017-09-04 18:44:23 +0100118 /** Function to perform 3x3 pooling for 8bit fixed point.
119 *
120 * @param[in] window_input Input region on which to execute the kernel.
121 * @param[in] window Output region on which to execute the kernel.
122 */
123 template <PoolingType pooling_type>
124 void pooling3_q8(const Window &window_input, const Window &window);
Michalis Spyroubbd9fb92017-06-22 12:57:51 +0100125 /** Function to perform 3x3 pooling for 16bit fixed point.
126 *
127 * @param[in] window_input Input region on which to execute the kernel.
128 * @param[in] window Output region on which to execute the kernel.
129 */
130 template <PoolingType pooling_type>
131 void pooling3_q16(const Window &window_input, const Window &window);
Michele Di Giorgio8af2dd62017-06-19 15:19:29 +0100132 /** Function to perform 7x7 pooling.
133 *
134 * @param[in] window_input Input region on which to execute the kernel.
135 * @param[in] window Output region on which to execute the kernel.
136 */
Georgios Pinitasadaae7e2017-10-30 15:56:32 +0000137 template <PoolingType pooling_type, bool exclude_padding = false>
Michele Di Giorgio8af2dd62017-06-19 15:19:29 +0100138 void pooling7_f32(const Window &window_input, const Window &window);
Gian Marco Iodice16824302017-09-28 15:41:37 +0100139 /** Function to perform NxN pooling.
140 *
141 * @param[in] window_input Input region on which to execute the kernel.
142 * @param[in] window Output region on which to execute the kernel.
143 */
Georgios Pinitasadaae7e2017-10-30 15:56:32 +0000144 template <PoolingType pooling_type, bool exclude_padding = false>
Gian Marco Iodice16824302017-09-28 15:41:37 +0100145 void poolingN_f32(const Window &window_input, const Window &window);
Anthony Barbier6ff3b192017-09-04 18:44:23 +0100146 /** Common signature for all the specialised Pooling functions
147 *
148 * @param[in] window_input Input region on which to execute the kernel.
149 * @param[in] window Output region on which to execute the kernel.
150 */
151 using PoolingFunction = void (NEPoolingLayerKernel::*)(const Window &window_input, const Window &window);
152
153private:
154 PoolingFunction _func;
155 const ITensor *_input;
156 ITensor *_output;
157 PoolingLayerInfo _pool_info;
Michalis Spyrouafa5d812017-11-30 14:25:57 +0000158 unsigned int _num_elems_processed_per_iteration;
Anthony Barbier6ff3b192017-09-04 18:44:23 +0100159 BorderSize _border_size;
160};
Gian Marco Iodice356f6432017-09-22 11:32:21 +0100161} // namespace arm_compute
Anthony Barbier6ff3b192017-09-04 18:44:23 +0100162#endif /*__ARM_COMPUTE_NEPOOLINGLAYERKERNEL_H__ */