blob: a3786db5b7c2f024ecb14364585e0253fc28be8e [file] [log] [blame]
/*
 * Copyright (c) 2016-2020 Arm Limited.
 *
 * SPDX-License-Identifier: MIT
 *
 * Permission is hereby granted, free of charge, to any person obtaining a copy
 * of this software and associated documentation files (the "Software"), to
 * deal in the Software without restriction, including without limitation the
 * rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
 * sell copies of the Software, and to permit persons to whom the Software is
 * furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in all
 * copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
 * SOFTWARE.
 */
Michalis Spyrouf4643372019-11-29 16:17:13 +000024#ifndef ARM_COMPUTE_NESCALEKERNEL_H
25#define ARM_COMPUTE_NESCALEKERNEL_H
Anthony Barbier6ff3b192017-09-04 18:44:23 +010026
Sang-Hoon Parkc2617982020-05-20 22:13:47 +010027#include "arm_compute/core/KernelDescriptors.h"
Michalis Spyrouebcebf12020-10-21 00:04:14 +010028#include "src/core/NEON/INEKernel.h"
Anthony Barbier6ff3b192017-09-04 18:44:23 +010029
30namespace arm_compute
31{
32class ITensor;
33
34/** NEON kernel to perform scaling on a tensor */
35class NEScaleKernel : public INEKernel
36{
37public:
Anthony Barbiere8a49832018-01-18 10:04:05 +000038 const char *name() const override
39 {
40 return "NEScaleKernel";
41 }
Anthony Barbier6ff3b192017-09-04 18:44:23 +010042 /** Default constructor */
43 NEScaleKernel();
44 /** Prevent instances of this class from being copied (As this class contains pointers) */
45 NEScaleKernel(const NEScaleKernel &) = delete;
46 /** Prevent instances of this class from being copied (As this class contains pointers) */
47 NEScaleKernel &operator=(const NEScaleKernel &) = delete;
48 /** Allow instances of this class to be moved */
49 NEScaleKernel(NEScaleKernel &&) = default;
50 /** Allow instances of this class to be moved */
51 NEScaleKernel &operator=(NEScaleKernel &&) = default;
52 /** Default destructor */
53 ~NEScaleKernel() = default;
54
55 /** Initialise the kernel's inputs, output and interpolation policy
56 *
57 * @note dx, dy and offsets have the same dimensions (width and height) of the output tensor
George Wort05398a92019-01-25 15:38:33 +000058 * @note Using @p policy Area only supports data layout NCHW and input data type U8.
Anthony Barbier6ff3b192017-09-04 18:44:23 +010059 *
Sang-Hoon Parkc2617982020-05-20 22:13:47 +010060 * @param[in] input Source tensor. Data types supported: QASYMM8/QASYMM8_SIGNED/U8/S16/F16/F32.
61 * @param[in] dx Pixel's distance between the X real coordinate and the smallest X following integer. Data type supported: F32
62 * @param[in] dy Pixel's distance between the Y real coordinate and the smallest Y following integer. Data type supported: F32
63 * @param[in] offsets Offset to access the pixel with NEAREST interpolation or the top-left pixel with BILINEAR interpolation in the input tensor. Data type supported: S32.
64 * @param[out] output Destination tensor. Data types supported: Same as @p input. All but the lowest two dimensions must be the same size as in the input tensor, i.e. scaling is only performed within the XY-plane.
65 * @param[in] info @ref ScaleKernelInfo to use for configuration
Anthony Barbier6ff3b192017-09-04 18:44:23 +010066 */
Georgios Pinitas393fa4c2018-05-08 15:54:53 +010067 void configure(const ITensor *input, const ITensor *dx, const ITensor *dy, const ITensor *offsets, ITensor *output,
Sang-Hoon Parkc2617982020-05-20 22:13:47 +010068 const ScaleKernelInfo &info);
Georgios Pinitas20b43132018-05-14 16:05:23 +010069 /** Static function to check if given info will lead to a valid configuration of @ref NEScaleKernel
70 *
71 * @note dx, dy and offsets have the same dimensions (width and height) of the output tensor
George Wort05398a92019-01-25 15:38:33 +000072 * @note Using @p policy Area only supports data layout NCHW and input data type U8.
Georgios Pinitas20b43132018-05-14 16:05:23 +010073 *
Sang-Hoon Parkc2617982020-05-20 22:13:47 +010074 * @param[in] input Source tensor. Data types supported: QASYMM8/QASYMM8_SIGNED/U8/S16/F16/F32.
75 * @param[in] dx Pixel's distance between the X real coordinate and the smallest X following integer. Data type supported: F32
76 * @param[in] dy Pixel's distance between the Y real coordinate and the smallest Y following integer. Data type supported: F32
77 * @param[in] offsets Offset to access the pixel with NEAREST interpolation or the top-left pixel with BILINEAR interpolation in the input tensor. Data type supported: S32.
78 * @param[in] output Destination tensor. Data types supported: Same as @p input. All but the lowest two dimensions must be the same size as in the input tensor, i.e. scaling is only performed within the XY-plane.
79 * @param[in] info @ref ScaleKernelInfo to use for validation
Georgios Pinitas20b43132018-05-14 16:05:23 +010080 */
81 static Status validate(const ITensorInfo *input, const ITensorInfo *dx, const ITensorInfo *dy, const ITensorInfo *offsets, ITensorInfo *output,
Sang-Hoon Parkc2617982020-05-20 22:13:47 +010082 const ScaleKernelInfo &info);
Anthony Barbier6ff3b192017-09-04 18:44:23 +010083
84 // Inherited methods overridden:
Moritz Pflanzerc186b572017-09-07 09:48:04 +010085 void run(const Window &window, const ThreadInfo &info) override;
Anthony Barbier6ff3b192017-09-04 18:44:23 +010086
87private:
Anthony Barbier6ff3b192017-09-04 18:44:23 +010088 /** function to perform scale using area interpolation on the given window
89 *
90 * @note Used only in case down-sampling.
91 */
Manuel Bottinifc2f6d02020-08-26 16:28:38 +010092 void scale_area_nchw_u8(const Window &window);
Anthony Barbier6ff3b192017-09-04 18:44:23 +010093
Manuel Bottinifc2f6d02020-08-26 16:28:38 +010094 /** function to perform scale using bilinear interpolation on the given window */
95 template <typename T>
96 void scale_bilinear_nchw(const Window &window);
97 /** function to perform scale using bilinear interpolation on the given window */
98 template <typename T>
99 void scale_bilinear_nhwc(const Window &window);
100 /** function to perform scale using bilinear interpolation on the given window */
101 template <typename T>
102 void scale_bilinear_qasymm(const Window &window);
103
104 /** function to perform scale using nearest neighbour on the given window */
105 template <typename T>
106 void scale_nearest_nchw(const Window &window);
107 /** function to perform scale using nearest neighbour on the given window */
108 template <typename T>
109 void scale_nearest_nhwc(const Window &window);
110
111 /** Scale function to use for the particular function to use */
112 using ScaleFunctionPtr = void (NEScaleKernel::*)(const Window &window);
113
114 ScaleFunctionPtr _func;
Georgios Pinitas393fa4c2018-05-08 15:54:53 +0100115 const ITensor *_offsets;
116 const ITensor *_dx;
117 const ITensor *_dy;
118 const ITensor *_input;
119 ITensor *_output;
120 InterpolationPolicy _policy;
Georgios Pinitas393fa4c2018-05-08 15:54:53 +0100121 BorderMode _border_mode;
George Wort05398a92019-01-25 15:38:33 +0000122 PixelValue _constant_border_value;
Vidhya Sudhan Loganathan3ac2f3a2019-01-17 15:16:19 +0000123 float _sampling_offset;
Sang-Hoon Parkbb123bd2020-01-03 10:57:30 +0000124 bool _align_corners;
Anthony Barbier6ff3b192017-09-04 18:44:23 +0100125};
Gian Marco Iodice356f6432017-09-22 11:32:21 +0100126} // namespace arm_compute
Michalis Spyrouf4643372019-11-29 16:17:13 +0000127#endif /*ARM_COMPUTE_NESCALEKERNEL_H */