/*
 * Copyright (c) 2016-2021 Arm Limited.
 *
 * SPDX-License-Identifier: MIT
 *
 * Permission is hereby granted, free of charge, to any person obtaining a copy
 * of this software and associated documentation files (the "Software"), to
 * deal in the Software without restriction, including without limitation the
 * rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
 * sell copies of the Software, and to permit persons to whom the Software is
 * furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in all
 * copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
 * SOFTWARE.
 */
24#ifndef ARM_COMPUTE_CPU_SCALEKERNEL_H
25#define ARM_COMPUTE_CPU_SCALEKERNEL_H
26
27#include "arm_compute/core/KernelDescriptors.h"
28#include "src/core/common/Macros.h"
29#include "src/core/cpu/ICpuKernel.h"
30
31namespace arm_compute
32{
33namespace cpu
34{
35namespace kernels
36{
37/** Arm(R) Neon(TM) kernel to perform scaling on a tensor */
38class CpuScaleKernel : public ICpuKernel
39{
40public:
41 /** Default constructor */
42 CpuScaleKernel();
43 ARM_COMPUTE_DISALLOW_COPY_ALLOW_MOVE(CpuScaleKernel);
44 /** Initialise the kernel's inputs, output and interpolation policy
45 *
46 * @note dx, dy and offsets have the same dimensions (width and height) of the output tensor
47 * @note Using @p policy Area only supports data layout NCHW and input data type U8.
48 *
49 * @param[in] src Source tensor info. Data types supported: QASYMM8/QASYMM8_SIGNED/U8/S16/F16/F32.
50 * @param[in] dx Distance x tensor info. Pixel's distance between the X real coordinate and the smallest X following integer. Data type supported: F32
51 * @param[in] dy Distance y tensor info. Pixel's distance between the Y real coordinate and the smallest Y following integer. Data type supported: F32
52 * @param[in] offsets Offset tensor info. Offset to access the pixel with NEAREST interpolation or the top-left pixel with BILINEAR interpolation in the input tensor. Data type supported: S32.
53 * @param[out] dst Destination tensor info. Data types supported: Same as @p input. All but the lowest two dimensions must be the same size as in the input tensor, i.e. scaling is only performed within the XY-plane.
54 * @param[in] info @ref ScaleKernelInfo to use for configuration
55 */
56 void configure(const ITensorInfo *src, const ITensorInfo *dx, const ITensorInfo *dy, const ITensorInfo *offsets, ITensorInfo *dst,
57 const ScaleKernelInfo &info);
58 /** Static function to check if given info will lead to a valid configuration of @ref CpuScaleKernel
59 *
60 * @note dx, dy and offsets have the same dimensions (width and height) of the output tensor
61 * @note Using @p policy Area only supports data layout NCHW and input data type U8.
62 *
63 * @param[in] src Source tensor. Data types supported: QASYMM8/QASYMM8_SIGNED/U8/S16/F16/F32.
64 * @param[in] dx Distance x tensor info. Pixel's distance between the X real coordinate and the smallest X following integer. Data type supported: F32
65 * @param[in] dy Distance y tensor info. Pixel's distance between the Y real coordinate and the smallest Y following integer. Data type supported: F32
66 * @param[in] offsets Offset tensor info. Offset to access the pixel with NEAREST interpolation or the top-left pixel with BILINEAR interpolation in the input tensor. Data type supported: S32.
67 * @param[in] dst Destination tensor info. Data types supported: Same as @p input. All but the lowest two dimensions must be the same size as in the input tensor, i.e. scaling is only performed within the XY-plane.
68 * @param[in] info @ref ScaleKernelInfo to use for validation
69 */
70 static Status validate(const ITensorInfo *src, const ITensorInfo *dx, const ITensorInfo *dy, const ITensorInfo *offsets, ITensorInfo *dst,
71 const ScaleKernelInfo &info);
72
73 // Inherited methods overridden:
74 void run_op(ITensorPack &tensors, const Window &window, const ThreadInfo &info) override;
75 const char *name() const override;
76
77private:
78#ifdef ENABLE_NCHW_KERNELS
79 /** function to perform scale using area interpolation on the given window
80 *
81 * @note Used only in case down-sampling.
82 */
83 void scale_area_nchw_u8(const ITensor *src, ITensor *dst, const ITensor *dx, const ITensor *dy, const ITensor *offsets, const Window &window);
84
85 /** function to perform scale using bilinear interpolation on the given window */
86 template <typename T>
87 void scale_bilinear_nchw(const ITensor *src, ITensor *dst, const ITensor *dx, const ITensor *dy, const ITensor *offsets, const Window &window);
88 /** function to perform scale using bilinear interpolation on the given window */
89 template <typename T>
90 void scale_bilinear_qasymm(const ITensor *src, ITensor *dst, const ITensor *dx, const ITensor *dy, const ITensor *offsets, const Window &window);
91
92 /** function to perform scale using nearest neighbour on the given window */
93 template <typename T>
94 void scale_nearest_nchw(const ITensor *src, ITensor *dst, const ITensor *dx, const ITensor *dy, const ITensor *offsets, const Window &window);
95#endif // ENABLE_NCHW_KERNELS
96
97 /** Scale function to use for the particular function to use */
98 using ScaleFunctionPtr = void (CpuScaleKernel::*)(const ITensor *, ITensor *, const ITensor *, const ITensor *, const ITensor *, const Window &window);
99
100 ScaleFunctionPtr _func;
101 InterpolationPolicy _policy;
102 BorderMode _border_mode;
103 PixelValue _constant_border_value;
104 float _sampling_offset;
105 bool _align_corners;
106 DataLayout _data_layout;
107};
108} // namespace kernels
109} // namespace cpu
110} // namespace arm_compute
111#endif /*ARM_COMPUTE_CPU_SCALEKERNEL_H */