blob: 172ed8985a39fab33cd8aae86471982b313aaac6 [file] [log] [blame]
/*
 * Copyright (c) 2017-2019 ARM Limited.
 *
 * SPDX-License-Identifier: MIT
 *
 * Permission is hereby granted, free of charge, to any person obtaining a copy
 * of this software and associated documentation files (the "Software"), to
 * deal in the Software without restriction, including without limitation the
 * rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
 * sell copies of the Software, and to permit persons to whom the Software is
 * furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in all
 * copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
 * SOFTWARE.
 */
24#ifndef __ARM_COMPUTE_CLREDUCTIONOPERATIONKERNEL_H__
25#define __ARM_COMPUTE_CLREDUCTIONOPERATIONKERNEL_H__
26
27#include "arm_compute/core/CL/ICLKernel.h"
28#include "arm_compute/core/Types.h"
29
30namespace arm_compute
31{
32class ICLTensor;
33
Michele Di Giorgio9637b2e2019-09-23 16:49:49 +010034/** Interface for the reduction operation kernel
35 *
Sang-Hoon Parkeaa01ab2019-11-11 17:33:28 +000036 * @note For ARG_MIN/ARG_MAX reduction, the default data type for an uninitialized
37 * output tensor is signed 32-bit integer (S32). It is the user's responsibility
38 * to check that the results do not overflow because the indices are computed
39 * in unsigned 32-bit (U32).
Michele Di Giorgio9637b2e2019-09-23 16:49:49 +010040 */
Michalis Spyrou04f089c2017-08-08 17:42:38 +010041class CLReductionOperationKernel : public ICLKernel
42{
43public:
44 /** Default constructor */
45 CLReductionOperationKernel();
46 /** Prevent instances of this class from being copied (As this class contains pointers) */
47 CLReductionOperationKernel(const CLReductionOperationKernel &) = delete;
48 /** Prevent instances of this class from being copied (As this class contains pointers) */
49 CLReductionOperationKernel &operator=(const CLReductionOperationKernel &) = delete;
50 /** Allow instances of this class to be moved */
51 CLReductionOperationKernel(CLReductionOperationKernel &&) = default;
52 /** Allow instances of this class to be moved */
53 CLReductionOperationKernel &operator=(CLReductionOperationKernel &&) = default;
54 /** Default destructor */
55 ~CLReductionOperationKernel() = default;
56
57 /** Set the input and output tensors.
58 *
Michalis Spyroub9626ab2019-05-13 17:41:01 +010059 * @param[in] input Source tensor. Data types supported: QASYMM8/S32/F16/F32.
Michele Di Giorgio9637b2e2019-09-23 16:49:49 +010060 * @param[out] output Destination tensor. Data types and data layouts supported: Same as @p input, U32/S32 for ARG_MIX/ARG_MAX.
John Richardson62385bc2018-04-20 13:11:36 +010061 * Output will have the same number of dimensions as input.
Michalis Spyrou7e9391b2018-10-05 14:49:28 +010062 * @param[in] axis Axis along which to reduce. Supported reduction axis : 0,1,2,3
Michalis Spyrou04f089c2017-08-08 17:42:38 +010063 * @param[in] op Reduction operation to perform.
Michalis Spyrou7e9391b2018-10-05 14:49:28 +010064 * @param[in] width (Optional) In case of x-axis we also need to provide the width of the input image.
Michalis Spyrou04f089c2017-08-08 17:42:38 +010065 */
Michalis Spyrou7e9391b2018-10-05 14:49:28 +010066 void configure(const ICLTensor *input, ICLTensor *output, unsigned int axis, ReductionOperation op, unsigned int width = 0);
Michalis Spyrou04f089c2017-08-08 17:42:38 +010067
John Richardson62385bc2018-04-20 13:11:36 +010068 /** Static function to check if given info will lead to a valid configuration of @ref CLReductionOperationKernel.
69 *
Michalis Spyroub9626ab2019-05-13 17:41:01 +010070 * @param[in] input Source tensor info. Data types supported: QASYMM8/S32/F16/F32.
Michele Di Giorgio9637b2e2019-09-23 16:49:49 +010071 * @param[in] output Destination tensor info. Data types and data layouts supported: Same as @p input, U32/S32 for ARG_MIX/ARG_MAX.
John Richardson62385bc2018-04-20 13:11:36 +010072 * Output will have the same number of dimensions as input.
Michalis Spyrou7e9391b2018-10-05 14:49:28 +010073 * @param[in] axis Axis along which to reduce. Supported reduction axis : 0,1,2,3
John Richardson62385bc2018-04-20 13:11:36 +010074 * @param[in] op Reduction operation to perform.
Michalis Spyrou7e9391b2018-10-05 14:49:28 +010075 * @param[in] width (Optional) In case of x-axis we also need to provide the width of the input image.
John Richardson62385bc2018-04-20 13:11:36 +010076 *
77 * @return a status
78 */
Michalis Spyrou7e9391b2018-10-05 14:49:28 +010079 static Status validate(const ITensorInfo *input, const ITensorInfo *output, unsigned int axis, ReductionOperation op, unsigned int width = 0);
John Richardson62385bc2018-04-20 13:11:36 +010080
Michalis Spyrou04f089c2017-08-08 17:42:38 +010081 // Inherited methods overridden:
82 void run(const Window &window, cl::CommandQueue &queue) override;
83 BorderSize border_size() const override;
84
85private:
86 const ICLTensor *_input;
87 ICLTensor *_output;
88 unsigned int _reduction_axis;
89 ReductionOperation _op;
90 BorderSize _border_size;
91};
Gian Marco Iodicef670a0a2017-09-18 12:20:45 +010092} // namespace arm_compute
Michalis Spyrou04f089c2017-08-08 17:42:38 +010093#endif /*__ARM_COMPUTE_CLREDUCTIONOPERATIONKERNEL_H__ */