blob: 52a09d9a49c2eb8c792c5f3d884ff39486b1c6bb [file] [log] [blame]
/*
 * Copyright (c) 2016-2020 ARM Limited.
 *
 * SPDX-License-Identifier: MIT
 *
 * Permission is hereby granted, free of charge, to any person obtaining a copy
 * of this software and associated documentation files (the "Software"), to
 * deal in the Software without restriction, including without limitation the
 * rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
 * sell copies of the Software, and to permit persons to whom the Software is
 * furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in all
 * copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
 * SOFTWARE.
 */
Michalis Spyrouf4643372019-11-29 16:17:13 +000024#ifndef ARM_COMPUTE_CLPIXELWISEMULTIPLICATIONKERNEL_H
25#define ARM_COMPUTE_CLPIXELWISEMULTIPLICATIONKERNEL_H
Anthony Barbier6ff3b192017-09-04 18:44:23 +010026
27#include "arm_compute/core/CL/ICLKernel.h"
28#include "arm_compute/core/Types.h"
29
30namespace arm_compute
31{
Georgios Pinitas8be91482019-03-26 17:23:28 +000032// Forward declarations
Anthony Barbier6ff3b192017-09-04 18:44:23 +010033class ICLTensor;
34
Georgios Pinitas8be91482019-03-26 17:23:28 +000035/** Interface for the pixelwise multiplication kernel. */
Anthony Barbier6ff3b192017-09-04 18:44:23 +010036class CLPixelWiseMultiplicationKernel : public ICLKernel
37{
38public:
39 /** Default constructor.*/
40 CLPixelWiseMultiplicationKernel();
Alex Gildayc357c472018-03-21 13:54:09 +000041 /** Prevent instances of this class from being copied (As this class contains pointers) */
Anthony Barbier6ff3b192017-09-04 18:44:23 +010042 CLPixelWiseMultiplicationKernel(const CLPixelWiseMultiplicationKernel &) = delete;
Alex Gildayc357c472018-03-21 13:54:09 +000043 /** Prevent instances of this class from being copied (As this class contains pointers) */
Anthony Barbier6ff3b192017-09-04 18:44:23 +010044 CLPixelWiseMultiplicationKernel &operator=(const CLPixelWiseMultiplicationKernel &) = delete;
45 /** Allow instances of this class to be moved */
46 CLPixelWiseMultiplicationKernel(CLPixelWiseMultiplicationKernel &&) = default;
47 /** Allow instances of this class to be moved */
48 CLPixelWiseMultiplicationKernel &operator=(CLPixelWiseMultiplicationKernel &&) = default;
49 /** Initialise the kernel's input, output and border mode.
50 *
Michele Di Giorgiocbbed282019-12-20 13:26:08 +000051 * @param[in] input1 An input tensor. Data types supported: U8/QASYMM8/QASYMM8_SIGNED/S16/QSYMM16/F16/F32.
Michele Di Giorgioab0a77e2017-06-21 15:36:24 +010052 * @param[in] input2 An input tensor. Data types supported: same as @p input1.
Michele Di Giorgio7a0212a2020-04-14 16:08:32 +010053 * @param[out] output The output tensor, Data types supported:
54 * - U8, only if both input are U8
55 * - QASYMM8, only if both inputs are QASYMM8
56 * - QASYMM8_SIGNED, only if both inputs are QASYMM8_SIGNED
57 * - S16
58 * - QSYMM16, only if both inputs are QSYMM16
59 * - S32, only if both inputs are QSYMM16
60 * - F16
61 * - F32
Anthony Barbier6ff3b192017-09-04 18:44:23 +010062 * @param[in] scale Scale to apply after multiplication.
Vidhya Sudhan Loganathan7485d5a2018-07-04 09:34:00 +010063 * Scale must be positive and its value must be either 1/255 or 1/2^n where n is between 0 and 15.
Anthony Barbier6ff3b192017-09-04 18:44:23 +010064 * @param[in] overflow_policy Overflow policy. Supported overflow policies: Wrap, Saturate
65 * @param[in] rounding_policy Rounding policy. Supported rounding modes: to zero, to nearest even.
Giorgio Arena8b2a7d32020-02-11 17:21:31 +000066 * @param[in] act_info (Optional) Activation layer information in case of a fused activation.
Anthony Barbier6ff3b192017-09-04 18:44:23 +010067 */
68 void configure(const ICLTensor *input1, const ICLTensor *input2, ICLTensor *output, float scale,
Giorgio Arena8b2a7d32020-02-11 17:21:31 +000069 ConvertPolicy overflow_policy, RoundingPolicy rounding_policy, const ActivationLayerInfo &act_info = ActivationLayerInfo());
Manuel Bottini4c6bd512020-04-08 10:15:51 +010070 /** Initialise the kernel's input, output and border mode.
71 *
72 * @param[in] compile_context The compile context to be used.
73 * @param[in] input1 An input tensor. Data types supported: U8/QASYMM8/QASYMM8_SIGNED/S16/QSYMM16/F16/F32.
74 * @param[in] input2 An input tensor. Data types supported: same as @p input1.
75 * @param[out] output The output tensor, Data types supported: same as @p input1. Note: U8 requires both inputs to be U8.
76 * @param[in] scale Scale to apply after multiplication.
77 * Scale must be positive and its value must be either 1/255 or 1/2^n where n is between 0 and 15.
78 * @param[in] overflow_policy Overflow policy. Supported overflow policies: Wrap, Saturate
79 * @param[in] rounding_policy Rounding policy. Supported rounding modes: to zero, to nearest even.
80 * @param[in] act_info (Optional) Activation layer information in case of a fused activation.
81 */
Manuel Bottini679fc962020-04-21 16:08:53 +010082 void configure(const CLCompileContext &compile_context, const ICLTensor *input1, const ICLTensor *input2, ICLTensor *output, float scale,
Manuel Bottini4c6bd512020-04-08 10:15:51 +010083 ConvertPolicy overflow_policy, RoundingPolicy rounding_policy, const ActivationLayerInfo &act_info = ActivationLayerInfo());
Georgios Pinitasf9d3a0a2017-11-03 19:01:44 +000084 /** Static function to check if given info will lead to a valid configuration of @ref CLPixelWiseMultiplicationKernel
85 *
Michele Di Giorgiocbbed282019-12-20 13:26:08 +000086 * @param[in] input1 An input tensor info. Data types supported: U8/QASYMM8/QASYMM8_SIGNED/S16/QSYMM16/F16/F32.
Georgios Pinitasf9d3a0a2017-11-03 19:01:44 +000087 * @param[in] input2 An input tensor info. Data types supported: same as @p input1.
Michele Di Giorgio7a0212a2020-04-14 16:08:32 +010088 * @param[in] output The output tensor info, Data types supported:
89 * - U8, only if both input are U8
90 * - QASYMM8, only if both inputs are QASYMM8
91 * - QASYMM8_SIGNED, only if both inputs are QASYMM8_SIGNED
92 * - S16
93 * - QSYMM16, only if both inputs are QSYMM16
94 * - S32, only if both inputs are QSYMM16
95 * - F16
96 * - F32
Georgios Pinitasf9d3a0a2017-11-03 19:01:44 +000097 * @param[in] scale Scale to apply after multiplication.
Vidhya Sudhan Loganathan7485d5a2018-07-04 09:34:00 +010098 * Scale must be positive and its value must be either 1/255 or 1/2^n where n is between 0 and 15.
Georgios Pinitasf9d3a0a2017-11-03 19:01:44 +000099 * @param[in] overflow_policy Overflow policy. Supported overflow policies: Wrap, Saturate
100 * @param[in] rounding_policy Rounding policy. Supported rounding modes: to zero, to nearest even.
Giorgio Arena8b2a7d32020-02-11 17:21:31 +0000101 * @param[in] act_info (Optional) Activation layer information in case of a fused activation.
Georgios Pinitasf9d3a0a2017-11-03 19:01:44 +0000102 *
Georgios Pinitas631c41a2017-12-06 11:53:03 +0000103 * @return a status
Georgios Pinitasf9d3a0a2017-11-03 19:01:44 +0000104 */
Georgios Pinitas631c41a2017-12-06 11:53:03 +0000105 static Status validate(const ITensorInfo *input1, const ITensorInfo *input2, const ITensorInfo *output, float scale,
Giorgio Arena8b2a7d32020-02-11 17:21:31 +0000106 ConvertPolicy overflow_policy, RoundingPolicy rounding_policy, const ActivationLayerInfo &act_info = ActivationLayerInfo());
Anthony Barbier6ff3b192017-09-04 18:44:23 +0100107
108 // Inherited methods overridden:
109 void run(const Window &window, cl::CommandQueue &queue) override;
Michele Di Giorgio6259e5f2018-01-17 17:29:33 +0000110 BorderSize border_size() const override;
Anthony Barbier6ff3b192017-09-04 18:44:23 +0100111
112private:
113 const ICLTensor *_input1;
114 const ICLTensor *_input2;
115 ICLTensor *_output;
116};
Georgios Pinitas8be91482019-03-26 17:23:28 +0000117
118/** Interface for the complex pixelwise multiplication kernel. */
119class CLComplexPixelWiseMultiplicationKernel : public ICLKernel
120{
121public:
122 /** Default constructor.*/
123 CLComplexPixelWiseMultiplicationKernel();
124 /** Prevent instances of this class from being copied (As this class contains pointers) */
125 CLComplexPixelWiseMultiplicationKernel(const CLComplexPixelWiseMultiplicationKernel &) = delete;
126 /** Prevent instances of this class from being copied (As this class contains pointers) */
127 CLComplexPixelWiseMultiplicationKernel &operator=(const CLComplexPixelWiseMultiplicationKernel &) = delete;
128 /** Allow instances of this class to be moved */
129 CLComplexPixelWiseMultiplicationKernel(CLComplexPixelWiseMultiplicationKernel &&) = default;
130 /** Allow instances of this class to be moved */
131 CLComplexPixelWiseMultiplicationKernel &operator=(CLComplexPixelWiseMultiplicationKernel &&) = default;
132 /** Initialise the kernel's input, output and border mode.
133 *
Giorgio Arena8b2a7d32020-02-11 17:21:31 +0000134 * @param[in] input1 An input tensor. Data types supported: F32. Number of channels supported: 2.
135 * @param[in] input2 An input tensor. Data types supported: same as @p input1. Number of channels supported: same as @p input1.
136 * @param[out] output The output tensor, Data types supported: same as @p input1. Number of channels supported: same as @p input1.
137 * @param[in] act_info (Optional) Activation layer information in case of a fused activation.
Georgios Pinitas8be91482019-03-26 17:23:28 +0000138 */
Giorgio Arena8b2a7d32020-02-11 17:21:31 +0000139 void configure(const ICLTensor *input1, const ICLTensor *input2, ICLTensor *output, const ActivationLayerInfo &act_info = ActivationLayerInfo());
Manuel Bottini4c6bd512020-04-08 10:15:51 +0100140 /** Initialise the kernel's input, output and border mode.
141 *
142 * @param[in] compile_context The compile context to be used.
143 * @param[in] input1 An input tensor. Data types supported: F32. Number of channels supported: 2.
144 * @param[in] input2 An input tensor. Data types supported: same as @p input1. Number of channels supported: same as @p input1.
145 * @param[out] output The output tensor, Data types supported: same as @p input1. Number of channels supported: same as @p input1.
146 * @param[in] act_info (Optional) Activation layer information in case of a fused activation.
147 */
Manuel Bottini679fc962020-04-21 16:08:53 +0100148 void configure(const CLCompileContext &compile_context, const ICLTensor *input1, const ICLTensor *input2, ICLTensor *output, const ActivationLayerInfo &act_info = ActivationLayerInfo());
Georgios Pinitas8be91482019-03-26 17:23:28 +0000149 /** Static function to check if given info will lead to a valid configuration of @ref CLComplexPixelWiseMultiplicationKernel
150 *
Giorgio Arena8b2a7d32020-02-11 17:21:31 +0000151 * @param[in] input1 An input tensor info. Data types supported: F32. Number of channels supported: 2.
152 * @param[in] input2 An input tensor info. Data types supported: same as @p input1. Number of channels supported: same as @p input1.
153 * @param[in] output The output tensor info. Data types supported: same as @p input1. Number of channels supported: same as @p input1.
154 * @param[in] act_info (Optional) Activation layer information in case of a fused activation.
Georgios Pinitas8be91482019-03-26 17:23:28 +0000155 *
156 * @return a status
157 */
Giorgio Arena8b2a7d32020-02-11 17:21:31 +0000158 static Status validate(const ITensorInfo *input1, const ITensorInfo *input2, const ITensorInfo *output, const ActivationLayerInfo &act_info = ActivationLayerInfo());
Georgios Pinitas8be91482019-03-26 17:23:28 +0000159
160 // Inherited methods overridden:
161 void run(const Window &window, cl::CommandQueue &queue) override;
162 BorderSize border_size() const override;
163
164private:
165 const ICLTensor *_input1;
166 const ICLTensor *_input2;
167 ICLTensor *_output;
168};
Gian Marco Iodicef670a0a2017-09-18 12:20:45 +0100169} // namespace arm_compute
Michalis Spyrouf4643372019-11-29 16:17:13 +0000170#endif /*ARM_COMPUTE_CLPIXELWISEMULTIPLICATIONKERNEL_H */