/*
 * Copyright (c) 2016-2018 ARM Limited.
 *
 * SPDX-License-Identifier: MIT
 *
 * Permission is hereby granted, free of charge, to any person obtaining a copy
 * of this software and associated documentation files (the "Software"), to
 * deal in the Software without restriction, including without limitation the
 * rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
 * sell copies of the Software, and to permit persons to whom the Software is
 * furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in all
 * copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
 * SOFTWARE.
 */
24#ifndef __ARM_COMPUTE_CLPIXELWISEMULTIPLICATIONKERNEL_H__
25#define __ARM_COMPUTE_CLPIXELWISEMULTIPLICATIONKERNEL_H__
26
27#include "arm_compute/core/CL/ICLKernel.h"
28#include "arm_compute/core/Types.h"
29
30namespace arm_compute
31{
32class ICLTensor;
33
34/** Interface for the pixelwise multiplication kernel.
35 *
36 */
37class CLPixelWiseMultiplicationKernel : public ICLKernel
38{
39public:
40 /** Default constructor.*/
41 CLPixelWiseMultiplicationKernel();
Alex Gildayc357c472018-03-21 13:54:09 +000042 /** Prevent instances of this class from being copied (As this class contains pointers) */
Anthony Barbier6ff3b192017-09-04 18:44:23 +010043 CLPixelWiseMultiplicationKernel(const CLPixelWiseMultiplicationKernel &) = delete;
Alex Gildayc357c472018-03-21 13:54:09 +000044 /** Prevent instances of this class from being copied (As this class contains pointers) */
Anthony Barbier6ff3b192017-09-04 18:44:23 +010045 CLPixelWiseMultiplicationKernel &operator=(const CLPixelWiseMultiplicationKernel &) = delete;
46 /** Allow instances of this class to be moved */
47 CLPixelWiseMultiplicationKernel(CLPixelWiseMultiplicationKernel &&) = default;
48 /** Allow instances of this class to be moved */
49 CLPixelWiseMultiplicationKernel &operator=(CLPixelWiseMultiplicationKernel &&) = default;
50 /** Initialise the kernel's input, output and border mode.
51 *
Vidhya Sudhan Loganathan7485d5a2018-07-04 09:34:00 +010052 * @param[in] input1 An input tensor. Data types supported: U8/S16/F16/F32.
Michele Di Giorgioab0a77e2017-06-21 15:36:24 +010053 * @param[in] input2 An input tensor. Data types supported: same as @p input1.
Vidhya Sudhan Loganathan7485d5a2018-07-04 09:34:00 +010054 * @param[out] output The output tensor, Data types supported: same as @p input1. Note: U8 requires both inputs to be U8.
Anthony Barbier6ff3b192017-09-04 18:44:23 +010055 * @param[in] scale Scale to apply after multiplication.
Vidhya Sudhan Loganathan7485d5a2018-07-04 09:34:00 +010056 * Scale must be positive and its value must be either 1/255 or 1/2^n where n is between 0 and 15.
Anthony Barbier6ff3b192017-09-04 18:44:23 +010057 * @param[in] overflow_policy Overflow policy. Supported overflow policies: Wrap, Saturate
58 * @param[in] rounding_policy Rounding policy. Supported rounding modes: to zero, to nearest even.
59 */
60 void configure(const ICLTensor *input1, const ICLTensor *input2, ICLTensor *output, float scale,
61 ConvertPolicy overflow_policy, RoundingPolicy rounding_policy);
Georgios Pinitasf9d3a0a2017-11-03 19:01:44 +000062 /** Static function to check if given info will lead to a valid configuration of @ref CLPixelWiseMultiplicationKernel
63 *
Vidhya Sudhan Loganathan7485d5a2018-07-04 09:34:00 +010064 * @param[in] input1 An input tensor info. Data types supported: U8/S16/F16/F32.
Georgios Pinitasf9d3a0a2017-11-03 19:01:44 +000065 * @param[in] input2 An input tensor info. Data types supported: same as @p input1.
Vidhya Sudhan Loganathan7485d5a2018-07-04 09:34:00 +010066 * @param[in] output The output tensor info, Data types supported: same as @p input1. Note: U8 requires both inputs to be U8.
Georgios Pinitasf9d3a0a2017-11-03 19:01:44 +000067 * @param[in] scale Scale to apply after multiplication.
Vidhya Sudhan Loganathan7485d5a2018-07-04 09:34:00 +010068 * Scale must be positive and its value must be either 1/255 or 1/2^n where n is between 0 and 15.
Georgios Pinitasf9d3a0a2017-11-03 19:01:44 +000069 * @param[in] overflow_policy Overflow policy. Supported overflow policies: Wrap, Saturate
70 * @param[in] rounding_policy Rounding policy. Supported rounding modes: to zero, to nearest even.
71 *
Georgios Pinitas631c41a2017-12-06 11:53:03 +000072 * @return a status
Georgios Pinitasf9d3a0a2017-11-03 19:01:44 +000073 */
Georgios Pinitas631c41a2017-12-06 11:53:03 +000074 static Status validate(const ITensorInfo *input1, const ITensorInfo *input2, const ITensorInfo *output, float scale,
75 ConvertPolicy overflow_policy, RoundingPolicy rounding_policy);
Anthony Barbier6ff3b192017-09-04 18:44:23 +010076
77 // Inherited methods overridden:
78 void run(const Window &window, cl::CommandQueue &queue) override;
Michele Di Giorgio6259e5f2018-01-17 17:29:33 +000079 BorderSize border_size() const override;
Anthony Barbier6ff3b192017-09-04 18:44:23 +010080
81private:
82 const ICLTensor *_input1;
83 const ICLTensor *_input2;
84 ICLTensor *_output;
85};
Gian Marco Iodicef670a0a2017-09-18 12:20:45 +010086} // namespace arm_compute
Anthony Barbier6ff3b192017-09-04 18:44:23 +010087#endif /*__ARM_COMPUTE_CLPIXELWISEMULTIPLICATIONKERNEL_H__ */