Blame - arm_compute/core/CL/kernels/CLDepthwiseConvolutionLayer3x3NCHWKernel.h - ml/ComputeLibrary

blob: b1c730d9a7204dd4f7aa8ba5a901b9d713456ef9 [file] [log] [blame]

Giorgio Arena	93a690e	2017-08-01 16:09:33 +0100	[diff] [blame]	1	/*
Giorgio Arena	dfca60b	2018-01-31 10:30:59 +0000	[diff] [blame]	2	* Copyright (c) 2018 ARM Limited.
Giorgio Arena	93a690e	2017-08-01 16:09:33 +0100	[diff] [blame]	3	*
				4	* SPDX-License-Identifier: MIT
				5	*
				6	* Permission is hereby granted, free of charge, to any person obtaining a copy
				7	* of this software and associated documentation files (the "Software"), to
				8	* deal in the Software without restriction, including without limitation the
				9	* rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
				10	* sell copies of the Software, and to permit persons to whom the Software is
				11	* furnished to do so, subject to the following conditions:
				12	*
				13	* The above copyright notice and this permission notice shall be included in all
				14	* copies or substantial portions of the Software.
				15	*
				16	* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
				17	* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
				18	* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
				19	* AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
				20	* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
				21	* OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
				22	* SOFTWARE.
				23	*/
Giorgio Arena	dfca60b	2018-01-31 10:30:59 +0000	[diff] [blame]	24	#ifndef __ARM_COMPUTE_CLDEPTHWISECONVOLUTIONNCHWKERNEL3x3_H__
				25	#define __ARM_COMPUTE_CLDEPTHWISECONVOLUTIONNCHWKERNEL3x3_H__
Giorgio Arena	93a690e	2017-08-01 16:09:33 +0100	[diff] [blame]	26
Giorgio Arena	dfca60b	2018-01-31 10:30:59 +0000	[diff] [blame]	27	#include "arm_compute/core/CL/kernels/ICLDepthwiseConvolutionLayer3x3Kernel.h"
Giorgio Arena	93a690e	2017-08-01 16:09:33 +0100	[diff] [blame]	28
				29	namespace arm_compute
				30	{
				31	class ICLTensor;
				32
Giorgio Arena	dfca60b	2018-01-31 10:30:59 +0000	[diff] [blame]	33	/** Interface for the kernel to run a 3x3 depthwise convolution on a tensor when the data layout is NCHW.
Giorgio Arena	93a690e	2017-08-01 16:09:33 +0100	[diff] [blame]	34	*/
Giorgio Arena	dfca60b	2018-01-31 10:30:59 +0000	[diff] [blame]	35	class CLDepthwiseConvolutionLayer3x3NCHWKernel : public ICLDepthwiseConvolutionLayer3x3Kernel
Giorgio Arena	93a690e	2017-08-01 16:09:33 +0100	[diff] [blame]	36	{
				37	public:
				38	/** Default constructor */
Giorgio Arena	dfca60b	2018-01-31 10:30:59 +0000	[diff] [blame]	39	CLDepthwiseConvolutionLayer3x3NCHWKernel();
Giorgio Arena	93a690e	2017-08-01 16:09:33 +0100	[diff] [blame]	40	/** Initialize the function's source, destination, conv and border_size.
				41	*
Giorgio Arena	7657224	2018-04-04 17:44:26 +0100	[diff] [blame]	42	* @param[in] input Source tensor. DataType supported: QASYMM8/F16/F32.
				43	* @param[in] weights Weights tensor. A 3D tensor with dimensions [3, 3, IFM]. Data type supported: Same as @p input.
				44	* @param[in] biases (Optional) Biases tensor. A 1D tensor with dimensions [IFM]. Must be nullptr if not needed.
				45	* Data type supported: Same as @p input.
				46	* @param[out] output Destination tensor. Data type supported: Same as @p input.
				47	* @param[in] conv_info Padding and stride information to use for the convolution.
				48	* @param[in] depth_multiplier (Optional) Multiplier to apply to the input's depth in order to retrieve the output's depth. Defaults to 1.
				49	* @param[in] act_info (Optional) Activation layer information in case of a fused activation. Only RELU, BOUNDED_RELU and LU_BOUNDED_RELU for QASYMM8 supported.
Giorgio Arena	93a690e	2017-08-01 16:09:33 +0100	[diff] [blame]	50	*/
Giorgio Arena	7657224	2018-04-04 17:44:26 +0100	[diff] [blame]	51	void configure(const ICLTensor *input, const ICLTensor *weights, const ICLTensor *biases, ICLTensor *output, const PadStrideInfo &conv_info, unsigned int depth_multiplier,
Giorgio Arena	dfca60b	2018-01-31 10:30:59 +0000	[diff] [blame]	52	ActivationLayerInfo act_info) override;
Giorgio Arena	ad0c738	2018-04-23 16:16:21 +0100	[diff] [blame]	53	/** Static function to check if given info will lead to a valid configuration of @ref CLDepthwiseConvolutionLayer3x3NCHWKernel
				54	*
				55	* @param[in] input Source tensor info. DataType supported: F16/F32/QASYMM8.
				56	* @param[in] weights Weights tensor info. A 3D tensor with dimensions [3, 3, IFM]. Data type supported: Same as @p input.
				57	* @param[in] biases Biases tensor info. A 1D tensor with dimensions [IFM]. Must be nullptr if not needed.
				58	* Data type supported: Same as @p input.
				59	* @param[in] output Destination tensor info. Data type supported: Same as @p input.
				60	* @param[in] conv_info Padding and stride information to use for the convolution.
				61	* @param[in] depth_multiplier Multiplier to apply to the input's depth in order to retrieve the output's depth.
				62	* @param[in] act_info (Optional) Activation layer information in case of a fused activation. Only RELU, BOUNDED_RELU and LU_BOUNDED_RELU are supported.
				63	* @param[in] gpu_target (Optional) GPU target to validate the kernel for. Defaults to midgard.
				64	*
				65	* @return a status
				66	*/
				67	static Status validate(const ITensorInfo *input, const ITensorInfo *weights, const ITensorInfo *biases, const ITensorInfo *output, const PadStrideInfo &conv_info, unsigned int depth_multiplier,
				68	ActivationLayerInfo act_info = ActivationLayerInfo(), GPUTarget gpu_target = GPUTarget::MIDGARD);
Giorgio Arena	93a690e	2017-08-01 16:09:33 +0100	[diff] [blame]	69
Giorgio Arena	93a690e	2017-08-01 16:09:33 +0100	[diff] [blame]	70	void run(const Window &window, cl::CommandQueue &queue) override;
				71	BorderSize border_size() const override;
				72
				73	private:
Giorgio Arena	dfca60b	2018-01-31 10:30:59 +0000	[diff] [blame]	74	unsigned int _conv_stride_x;
				75	unsigned int _conv_pad_top;
Giorgio Arena	fa23f11	2018-06-19 11:27:38 +0100	[diff] [blame]	76	unsigned int _conv_pad_left;
Giorgio Arena	93a690e	2017-08-01 16:09:33 +0100	[diff] [blame]	77	};
Gian Marco Iodice	f670a0a	2017-09-18 12:20:45 +0100	[diff] [blame]	78	} // namespace arm_compute
Giorgio Arena	dfca60b	2018-01-31 10:30:59 +0000	[diff] [blame]	79	#endif /*__ARM_COMPUTE_CLDEPTHWISECONVOLUTIONNCHWKERNEL3x3_H__ */