Blame - src/runtime/CL/functions/CLConvolutionLayer.cpp - ml/ComputeLibrary

blob: b295a274bd7aed9bfcb23b30f319ef93a3466c60 [file] [log] [blame]

Anthony Barbier	6ff3b19	2017-09-04 18:44:23 +0100	[diff] [blame]	1	/*
Gian Marco Iodice	ff1fe3e	2021-01-02 09:58:51 +0000	[diff] [blame]	2	* Copyright (c) 2017-2021 Arm Limited.
Anthony Barbier	6ff3b19	2017-09-04 18:44:23 +0100	[diff] [blame]	3	*
				4	* SPDX-License-Identifier: MIT
				5	*
				6	* Permission is hereby granted, free of charge, to any person obtaining a copy
				7	* of this software and associated documentation files (the "Software"), to
				8	* deal in the Software without restriction, including without limitation the
				9	* rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
				10	* sell copies of the Software, and to permit persons to whom the Software is
				11	* furnished to do so, subject to the following conditions:
				12	*
				13	* The above copyright notice and this permission notice shall be included in all
				14	* copies or substantial portions of the Software.
				15	*
				16	* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
				17	* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
				18	* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
				19	* AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
				20	* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
				21	* OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
				22	* SOFTWARE.
				23	*/
				24	#include "arm_compute/runtime/CL/functions/CLConvolutionLayer.h"
				25
Sheri Zhang	06d1efd	2021-07-28 11:20:04 +0100	[diff] [blame]	26	#include "arm_compute/core/CL/CLKernelLibrary.h"
				27	#include "arm_compute/core/CL/ICLTensor.h"
				28	#include "arm_compute/core/KernelDescriptors.h"
Georgios Pinitas	78c0090	2018-01-09 17:33:11 +0000	[diff] [blame]	29	#include "arm_compute/core/utils/misc/ShapeCalculator.h"
Sheri Zhang	06d1efd	2021-07-28 11:20:04 +0100	[diff] [blame]	30	#include "arm_compute/runtime/CL/functions/CLFFTConvolutionLayer.h"
				31	#include "src/core/CL/ICLKernel.h"
				32	#include "src/core/helpers/MemoryHelpers.h"
				33	#include "src/runtime/gpu/cl/operators/ClConv2d.h"
				34	#include "support/Cast.h"
Anthony Barbier	6ff3b19	2017-09-04 18:44:23 +0100	[diff] [blame]	35
Michele Di Giorgio	14cbfb2	2019-10-23 10:53:10 +0100	[diff] [blame]	36	namespace arm_compute
				37	{
Georgios Pinitas	78c0090	2018-01-09 17:33:11 +0000	[diff] [blame]	38	using namespace arm_compute::misc::shape_calculator;
Sheri Zhang	06d1efd	2021-07-28 11:20:04 +0100	[diff] [blame]	39	using namespace arm_compute::experimental;
				40	struct CLConvolutionLayer::Impl
				41	{
				42	MemoryGroup memory_group{};
				43	std::shared_ptr<IMemoryManager> memory_manager{};
				44	std::unique_ptr<opencl::IClOperator> op{ nullptr };
				45	ITensorPack run_pack{};
				46	ITensorPack prep_pack{};
				47	WorkspaceData<CLTensor> workspace{};
				48	experimental::MemoryRequirements aux_mem_req{};
				49	std::unique_ptr<IFunction> func{ nullptr };
				50	};
Anthony Barbier	6ff3b19	2017-09-04 18:44:23 +0100	[diff] [blame]	51
Georgios Pinitas	baf174e	2017-09-08 19:47:30 +0100	[diff] [blame]	52	CLConvolutionLayer::CLConvolutionLayer(std::shared_ptr<IMemoryManager> memory_manager)
Sheri Zhang	06d1efd	2021-07-28 11:20:04 +0100	[diff] [blame]	53	: _impl(std::make_unique<Impl>())
Anthony Barbier	6ff3b19	2017-09-04 18:44:23 +0100	[diff] [blame]	54	{
Sheri Zhang	06d1efd	2021-07-28 11:20:04 +0100	[diff] [blame]	55	_impl->memory_manager = std::move(memory_manager);
Anthony Barbier	6ff3b19	2017-09-04 18:44:23 +0100	[diff] [blame]	56	}
				57
Sang-Hoon Park	bef7fa2	2020-10-21 15:58:54 +0100	[diff] [blame]	58	CLConvolutionLayer::~CLConvolutionLayer() = default;
				59
Alex Gilday	7da29b6	2018-03-23 14:16:00 +0000	[diff] [blame]	60	void CLConvolutionLayer::configure(ICLTensor input, const ICLTensor weights, const ICLTensor biases, ICLTensor output, const PadStrideInfo &conv_info, const WeightsInfo &weights_info,
Gian Marco Iodice	916d1bc	2018-08-13 11:20:41 +0100	[diff] [blame]	61	const Size2D &dilation, const ActivationLayerInfo &act_info, bool enable_fast_math, unsigned int num_groups)
Chunosov	5124be5	2017-11-22 20:42:13 +0700	[diff] [blame]	62	{
Manuel Bottini	2b84be5	2020-04-08 10:15:51 +0100	[diff] [blame]	63	configure(CLKernelLibrary::get().get_compile_context(), input, weights, biases, output, conv_info, weights_info, dilation, act_info, enable_fast_math, num_groups);
				64	}
				65
				66	void CLConvolutionLayer::configure(const CLCompileContext &compile_context, ICLTensor input, const ICLTensor weights, const ICLTensor biases, ICLTensor output, const PadStrideInfo &conv_info,
				67	const WeightsInfo &weights_info,
				68	const Size2D &dilation, const ActivationLayerInfo &act_info, bool enable_fast_math, unsigned int num_groups)
				69	{
Isabella Gottardi	f07d28d	2018-02-06 14:52:43 +0000	[diff] [blame]	70	ARM_COMPUTE_ERROR_ON_NULLPTR(input, weights, output);
Gian Marco Iodice	2213d4b	2018-04-27 10:39:06 +0100	[diff] [blame]	71	ARM_COMPUTE_ERROR_THROW_ON(CLConvolutionLayer::validate(input->info(), weights->info(), ((biases != nullptr) ? biases->info() : nullptr), output->info(), conv_info, weights_info, dilation, act_info,
Gian Marco Iodice	916d1bc	2018-08-13 11:20:41 +0100	[diff] [blame]	72	enable_fast_math, num_groups));
Isabella Gottardi	f07d28d	2018-02-06 14:52:43 +0000	[diff] [blame]	73
Sheri Zhang	06d1efd	2021-07-28 11:20:04 +0100	[diff] [blame]	74	const Conv2dInfo conv2d_info = Conv2dInfo(conv_info, dilation, act_info, enable_fast_math, num_groups);
				75
				76	switch(opencl::ClConv2d::get_convolution_method(input->info(), weights->info(), output->info(), conv2d_info,
				77	weights_info, CLScheduler::get().target()))
Chunosov	5124be5	2017-11-22 20:42:13 +0700	[diff] [blame]	78	{
Gian Marco Iodice	e52a300	2018-04-11 15:59:10 +0100	[diff] [blame]	79	case ConvolutionMethod::WINOGRAD:
Isabella Gottardi	f07d28d	2018-02-06 14:52:43 +0000	[diff] [blame]	80	case ConvolutionMethod::DIRECT:
Isabella Gottardi	f07d28d	2018-02-06 14:52:43 +0000	[diff] [blame]	81	case ConvolutionMethod::GEMM:
Gian Marco	20d7848	2018-01-11 15:10:58 +0000	[diff] [blame]	82	{
Sheri Zhang	06d1efd	2021-07-28 11:20:04 +0100	[diff] [blame]	83	auto f = std::make_unique<opencl::ClConv2d>();
				84	f->configure(compile_context, input->info(), weights->info(), ((biases != nullptr) ? biases->info() : nullptr), output->info(), conv2d_info, weights_info);
				85	_impl->op = std::move(f);
Isabella Gottardi	f07d28d	2018-02-06 14:52:43 +0000	[diff] [blame]	86	break;
Gian Marco	20d7848	2018-01-11 15:10:58 +0000	[diff] [blame]	87	}
Vidhya Sudhan Loganathan	8ec0bb6	2019-04-23 10:40:44 +0100	[diff] [blame]	88	case ConvolutionMethod::FFT:
				89	{
Sheri Zhang	06d1efd	2021-07-28 11:20:04 +0100	[diff] [blame]	90	auto f = std::make_unique<CLFFTConvolutionLayer>(_impl->memory_manager);
Giorgio Arena	ea7de7b	2020-12-10 16:49:39 +0000	[diff] [blame]	91	f->configure(compile_context, input, weights, biases, output, conv_info, act_info, enable_fast_math);
Sheri Zhang	06d1efd	2021-07-28 11:20:04 +0100	[diff] [blame]	92	_impl->func = std::move(f);
Vidhya Sudhan Loganathan	8ec0bb6	2019-04-23 10:40:44 +0100	[diff] [blame]	93	break;
				94	}
Isabella Gottardi	f07d28d	2018-02-06 14:52:43 +0000	[diff] [blame]	95	default:
				96	ARM_COMPUTE_ERROR("Not supported.");
				97	break;
Chunosov	5124be5	2017-11-22 20:42:13 +0700	[diff] [blame]	98	}
Sheri Zhang	06d1efd	2021-07-28 11:20:04 +0100	[diff] [blame]	99
				100	if(_impl->op)
				101	{
				102	_impl->memory_group = MemoryGroup(std::move(_impl->memory_manager));
				103	_impl->aux_mem_req = _impl->op->workspace();
				104	_impl->run_pack = { { ACL_SRC_0, input }, { ACL_SRC_1, weights }, { ACL_SRC_2, biases }, { ACL_DST, output } };
				105	_impl->prep_pack = { { ACL_SRC_1, weights }, { ACL_SRC_2, biases } };
				106	_impl->workspace = manage_workspace<CLTensor>(_impl->aux_mem_req, _impl->memory_group, _impl->run_pack, _impl->prep_pack);
				107	}
Chunosov	5124be5	2017-11-22 20:42:13 +0700	[diff] [blame]	108	}
				109
Isabella Gottardi	f07d28d	2018-02-06 14:52:43 +0000	[diff] [blame]	110	Status CLConvolutionLayer::validate(const ITensorInfo input, const ITensorInfo weights, const ITensorInfo biases, const ITensorInfo output, const PadStrideInfo &conv_info,
Gian Marco Iodice	916d1bc	2018-08-13 11:20:41 +0100	[diff] [blame]	111	const WeightsInfo &weights_info, const Size2D &dilation, const ActivationLayerInfo &act_info, bool enable_fast_math, unsigned int num_groups)
Anthony Barbier	6ff3b19	2017-09-04 18:44:23 +0100	[diff] [blame]	112	{
Georgios Pinitas	78c0090	2018-01-09 17:33:11 +0000	[diff] [blame]	113	ARM_COMPUTE_RETURN_ERROR_ON_NULLPTR(input, weights, output);
Gian Marco Iodice	916d1bc	2018-08-13 11:20:41 +0100	[diff] [blame]	114	ARM_COMPUTE_RETURN_ERROR_ON_MSG((num_groups != 1) && (input->data_layout() != DataLayout::NCHW), "Grouping (num_groups != 1) with NHWC data layout is not supported");
Chunosov	5124be5	2017-11-22 20:42:13 +0700	[diff] [blame]	115
Sheri Zhang	06d1efd	2021-07-28 11:20:04 +0100	[diff] [blame]	116	const GPUTarget gpu_target = CLScheduler::get().target();
				117	const Conv2dInfo conv2d_info = Conv2dInfo(conv_info, dilation, act_info, enable_fast_math, num_groups);
Anthony Barbier	6ff3b19	2017-09-04 18:44:23 +0100	[diff] [blame]	118
Sheri Zhang	06d1efd	2021-07-28 11:20:04 +0100	[diff] [blame]	119	switch(opencl::ClConv2d::get_convolution_method(input, weights, output, conv2d_info, weights_info, gpu_target))
Anthony Barbier	6ff3b19	2017-09-04 18:44:23 +0100	[diff] [blame]	120	{
Gian Marco Iodice	e52a300	2018-04-11 15:59:10 +0100	[diff] [blame]	121	case ConvolutionMethod::WINOGRAD:
Isabella Gottardi	f07d28d	2018-02-06 14:52:43 +0000	[diff] [blame]	122	case ConvolutionMethod::DIRECT:
Isabella Gottardi	f07d28d	2018-02-06 14:52:43 +0000	[diff] [blame]	123	case ConvolutionMethod::GEMM:
Chunosov	5124be5	2017-11-22 20:42:13 +0700	[diff] [blame]	124	{
Sheri Zhang	06d1efd	2021-07-28 11:20:04 +0100	[diff] [blame]	125	ARM_COMPUTE_RETURN_ON_ERROR(opencl::ClConv2d::validate(input, weights, biases, output, conv2d_info, weights_info));
Isabella Gottardi	f07d28d	2018-02-06 14:52:43 +0000	[diff] [blame]	126	break;
Chunosov	5124be5	2017-11-22 20:42:13 +0700	[diff] [blame]	127	}
Vidhya Sudhan Loganathan	8ec0bb6	2019-04-23 10:40:44 +0100	[diff] [blame]	128	case ConvolutionMethod::FFT:
				129	{
				130	// Validate FFT-based convolution layer
Giorgio Arena	ea7de7b	2020-12-10 16:49:39 +0000	[diff] [blame]	131	ARM_COMPUTE_RETURN_ON_ERROR(CLFFTConvolutionLayer::validate(input, weights, nullptr, output, conv_info, act_info, enable_fast_math));
Vidhya Sudhan Loganathan	8ec0bb6	2019-04-23 10:40:44 +0100	[diff] [blame]	132	break;
				133	}
Isabella Gottardi	f07d28d	2018-02-06 14:52:43 +0000	[diff] [blame]	134	default:
				135	ARM_COMPUTE_ERROR("Not supported.");
				136	break;
Anthony Barbier	6ff3b19	2017-09-04 18:44:23 +0100	[diff] [blame]	137	}
				138
Isabella Gottardi	f07d28d	2018-02-06 14:52:43 +0000	[diff] [blame]	139	return Status{};
				140	}
Gian Marco Iodice	368da83	2017-07-03 12:33:49 +0100	[diff] [blame]	141
Gian Marco Iodice	e52a300	2018-04-11 15:59:10 +0100	[diff] [blame]	142	ConvolutionMethod CLConvolutionLayer::get_convolution_method(const ITensorInfo input, const ITensorInfo weights, const ITensorInfo *output, const PadStrideInfo &conv_info,
Gian Marco Iodice	2213d4b	2018-04-27 10:39:06 +0100	[diff] [blame]	143	const WeightsInfo &weights_info, const ActivationLayerInfo &act_info, const GPUTarget gpu_target, const Size2D &dilation, bool enable_fast_math)
Isabella Gottardi	f07d28d	2018-02-06 14:52:43 +0000	[diff] [blame]	144	{
Sheri Zhang	06d1efd	2021-07-28 11:20:04 +0100	[diff] [blame]	145	const Conv2dInfo conv2d_info = Conv2dInfo(conv_info, dilation, act_info, enable_fast_math, 1);
				146	return opencl::ClConv2d::get_convolution_method(input, weights, output, conv2d_info, weights_info, gpu_target);
Anthony Barbier	6ff3b19	2017-09-04 18:44:23 +0100	[diff] [blame]	147	}
				148
				149	void CLConvolutionLayer::run()
				150	{
Georgios Pinitas	e043767	2018-05-02 14:07:55 +0100	[diff] [blame]	151	prepare();
Sheri Zhang	06d1efd	2021-07-28 11:20:04 +0100	[diff] [blame]	152
				153	MemoryGroupResourceScope scope_mg(_impl->memory_group);
				154
				155	if(_impl->func)
				156	{
				157	_impl->func->run();
				158	}
				159	else
				160	{
				161	_impl->op->run(_impl->run_pack);
				162	}
Anthony Barbier	6ff3b19	2017-09-04 18:44:23 +0100	[diff] [blame]	163	}
Georgios Pinitas	e043767	2018-05-02 14:07:55 +0100	[diff] [blame]	164
				165	void CLConvolutionLayer::prepare()
				166	{
Sheri Zhang	06d1efd	2021-07-28 11:20:04 +0100	[diff] [blame]	167	if(_impl->func)
				168	{
				169	_impl->func->prepare();
				170	}
				171	else
				172	{
				173	_impl->op->prepare(_impl->prep_pack);
				174
				175	// Release temporary tensors that are only used in prepare stage
				176	release_temporaries(_impl->aux_mem_req, _impl->workspace);
				177	}
Georgios Pinitas	e043767	2018-05-02 14:07:55 +0100	[diff] [blame]	178	}
Sheri Zhang	06d1efd	2021-07-28 11:20:04 +0100	[diff] [blame]	179	} // namespace arm_compute