Blame - arm_compute/core/Helpers.h - ml/ComputeLibrary

blob: 8f4220fb809cbee344af506abd2248aacdb07cad [file] [log] [blame]

Anthony Barbier	6ff3b19	2017-09-04 18:44:23 +0100	[diff] [blame]	1	/*
Diego Lopez Recas	35ceeb2	2017-12-04 18:56:10 +0000	[diff] [blame]	2	* Copyright (c) 2016-2018 ARM Limited.
Anthony Barbier	6ff3b19	2017-09-04 18:44:23 +0100	[diff] [blame]	3	*
				4	* SPDX-License-Identifier: MIT
				5	*
				6	* Permission is hereby granted, free of charge, to any person obtaining a copy
				7	* of this software and associated documentation files (the "Software"), to
				8	* deal in the Software without restriction, including without limitation the
				9	* rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
				10	* sell copies of the Software, and to permit persons to whom the Software is
				11	* furnished to do so, subject to the following conditions:
				12	*
				13	* The above copyright notice and this permission notice shall be included in all
				14	* copies or substantial portions of the Software.
				15	*
				16	* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
				17	* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
				18	* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
				19	* AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
				20	* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
				21	* OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
				22	* SOFTWARE.
				23	*/
				24	#ifndef __ARM_COMPUTE_HELPERS_H__
				25	#define __ARM_COMPUTE_HELPERS_H__
				26
Anthony Barbier	6ff3b19	2017-09-04 18:44:23 +0100	[diff] [blame]	27	#include "arm_compute/core/Coordinates.h"
Georgios Pinitas	583137c	2017-08-31 18:12:42 +0100	[diff] [blame]	28	#include "arm_compute/core/Error.h"
Anthony Barbier	6ff3b19	2017-09-04 18:44:23 +0100	[diff] [blame]	29	#include "arm_compute/core/IAccessWindow.h"
				30	#include "arm_compute/core/Steps.h"
				31	#include "arm_compute/core/Strides.h"
				32	#include "arm_compute/core/TensorShape.h"
				33	#include "arm_compute/core/Types.h"
				34	#include "arm_compute/core/Window.h"
Georgios Pinitas	583137c	2017-08-31 18:12:42 +0100	[diff] [blame]	35
Anthony Barbier	6ff3b19	2017-09-04 18:44:23 +0100	[diff] [blame]	36	#include <array>
				37	#include <cstddef>
				38	#include <cstdint>
				39	#include <memory>
				40	#include <tuple>
				41	#include <type_traits>
				42	#include <utility>
				43
				44	namespace arm_compute
				45	{
				46	class IKernel;
				47	class ITensor;
				48	class ITensorInfo;
				49
Alex Gilday	c357c47	2018-03-21 13:54:09 +0000	[diff] [blame]	50	/** Disable bitwise operations by default */
Anthony Barbier	6ff3b19	2017-09-04 18:44:23 +0100	[diff] [blame]	51	template <typename T>
				52	struct enable_bitwise_ops
				53	{
Alex Gilday	c357c47	2018-03-21 13:54:09 +0000	[diff] [blame]	54	static constexpr bool value = false; /*< Disabled /
Anthony Barbier	6ff3b19	2017-09-04 18:44:23 +0100	[diff] [blame]	55	};
				56
Alex Gilday	c357c47	2018-03-21 13:54:09 +0000	[diff] [blame]	57	#ifndef DOXYGEN_SKIP_THIS
Anthony Barbier	6ff3b19	2017-09-04 18:44:23 +0100	[diff] [blame]	58	template <typename T>
				59	typename std::enable_if<enable_bitwise_ops<T>::value, T>::type operator&(T lhs, T rhs)
				60	{
				61	using underlying_type = typename std::underlying_type<T>::type;
				62	return static_cast<T>(static_cast<underlying_type>(lhs) & static_cast<underlying_type>(rhs));
				63	}
Alex Gilday	c357c47	2018-03-21 13:54:09 +0000	[diff] [blame]	64	#endif /* DOXYGEN_SKIP_THIS */
Anthony Barbier	6ff3b19	2017-09-04 18:44:23 +0100	[diff] [blame]	65
Michele Di Giorgio	b8fc60f	2018-04-25 11:58:07 +0100	[diff] [blame]	66	/** Helper function to create and return a unique_ptr pointed to a CL/GLES kernel object
				67	* It also calls the kernel's configuration.
				68	*
				69	* @param[in] args All the arguments that need pass to kernel's configuration.
				70	*
				71	* @return A unique pointer pointed to a CL/GLES kernel object
				72	*/
				73	template <typename Kernel, typename... T>
				74	std::unique_ptr<Kernel> create_configure_kernel(T &&... args)
				75	{
				76	std::unique_ptr<Kernel> k = arm_compute::support::cpp14::make_unique<Kernel>();
				77	k->configure(std::forward<T>(args)...);
				78	return k;
				79	}
				80
				81	/** Helper function to create and return a unique_ptr pointed to a CL/GLES kernel object
				82	*
				83	* @return A unique pointer pointed to a Kernel kernel object
				84	*/
				85	template <typename Kernel>
				86	std::unique_ptr<Kernel> create_kernel()
				87	{
				88	std::unique_ptr<Kernel> k = arm_compute::support::cpp14::make_unique<Kernel>();
				89	return k;
				90	}
				91
Anthony Barbier	6ff3b19	2017-09-04 18:44:23 +0100	[diff] [blame]	92	namespace traits
				93	{
				94	/** Check if a type T is contained in a tuple Tuple of types */
				95	template <typename T, typename Tuple>
				96	struct is_contained;
				97
				98	template <typename T>
				99	struct is_contained<T, std::tuple<>> : std::false_type
				100	{
				101	};
				102
				103	template <typename T, typename... Ts>
				104	struct is_contained<T, std::tuple<T, Ts...>> : std::true_type
				105	{
				106	};
				107
				108	template <typename T, typename U, typename... Ts>
				109	struct is_contained<T, std::tuple<U, Ts...>> : is_contained<T, std::tuple<Ts...>>
				110	{
				111	};
				112	}
				113
				114	/** Computes bilinear interpolation using the pointer to the top-left pixel and the pixel's distance between
Georgios Pinitas	583137c	2017-08-31 18:12:42 +0100	[diff] [blame]	115	* the real coordinates and the smallest following integer coordinates. Input must be in single channel format.
Anthony Barbier	6ff3b19	2017-09-04 18:44:23 +0100	[diff] [blame]	116	*
Georgios Pinitas	583137c	2017-08-31 18:12:42 +0100	[diff] [blame]	117	* @param[in] pixel_ptr Pointer to the top-left pixel value of a single channel input.
Anthony Barbier	6ff3b19	2017-09-04 18:44:23 +0100	[diff] [blame]	118	* @param[in] stride Stride to access the bottom-left and bottom-right pixel values
				119	* @param[in] dx Pixel's distance between the X real coordinate and the smallest X following integer
				120	* @param[in] dy Pixel's distance between the Y real coordinate and the smallest Y following integer
				121	*
				122	* @note dx and dy must be in the range [0, 1.0]
				123	*
				124	* @return The bilinear interpolated pixel value
				125	*/
Georgios Pinitas	583137c	2017-08-31 18:12:42 +0100	[diff] [blame]	126	template <typename T>
				127	inline T delta_bilinear_c1(const T *pixel_ptr, size_t stride, float dx, float dy)
				128	{
				129	ARM_COMPUTE_ERROR_ON(pixel_ptr == nullptr);
Anthony Barbier	6ff3b19	2017-09-04 18:44:23 +0100	[diff] [blame]	130
Georgios Pinitas	583137c	2017-08-31 18:12:42 +0100	[diff] [blame]	131	const float dx1 = 1.0f - dx;
				132	const float dy1 = 1.0f - dy;
				133
				134	const T a00 = *pixel_ptr;
				135	const T a01 = *(pixel_ptr + 1);
				136	const T a10 = *(pixel_ptr + stride);
				137	const T a11 = *(pixel_ptr + stride + 1);
				138
				139	const float w1 = dx1 * dy1;
				140	const float w2 = dx * dy1;
				141	const float w3 = dx1 * dy;
				142	const float w4 = dx * dy;
				143
				144	return static_cast<T>(a00 * w1 + a01 * w2 + a10 * w3 + a11 * w4);
				145	}
				146
Anthony Barbier	9a33b54	2017-12-12 22:08:59 +0000	[diff] [blame]	147	/** Computes linear interpolation using the pointer to the top pixel and the pixel's distance between
				148	* the real coordinates and the smallest following integer coordinates. Input must be in single channel format.
				149	*
				150	* @param[in] pixel_ptr Pointer to the top pixel value of a single channel input.
				151	* @param[in] stride Stride to access the bottom pixel value
				152	* @param[in] dy Pixel's distance between the Y real coordinate and the smallest Y following integer
				153	*
				154	* @note dy must be in the range [0, 1.0]
				155	*
				156	* @return The linear interpolated pixel value
				157	*/
				158	template <typename T>
				159	inline T delta_linear_c1_y(const T *pixel_ptr, size_t stride, float dy)
				160	{
				161	ARM_COMPUTE_ERROR_ON(pixel_ptr == nullptr);
				162
				163	const float dy1 = 1.0f - dy;
				164
				165	const T a00 = *pixel_ptr;
				166	const T a10 = *(pixel_ptr + stride);
				167
				168	const float w1 = dy1;
				169	const float w3 = dy;
				170
				171	return static_cast<T>(a00 * w1 + a10 * w3);
				172	}
				173	/** Computes linear interpolation using the pointer to the left pixel and the pixel's distance between
				174	* the real coordinates and the smallest following integer coordinates. Input must be in single channel format.
				175	*
				176	* @param[in] pixel_ptr Pointer to the left pixel value of a single channel input.
				177	* @param[in] dx Pixel's distance between the X real coordinate and the smallest X following integer
				178	*
				179	* @note dx must be in the range [0, 1.0]
				180	*
				181	* @return The linear interpolated pixel value
				182	*/
				183	template <typename T>
				184	inline T delta_linear_c1_x(const T *pixel_ptr, float dx)
				185	{
				186	ARM_COMPUTE_ERROR_ON(pixel_ptr == nullptr);
				187
				188	const T a00 = *pixel_ptr;
				189	const T a01 = *(pixel_ptr + 1);
				190
				191	const float dx1 = 1.0f - dx;
				192
				193	const float w1 = dx1;
				194	const float w2 = dx;
				195
				196	return static_cast<T>(a00 * w1 + a01 * w2);
				197	}
Georgios Pinitas	583137c	2017-08-31 18:12:42 +0100	[diff] [blame]	198	/** Return the pixel at (x,y) using bilinear interpolation.
Anthony Barbier	6ff3b19	2017-09-04 18:44:23 +0100	[diff] [blame]	199	*
				200	* @warning Only works if the iterator was created with an IImage
				201	*
Georgios Pinitas	583137c	2017-08-31 18:12:42 +0100	[diff] [blame]	202	* @param[in] first_pixel_ptr Pointer to the first pixel of a single channel input.
Anthony Barbier	6ff3b19	2017-09-04 18:44:23 +0100	[diff] [blame]	203	* @param[in] stride Stride in bytes of the image;
				204	* @param[in] x X position of the wanted pixel
				205	* @param[in] y Y position of the wanted pixel
				206	*
				207	* @return The pixel at (x, y) using bilinear interpolation.
				208	*/
Georgios Pinitas	583137c	2017-08-31 18:12:42 +0100	[diff] [blame]	209	template <typename T>
				210	inline T pixel_bilinear_c1(const T *first_pixel_ptr, size_t stride, float x, float y)
				211	{
				212	ARM_COMPUTE_ERROR_ON(first_pixel_ptr == nullptr);
Anthony Barbier	6ff3b19	2017-09-04 18:44:23 +0100	[diff] [blame]	213
Georgios Pinitas	583137c	2017-08-31 18:12:42 +0100	[diff] [blame]	214	const int32_t xi = std::floor(x);
				215	const int32_t yi = std::floor(y);
				216
				217	const float dx = x - xi;
				218	const float dy = y - yi;
				219
				220	return delta_bilinear_c1(first_pixel_ptr + xi + yi * stride, stride, dx, dy);
				221	}
				222
				223	/** Return the pixel at (x,y) using bilinear interpolation by clamping when out of borders. The image must be single channel input
Anthony Barbier	6ff3b19	2017-09-04 18:44:23 +0100	[diff] [blame]	224	*
				225	* @warning Only works if the iterator was created with an IImage
				226	*
Georgios Pinitas	583137c	2017-08-31 18:12:42 +0100	[diff] [blame]	227	* @param[in] first_pixel_ptr Pointer to the first pixel of a single channel image.
Anthony Barbier	6ff3b19	2017-09-04 18:44:23 +0100	[diff] [blame]	228	* @param[in] stride Stride in bytes of the image
				229	* @param[in] width Width of the image
				230	* @param[in] height Height of the image
				231	* @param[in] x X position of the wanted pixel
				232	* @param[in] y Y position of the wanted pixel
				233	*
				234	* @return The pixel at (x, y) using bilinear interpolation.
				235	*/
Georgios Pinitas	583137c	2017-08-31 18:12:42 +0100	[diff] [blame]	236	template <typename T>
				237	inline uint8_t pixel_bilinear_c1_clamp(const T *first_pixel_ptr, size_t stride, size_t width, size_t height, float x, float y)
				238	{
				239	ARM_COMPUTE_ERROR_ON(first_pixel_ptr == nullptr);
				240
				241	x = std::max(-1.f, std::min(x, static_cast<float>(width)));
				242	y = std::max(-1.f, std::min(y, static_cast<float>(height)));
				243
				244	const float xi = std::floor(x);
				245	const float yi = std::floor(y);
				246
				247	const float dx = x - xi;
				248	const float dy = y - yi;
				249
Anthony Barbier	9a33b54	2017-12-12 22:08:59 +0000	[diff] [blame]	250	if(dx == 0.0f)
				251	{
				252	if(dy == 0.0f)
				253	{
				254	return static_cast<T>(first_pixel_ptr[static_cast<int32_t>(xi) + static_cast<int32_t>(yi) * stride]);
				255	}
				256	return delta_linear_c1_y(first_pixel_ptr + static_cast<int32_t>(xi) + static_cast<int32_t>(yi) * stride, stride, dy);
				257	}
				258	if(dy == 0.0f)
				259	{
				260	return delta_linear_c1_x(first_pixel_ptr + static_cast<int32_t>(xi) + static_cast<int32_t>(yi) * stride, dx);
				261	}
Georgios Pinitas	583137c	2017-08-31 18:12:42 +0100	[diff] [blame]	262	return delta_bilinear_c1(first_pixel_ptr + static_cast<int32_t>(xi) + static_cast<int32_t>(yi) * stride, stride, dx, dy);
				263	}
Anthony Barbier	6ff3b19	2017-09-04 18:44:23 +0100	[diff] [blame]	264
				265	/** Return the pixel at (x,y) using area interpolation by clamping when out of borders. The image must be single channel U8
				266	*
				267	* @note The interpolation area depends on the width and height ration of the input and output images
				268	* @note Currently average of the contributing pixels is calculated
				269	*
				270	* @param[in] first_pixel_ptr Pointer to the first pixel of a single channel U8 image.
				271	* @param[in] stride Stride in bytes of the image
				272	* @param[in] width Width of the image
				273	* @param[in] height Height of the image
				274	* @param[in] wr Width ratio among the input image width and output image width.
				275	* @param[in] hr Height ratio among the input image height and output image height.
				276	* @param[in] x X position of the wanted pixel
				277	* @param[in] y Y position of the wanted pixel
				278	*
				279	* @return The pixel at (x, y) using area interpolation.
				280	*/
				281	inline uint8_t pixel_area_c1u8_clamp(const uint8_t *first_pixel_ptr, size_t stride, size_t width, size_t height, float wr, float hr, int x, int y);
				282
Anthony Barbier	6ff3b19	2017-09-04 18:44:23 +0100	[diff] [blame]	283	/** Iterator updated by @ref execute_window_loop for each window element */
				284	class Iterator
				285	{
				286	public:
				287	/** Default constructor to create an empty iterator */
				288	constexpr Iterator();
				289	/** Create a container iterator for the metadata and allocation contained in the ITensor
				290	*
				291	* @param[in] tensor The tensor to associate to the iterator.
				292	* @param[in] window The window which will be used to iterate over the tensor.
				293	*/
				294	Iterator(const ITensor *tensor, const Window &window);
				295
				296	/** Increment the iterator along the specified dimension of the step value associated to the dimension.
				297	*
				298	* @warning It is the caller's responsibility to call increment(dimension+1) when reaching the end of a dimension, the iterator will not check for overflow.
				299	*
				300	* @note When incrementing a dimension 'n' the coordinates of all the dimensions in the range (0,n-1) are reset. For example if you iterate over a 2D image, everytime you change row (dimension 1), the iterator for the width (dimension 0) is reset to its start.
				301	*
				302	* @param[in] dimension Dimension to increment
				303	*/
				304	void increment(size_t dimension);
				305
				306	/** Return the offset in bytes from the first element to the current position of the iterator
				307	*
				308	* @return The current position of the iterator in bytes relative to the first element.
				309	*/
				310	constexpr int offset() const;
				311
				312	/** Return a pointer to the current pixel.
				313	*
				314	* @warning Only works if the iterator was created with an ITensor.
				315	*
				316	* @return equivalent to buffer() + offset()
				317	*/
				318	constexpr uint8_t *ptr() const;
				319
				320	/** Move the iterator back to the beginning of the specified dimension.
				321	*
				322	* @param[in] dimension Dimension to reset
				323	*/
				324	void reset(size_t dimension);
				325
				326	private:
				327	uint8_t *_ptr;
				328
				329	class Dimension
				330	{
				331	public:
				332	constexpr Dimension()
				333	: _dim_start(0), _stride(0)
				334	{
				335	}
				336
				337	int _dim_start;
				338	int _stride;
				339	};
				340
				341	std::array<Dimension, Coordinates::num_max_dimensions> _dims;
				342	};
				343
				344	/** Iterate through the passed window, automatically adjusting the iterators and calling the lambda_functino for each element.
				345	* It passes the x and y positions to the lambda_function for each iteration
				346	*
				347	* @param[in] w Window to iterate through.
				348	* @param[in] lambda_function The function of type void(function)( const Coordinates & id ) to call at each iteration.
				349	* Where id represents the absolute coordinates of the item to process.
				350	* @param[in,out] iterators Tensor iterators which will be updated by this function before calling lambda_function.
				351	*/
				352	template <typename L, typename... Ts>
				353	inline void execute_window_loop(const Window &w, L &&lambda_function, Ts &&... iterators);
				354
				355	/** Update window and padding size for each of the access patterns.
				356	*
				357	* First the window size is reduced based on all access patterns that are not
				358	* allowed to modify the padding of the underlying tensor. Then the padding of
				359	* the remaining tensors is increased to match the window.
				360	*
				361	* @param[in] win Window that is used by the kernel.
				362	* @param[in] patterns Access patterns used to calculate the final window and padding.
				363	*
				364	* @return True if the window has been changed. Changes to the padding do not
				365	* influence the returned value.
				366	*/
				367	template <typename... Ts>
				368	bool update_window_and_padding(Window &win, Ts &&... patterns)
				369	{
				370	bool window_changed = false;
				371
Diego Lopez Recas	490b3d8	2017-12-19 15:42:25 +0000	[diff] [blame]	372	utility::for_each([&](const IAccessWindow & w)
Anthony Barbier	6ff3b19	2017-09-04 18:44:23 +0100	[diff] [blame]	373	{
				374	window_changed \|= w.update_window_if_needed(win);
				375	},
				376	patterns...);
				377
				378	bool padding_changed = false;
				379
Diego Lopez Recas	35ceeb2	2017-12-04 18:56:10 +0000	[diff] [blame]	380	utility::for_each([&](IAccessWindow & w)
Anthony Barbier	6ff3b19	2017-09-04 18:44:23 +0100	[diff] [blame]	381	{
				382	padding_changed \|= w.update_padding_if_needed(win);
				383	},
				384	patterns...);
				385
				386	return window_changed;
				387	}
				388
				389	/** Calculate the maximum window for a given tensor shape and border setting
				390	*
Diego Lopez Recas	bcbc970	2017-12-18 11:28:27 +0000	[diff] [blame]	391	* @param[in] valid_region Valid region object defining the shape of the tensor space for which the window is created.
				392	* @param[in] steps (Optional) Number of elements processed for each step.
				393	* @param[in] skip_border (Optional) If true exclude the border region from the window.
				394	* @param[in] border_size (Optional) Border size.
				395	*
				396	* @return The maximum window the kernel can be executed on.
				397	*/
				398	Window calculate_max_window(const ValidRegion &valid_region, const Steps &steps = Steps(), bool skip_border = false, BorderSize border_size = BorderSize());
				399
				400	/** Calculate the maximum window for a given tensor shape and border setting
				401	*
Anthony Barbier	6ff3b19	2017-09-04 18:44:23 +0100	[diff] [blame]	402	* @param[in] info Tensor info object defining the shape of the object for which the window is created.
				403	* @param[in] steps (Optional) Number of elements processed for each step.
				404	* @param[in] skip_border (Optional) If true exclude the border region from the window.
				405	* @param[in] border_size (Optional) Border size.
				406	*
				407	* @return The maximum window the kernel can be executed on.
				408	*/
Diego Lopez Recas	bcbc970	2017-12-18 11:28:27 +0000	[diff] [blame]	409	inline Window calculate_max_window(const ITensorInfo &info, const Steps &steps = Steps(), bool skip_border = false, BorderSize border_size = BorderSize())
				410	{
				411	return calculate_max_window(info.valid_region(), steps, skip_border, border_size);
				412	}
				413
				414	/** Calculate the maximum window used by a horizontal kernel for a given tensor shape and border setting
				415	*
				416	* @param[in] valid_region Valid region object defining the shape of the tensor space for which the window is created.
				417	* @param[in] steps (Optional) Number of elements processed for each step.
				418	* @param[in] skip_border (Optional) If true exclude the border region from the window.
				419	* @param[in] border_size (Optional) Border size. The border region will be excluded from the window.
				420	*
				421	* @return The maximum window the kernel can be executed on.
				422	*/
				423	Window calculate_max_window_horizontal(const ValidRegion &valid_region, const Steps &steps = Steps(), bool skip_border = false, BorderSize border_size = BorderSize());
Anthony Barbier	6ff3b19	2017-09-04 18:44:23 +0100	[diff] [blame]	424
				425	/** Calculate the maximum window used by a horizontal kernel for a given tensor shape and border setting
				426	*
				427	* @param[in] info Tensor info object defining the shape of the object for which the window is created.
				428	* @param[in] steps (Optional) Number of elements processed for each step.
				429	* @param[in] skip_border (Optional) If true exclude the border region from the window.
Diego Lopez Recas	bcbc970	2017-12-18 11:28:27 +0000	[diff] [blame]	430	* @param[in] border_size (Optional) Border size.
Anthony Barbier	6ff3b19	2017-09-04 18:44:23 +0100	[diff] [blame]	431	*
				432	* @return The maximum window the kernel can be executed on.
				433	*/
Diego Lopez Recas	bcbc970	2017-12-18 11:28:27 +0000	[diff] [blame]	434	inline Window calculate_max_window_horizontal(const ITensorInfo &info, const Steps &steps = Steps(), bool skip_border = false, BorderSize border_size = BorderSize())
				435	{
				436	return calculate_max_window_horizontal(info.valid_region(), steps, skip_border, border_size);
				437	}
				438
				439	/** Calculate the maximum window for a given tensor shape and border setting. The window will also includes the border.
				440	*
				441	* @param[in] valid_region Valid region object defining the shape of the tensor space for which the window is created.
				442	* @param[in] steps (Optional) Number of elements processed for each step.
				443	* @param[in] border_size (Optional) Border size. The border region will be included in the window.
				444	*
				445	* @return The maximum window the kernel can be executed on.
				446	*/
				447	Window calculate_max_enlarged_window(const ValidRegion &valid_region, const Steps &steps = Steps(), BorderSize border_size = BorderSize());
Anthony Barbier	6ff3b19	2017-09-04 18:44:23 +0100	[diff] [blame]	448
				449	/** Calculate the maximum window for a given tensor shape and border setting. The window will also includes the border.
				450	*
				451	* @param[in] info Tensor info object defining the shape of the object for which the window is created.
				452	* @param[in] steps (Optional) Number of elements processed for each step.
				453	* @param[in] border_size (Optional) Border size. The border region will be included in the window.
				454	*
				455	* @return The maximum window the kernel can be executed on.
				456	*/
Diego Lopez Recas	bcbc970	2017-12-18 11:28:27 +0000	[diff] [blame]	457	inline Window calculate_max_enlarged_window(const ITensorInfo &info, const Steps &steps = Steps(), BorderSize border_size = BorderSize())
				458	{
				459	return calculate_max_enlarged_window(info.valid_region(), steps, border_size);
				460	}
Anthony Barbier	6ff3b19	2017-09-04 18:44:23 +0100	[diff] [blame]	461
				462	/** Intersect multiple valid regions.
				463	*
				464	* @param[in] regions Valid regions.
				465	*
				466	* @return Intersection of all regions.
				467	*/
				468	template <typename... Ts>
Diego Lopez Recas	490b3d8	2017-12-19 15:42:25 +0000	[diff] [blame]	469	ValidRegion intersect_valid_regions(const Ts &... regions)
Anthony Barbier	6ff3b19	2017-09-04 18:44:23 +0100	[diff] [blame]	470	{
				471	auto intersect = [](const ValidRegion & r1, const ValidRegion & r2) -> ValidRegion
				472	{
				473	ValidRegion region;
				474
				475	for(size_t d = 0; d < std::min(r1.anchor.num_dimensions(), r2.anchor.num_dimensions()); ++d)
				476	{
				477	region.anchor.set(d, std::max(r1.anchor[d], r2.anchor[d]));
				478	}
				479
				480	for(size_t d = 0; d < std::min(r1.shape.num_dimensions(), r2.shape.num_dimensions()); ++d)
				481	{
				482	region.shape.set(d, std::min(r1.shape[d], r2.shape[d]));
				483	}
				484
				485	return region;
				486	};
				487
Diego Lopez Recas	490b3d8	2017-12-19 15:42:25 +0000	[diff] [blame]	488	return utility::foldl(intersect, regions...);
Anthony Barbier	6ff3b19	2017-09-04 18:44:23 +0100	[diff] [blame]	489	}
				490
				491	/** Create a strides object based on the provided strides and the tensor dimensions.
				492	*
				493	* @param[in] info Tensor info object providing the shape of the tensor for unspecified strides.
				494	* @param[in] stride_x Stride to be used in X dimension (in bytes).
				495	* @param[in] fixed_strides Strides to be used in higher dimensions starting at Y (in bytes).
				496	*
				497	* @return Strides object based on the specified strides. Missing strides are
				498	* calculated based on the tensor shape and the strides of lower dimensions.
				499	*/
				500	template <typename T, typename... Ts>
				501	inline Strides compute_strides(const ITensorInfo &info, T stride_x, Ts &&... fixed_strides)
				502	{
				503	const TensorShape &shape = info.tensor_shape();
				504
				505	// Create strides object
				506	Strides strides(stride_x, fixed_strides...);
				507
				508	for(size_t i = 1 + sizeof...(Ts); i < info.num_dimensions(); ++i)
				509	{
				510	strides.set(i, shape[i - 1] * strides[i - 1]);
				511	}
				512
				513	return strides;
				514	}
				515
				516	/** Create a strides object based on the tensor dimensions.
				517	*
				518	* @param[in] info Tensor info object used to compute the strides.
				519	*
				520	* @return Strides object based on element size and tensor shape.
				521	*/
				522	template <typename... Ts>
				523	inline Strides compute_strides(const ITensorInfo &info)
				524	{
				525	return compute_strides(info, info.element_size());
				526	}
				527
Georgios Pinitas	8795ffb	2017-12-01 16:13:40 +0000	[diff] [blame]	528	/** Permutes given Dimensions according to a permutation vector
				529	*
				530	* @warning Validity of permutation is not checked
				531	*
				532	* @param[in, out] dimensions Dimensions to permute
				533	* @param[in] perm Permutation vector
				534	*/
				535	template <typename T>
				536	inline void permute(Dimensions<T> &dimensions, const PermutationVector &perm)
				537	{
Georgios Pinitas	69af6cf	2018-02-14 19:23:44 +0000	[diff] [blame]	538	auto dimensions_copy = utility::make_array<Dimensions<T>::num_max_dimensions>(dimensions.begin(), dimensions.end());
Georgios Pinitas	8795ffb	2017-12-01 16:13:40 +0000	[diff] [blame]	539	for(unsigned int i = 0; i < perm.num_dimensions(); ++i)
				540	{
Georgios Pinitas	69af6cf	2018-02-14 19:23:44 +0000	[diff] [blame]	541	T dimension_val = (perm[i] < dimensions.num_dimensions()) ? dimensions_copy[perm[i]] : 0;
				542	dimensions.set(i, dimension_val);
				543	}
				544	}
				545
				546	/** Permutes given TensorShape according to a permutation vector
				547	*
				548	* @warning Validity of permutation is not checked
				549	*
				550	* @param[in, out] shape Shape to permute
				551	* @param[in] perm Permutation vector
				552	*/
				553	inline void permute(TensorShape &shape, const PermutationVector &perm)
				554	{
Giorgio Arena	563494c	2018-04-30 17:29:41 +0100	[diff] [blame]	555	TensorShape shape_copy = shape;
Georgios Pinitas	69af6cf	2018-02-14 19:23:44 +0000	[diff] [blame]	556	for(unsigned int i = 0; i < perm.num_dimensions(); ++i)
				557	{
				558	size_t dimension_val = (perm[i] < shape.num_dimensions()) ? shape_copy[perm[i]] : 1;
Giorgio Arena	563494c	2018-04-30 17:29:41 +0100	[diff] [blame]	559	shape.set(i, dimension_val, false); // Avoid changes in _num_dimension
Georgios Pinitas	8795ffb	2017-12-01 16:13:40 +0000	[diff] [blame]	560	}
				561	}
				562
Vidhya Sudhan Loganathan	7485d5a	2018-07-04 09:34:00 +0100	[diff] [blame]	563	/** Auto initialize the tensor info (shape, number of channels and data type) if the current assignment is empty.
Anthony Barbier	6ff3b19	2017-09-04 18:44:23 +0100	[diff] [blame]	564	*
Vidhya Sudhan Loganathan	7485d5a	2018-07-04 09:34:00 +0100	[diff] [blame]	565	* @param[in,out] info Tensor info used to check and assign.
				566	* @param[in] shape New shape.
				567	* @param[in] num_channels New number of channels.
				568	* @param[in] data_type New data type
				569	* @param[in] quantization_info (Optional) New quantization info
Anthony Barbier	6ff3b19	2017-09-04 18:44:23 +0100	[diff] [blame]	570	*
				571	* @return True if the tensor info has been initialized
				572	*/
Georgios Pinitas	05078ec	2017-11-02 13:06:59 +0000	[diff] [blame]	573	bool auto_init_if_empty(ITensorInfo &info,
				574	const TensorShape &shape,
				575	int num_channels, DataType data_type,
Georgios Pinitas	05078ec	2017-11-02 13:06:59 +0000	[diff] [blame]	576	QuantizationInfo quantization_info = QuantizationInfo());
Anthony Barbier	6ff3b19	2017-09-04 18:44:23 +0100	[diff] [blame]	577
Georgios Pinitas	283c179	2017-11-10 18:14:06 +0000	[diff] [blame]	578	/** Auto initialize the tensor info using another tensor info.
				579	*
				580	* @param info_sink Tensor info used to check and assign
				581	* @param info_source Tensor info used to assign
				582	*
				583	* @return True if the tensor info has been initialized
				584	*/
Pablo Palmier	a2b89ca	2017-10-05 15:01:34 +0100	[diff] [blame]	585	bool auto_init_if_empty(ITensorInfo &info_sink, const ITensorInfo &info_source);
Georgios Pinitas	283c179	2017-11-10 18:14:06 +0000	[diff] [blame]	586
Alex Gilday	c357c47	2018-03-21 13:54:09 +0000	[diff] [blame]	587	/** Set the shape to the specified value if the current assignment is empty.
Anthony Barbier	6ff3b19	2017-09-04 18:44:23 +0100	[diff] [blame]	588	*
				589	* @param[in,out] info Tensor info used to check and assign.
				590	* @param[in] shape New shape.
				591	*
				592	* @return True if the shape has been changed.
				593	*/
				594	bool set_shape_if_empty(ITensorInfo &info, const TensorShape &shape);
				595
Alex Gilday	c357c47	2018-03-21 13:54:09 +0000	[diff] [blame]	596	/** Set the format, data type and number of channels to the specified value if
Anthony Barbier	6ff3b19	2017-09-04 18:44:23 +0100	[diff] [blame]	597	* the current data type is unknown.
				598	*
				599	* @param[in,out] info Tensor info used to check and assign.
				600	* @param[in] format New format.
				601	*
				602	* @return True if the format has been changed.
				603	*/
				604	bool set_format_if_unknown(ITensorInfo &info, Format format);
				605
Alex Gilday	c357c47	2018-03-21 13:54:09 +0000	[diff] [blame]	606	/** Set the data type and number of channels to the specified value if
Anthony Barbier	6ff3b19	2017-09-04 18:44:23 +0100	[diff] [blame]	607	* the current data type is unknown.
				608	*
				609	* @param[in,out] info Tensor info used to check and assign.
				610	* @param[in] data_type New data type.
				611	*
				612	* @return True if the data type has been changed.
				613	*/
				614	bool set_data_type_if_unknown(ITensorInfo &info, DataType data_type);
				615
Alex Gilday	c357c47	2018-03-21 13:54:09 +0000	[diff] [blame]	616	/** Set the data layout to the specified value if
Isabella Gottardi	d17a677	2018-02-27 17:41:55 +0000	[diff] [blame]	617	* the current data layout is unknown.
				618	*
				619	* @param[in,out] info Tensor info used to check and assign.
				620	* @param[in] data_layout New data layout.
				621	*
				622	* @return True if the data type has been changed.
				623	*/
				624	bool set_data_layout_if_unknown(ITensorInfo &info, DataLayout data_layout);
				625
Alex Gilday	c357c47	2018-03-21 13:54:09 +0000	[diff] [blame]	626	/** Set the quantization info to the specified value if
Georgios Pinitas	05078ec	2017-11-02 13:06:59 +0000	[diff] [blame]	627	* the current quantization info is empty and the data type of asymmetric quantized type
				628	*
				629	* @param[in,out] info Tensor info used to check and assign.
				630	* @param[in] quantization_info Quantization info
				631	*
				632	* @return True if the quantization info has been changed.
				633	*/
				634	bool set_quantization_info_if_empty(ITensorInfo &info, QuantizationInfo quantization_info);
				635
Isabella Gottardi	1fab09f	2017-07-13 15:55:57 +0100	[diff] [blame]	636	/** Helper function to calculate the Valid Region for Scale.
				637	*
Diego Lopez Recas	0085429	2018-02-22 13:08:01 +0000	[diff] [blame]	638	* @param[in] src_info Input tensor info used to check.
				639	* @param[in] dst_shape Shape of the output.
				640	* @param[in] interpolate_policy Interpolation policy.
				641	* @param[in] sampling_policy Sampling policy.
				642	* @param[in] border_undefined True if the border is undefined.
Isabella Gottardi	1fab09f	2017-07-13 15:55:57 +0100	[diff] [blame]	643	*
Diego Lopez Recas	0085429	2018-02-22 13:08:01 +0000	[diff] [blame]	644	* @return The corresponding valid region
Isabella Gottardi	1fab09f	2017-07-13 15:55:57 +0100	[diff] [blame]	645	*/
Diego Lopez Recas	0085429	2018-02-22 13:08:01 +0000	[diff] [blame]	646	ValidRegion calculate_valid_region_scale(const ITensorInfo &src_info, const TensorShape &dst_shape,
				647	InterpolationPolicy interpolate_policy, SamplingPolicy sampling_policy, bool border_undefined);
Georgios Pinitas	05078ec	2017-11-02 13:06:59 +0000	[diff] [blame]	648
Georgios Pinitas	5ee66ea	2017-09-07 17:29:16 +0100	[diff] [blame]	649	/** Convert a linear index into n-dimensional coordinates.
				650	*
				651	* @param[in] shape Shape of the n-dimensional tensor.
				652	* @param[in] index Linear index specifying the i-th element.
				653	*
				654	* @return n-dimensional coordinates.
				655	*/
				656	inline Coordinates index2coords(const TensorShape &shape, int index);
Georgios Pinitas	05078ec	2017-11-02 13:06:59 +0000	[diff] [blame]	657
Georgios Pinitas	5ee66ea	2017-09-07 17:29:16 +0100	[diff] [blame]	658	/** Convert n-dimensional coordinates into a linear index.
				659	*
				660	* @param[in] shape Shape of the n-dimensional tensor.
				661	* @param[in] coord N-dimensional coordinates.
				662	*
				663	* @return linead index
				664	*/
				665	inline int coords2index(const TensorShape &shape, const Coordinates &coord);
Isabella Gottardi	d17a677	2018-02-27 17:41:55 +0000	[diff] [blame]	666
Alex Gilday	c357c47	2018-03-21 13:54:09 +0000	[diff] [blame]	667	/** Get the index of the given dimension.
Isabella Gottardi	d17a677	2018-02-27 17:41:55 +0000	[diff] [blame]	668	*
Alex Gilday	c357c47	2018-03-21 13:54:09 +0000	[diff] [blame]	669	* @param[in] data_layout The data layout.
				670	* @param[in] data_layout_dimension The dimension which this index is requested for.
Isabella Gottardi	d17a677	2018-02-27 17:41:55 +0000	[diff] [blame]	671	*
				672	* @return The int conversion of the requested data layout index.
				673	*/
Isabella Gottardi	d56e770	2018-02-28 14:29:36 +0000	[diff] [blame]	674	inline size_t get_data_layout_dimension_index(const DataLayout data_layout, const DataLayoutDimension data_layout_dimension);
Georgios Pinitas	e222055	2018-07-20 13:23:44 +0100	[diff] [blame]	675
				676	/** Calculate the normalization dimension index for a given normalization type
				677	*
				678	* @param[in] layout Data layout of the input and output tensor
				679	* @param[in] info Normalization info
				680	*
				681	* @return Normalization dimension index
				682	*/
				683	inline unsigned int get_normalization_dimension_index(DataLayout layout, const NormalizationLayerInfo &info)
				684	{
				685	const unsigned int width_idx = get_data_layout_dimension_index(layout, DataLayoutDimension::WIDTH);
				686	const unsigned int channel_idx = get_data_layout_dimension_index(layout, DataLayoutDimension::CHANNEL);
				687
				688	return info.is_in_map() ? width_idx : channel_idx;
				689	}
				690
				691	/** Calculate the number of output tiles required by Winograd Convolution layer. This utility function can be used by the Winograd input transform
				692	* to know the number of tiles on the x and y direction
				693	*
				694	* @param[in] in_dims Spatial dimensions of the input tensor of convolution layer
				695	* @param[in] kernel_size Kernel size
				696	* @param[in] output_tile_size Size of a single output tile
				697	* @param[in] conv_info Convolution info (i.e. pad, stride,...)
				698	*
				699	* @return the number of output tiles along the x and y directions of size "output_tile_size"
				700	*/
				701	inline Size2D compute_winograd_convolution_tiles(const Size2D &in_dims, const Size2D &kernel_size, const Size2D &output_tile_size, const PadStrideInfo &conv_info)
				702	{
				703	int num_tiles_x = std::ceil((in_dims.width - (kernel_size.width - 1) + conv_info.pad_left() + conv_info.pad_right()) / static_cast<float>(output_tile_size.width));
				704	int num_tiles_y = std::ceil((in_dims.height - (kernel_size.height - 1) + conv_info.pad_top() + conv_info.pad_bottom()) / static_cast<float>(output_tile_size.height));
				705
				706	// Clamp in case we provide paddings but we have 1D convolution
				707	num_tiles_x = std::min(num_tiles_x, static_cast<int>(in_dims.width));
				708	num_tiles_y = std::min(num_tiles_y, static_cast<int>(in_dims.height));
				709
				710	return Size2D(num_tiles_x, num_tiles_y);
				711	}
				712
Gian Marco Iodice	8aa985e	2018-11-27 15:58:08 +0000	[diff] [blame^]	713	/** Wrap-around a number within the range 0 <= x < m
				714	*
				715	* @param[in] x Input value
				716	* @param[in] m Range
				717	*
				718	* @return the wrapped-around number
				719	*/
				720	template <typename T>
				721	inline T wrap_around(T x, T m)
				722	{
				723	return x >= 0 ? x % m : (x % m + m) % m;
				724	}
Anthony Barbier	6ff3b19	2017-09-04 18:44:23 +0100	[diff] [blame]	725	} // namespace arm_compute
				726
				727	#include "arm_compute/core/Helpers.inl"
				728	#endif /__ARM_COMPUTE_HELPERS_H__ /