Blame - arm_compute/core/utils/misc/ShapeCalculator.h - ml/ComputeLibrary

blob: 8a00c22306be8cdea86d05d11990484d91fbb005 [file] [log] [blame]

Georgios Pinitas	358ca20	2017-12-07 16:47:52 +0000	[diff] [blame]	1	/*
Gian Marco	36a0a46	2018-01-12 10:21:40 +0000	[diff] [blame]	2	* Copyright (c) 2017-2018 ARM Limited.
Georgios Pinitas	358ca20	2017-12-07 16:47:52 +0000	[diff] [blame]	3	*
				4	* SPDX-License-Identifier: MIT
				5	*
				6	* Permission is hereby granted, free of charge, to any person obtaining a copy
				7	* of this software and associated documentation files (the "Software"), to
				8	* deal in the Software without restriction, including without limitation the
				9	* rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
				10	* sell copies of the Software, and to permit persons to whom the Software is
				11	* furnished to do so, subject to the following conditions:
				12	*
				13	* The above copyright notice and this permission notice shall be included in all
				14	* copies or substantial portions of the Software.
				15	*
				16	* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
				17	* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
				18	* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
				19	* AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
				20	* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
				21	* OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
				22	* SOFTWARE.
				23	*/
				24	#ifndef __ARM_COMPUTE_MISC_SHAPE_CALCULATOR_H__
				25	#define __ARM_COMPUTE_MISC_SHAPE_CALCULATOR_H__
				26
Georgios Pinitas	9be0c5a	2018-02-19 12:46:29 +0000	[diff] [blame]	27	#include "arm_compute/core/Helpers.h"
Georgios Pinitas	358ca20	2017-12-07 16:47:52 +0000	[diff] [blame]	28	#include "arm_compute/core/ITensorInfo.h"
Georgios Pinitas	1250a5a	2018-01-02 13:27:37 +0000	[diff] [blame]	29	#include "arm_compute/core/Utils.h"
Georgios Pinitas	358ca20	2017-12-07 16:47:52 +0000	[diff] [blame]	30
Gian Marco Iodice	d2fab73	2018-03-02 11:18:12 +0000	[diff] [blame]	31	#include <cmath>
				32
Georgios Pinitas	358ca20	2017-12-07 16:47:52 +0000	[diff] [blame]	33	namespace arm_compute
				34	{
				35	namespace misc
				36	{
				37	namespace shape_calculator
				38	{
Abe Mbise	7784c83	2018-05-31 16:48:41 +0100	[diff] [blame]	39	inline TensorShape compute_vector_to_tensor_output_shape(const TensorShape &input, size_t conv_w, size_t conv_h, const DataLayout &data_layout)
				40	{
				41	const size_t idx_w = get_data_layout_dimension_index(data_layout, DataLayoutDimension::WIDTH);
				42	const size_t idx_h = get_data_layout_dimension_index(data_layout, DataLayoutDimension::HEIGHT);
				43	const size_t idx_c = get_data_layout_dimension_index(data_layout, DataLayoutDimension::CHANNEL);
				44
				45	TensorShape output_shape(input);
				46	output_shape.set(idx_w, conv_w);
				47	output_shape.set(idx_h, conv_h);
				48	output_shape.set(idx_c, input.x() / (conv_w * conv_h));
				49
				50	return output_shape;
				51	}
Pablo Tello	00afd11	2018-01-04 10:34:24 +0000	[diff] [blame]	52	inline TensorShape compute_permutation_output_shape(const ITensorInfo &input, const PermutationVector &perm)
				53	{
				54	TensorShape output_shape = input.tensor_shape();
				55	permute(output_shape, perm);
				56	return output_shape;
				57	}
Giorgio Arena	c6aa49b	2018-08-07 11:53:30 +0100	[diff] [blame]	58	inline TensorShape compute_weights_reshaped_shape(const ITensorInfo &weights, bool has_bias = false, const unsigned int num_groups = 1)
Georgios Pinitas	78c0090	2018-01-09 17:33:11 +0000	[diff] [blame]	59	{
Giorgio Arena	088c2b0	2018-08-07 16:59:05 +0100	[diff] [blame]	60	// Number of groups greater than one are only supported for NCHW data layout, and the number of weights must be a multiple of it.
				61
Giorgio Arena	c6aa49b	2018-08-07 11:53:30 +0100	[diff] [blame]	62	ARM_COMPUTE_ERROR_ON(num_groups == 0);
				63	ARM_COMPUTE_ERROR_ON((weights.dimension(3) % num_groups) != 0);
				64	ARM_COMPUTE_ERROR_ON(weights.data_layout() == DataLayout::NHWC && num_groups > 1);
				65
Georgios Pinitas	78c0090	2018-01-09 17:33:11 +0000	[diff] [blame]	66	// Calculate output shape
				67	TensorShape weights_reshaped{ weights.tensor_shape() };
				68	weights_reshaped.collapse(3);
				69	const size_t tmp_dim = weights_reshaped[0];
Giorgio Arena	c6aa49b	2018-08-07 11:53:30 +0100	[diff] [blame]	70	weights_reshaped.set(0, weights_reshaped[1] / num_groups);
Georgios Pinitas	78c0090	2018-01-09 17:33:11 +0000	[diff] [blame]	71	weights_reshaped.set(1, tmp_dim + (has_bias ? 1 : 0));
Giorgio Arena	c6aa49b	2018-08-07 11:53:30 +0100	[diff] [blame]	72	if(weights.num_dimensions() < 5)
				73	{
				74	weights_reshaped.set(2, num_groups);
				75	}
Georgios Pinitas	78c0090	2018-01-09 17:33:11 +0000	[diff] [blame]	76
				77	return weights_reshaped;
				78	}
Gian Marco Iodice	68a3f56	2018-07-26 11:44:03 +0100	[diff] [blame]	79	inline TensorShape compute_interleaved_shape(const ITensorInfo &a, int mult_interleave4x4_height = 1, bool reinterpret_input_as_3d = false)
Georgios Pinitas	358ca20	2017-12-07 16:47:52 +0000	[diff] [blame]	80	{
Gian Marco	36a0a46	2018-01-12 10:21:40 +0000	[diff] [blame]	81	// The interleaved output matrix will have the following shape: [ a_height * W, ceil(a_width / W) ] where W = 4 * mult_interleave4x4_height
				82	ARM_COMPUTE_ERROR_ON(mult_interleave4x4_height < 1);
				83	const int interleave_width = 4 * mult_interleave4x4_height;
Georgios Pinitas	358ca20	2017-12-07 16:47:52 +0000	[diff] [blame]	84	TensorShape shape_interleaved_a{ a.tensor_shape() };
Gian Marco	36a0a46	2018-01-12 10:21:40 +0000	[diff] [blame]	85	shape_interleaved_a.set(0, a.dimension(0) * interleave_width);
Gian Marco Iodice	68a3f56	2018-07-26 11:44:03 +0100	[diff] [blame]	86	if(reinterpret_input_as_3d)
				87	{
				88	const int M = a.dimension(1) * a.dimension(2);
				89	const int height = std::ceil(M / static_cast<float>(interleave_width));
				90	shape_interleaved_a.set(1, height);
				91	shape_interleaved_a.remove_dimension(2);
				92	}
				93	else
				94	{
				95	shape_interleaved_a.set(1, std::ceil(a.dimension(1) / static_cast<float>(interleave_width)));
				96	}
Georgios Pinitas	358ca20	2017-12-07 16:47:52 +0000	[diff] [blame]	97
				98	return shape_interleaved_a;
				99	}
				100	inline TensorShape compute_transpose1xW_shape(const ITensorInfo &b)
				101	{
				102	// The transpose1xW output matrix will have the following shape: [ b_height * 16, ceil(b_width / 16.0f) ]
				103	TensorShape shape_transposed1xW_b{ b.tensor_shape() };
				104	shape_transposed1xW_b.set(0, b.dimension(1) * 16);
				105	shape_transposed1xW_b.set(1, std::ceil(b.dimension(0) / 16.f));
				106
				107	return shape_transposed1xW_b;
				108	}
Gian Marco	36a0a46	2018-01-12 10:21:40 +0000	[diff] [blame]	109	inline TensorShape compute_transpose1xW_with_element_size_shape(const ITensorInfo &b, int mult_transpose1xW_width = 1)
Georgios Pinitas	358ca20	2017-12-07 16:47:52 +0000	[diff] [blame]	110	{
Gian Marco	36a0a46	2018-01-12 10:21:40 +0000	[diff] [blame]	111	// Note: mult_transpose1xW_width expresses the number of chunks with size 1x(W) we want to store on the same row
				112	// The transpose1xW output matrix will have the following shape:
				113	// [ b_height * W, ceil(b_width / W) ] where W = (16 / element size of the tensor) * mult_transpose1xW_width
				114	ARM_COMPUTE_ERROR_ON(mult_transpose1xW_width < 1);
Georgios Pinitas	358ca20	2017-12-07 16:47:52 +0000	[diff] [blame]	115	TensorShape shape_transposed1xW_b{ b.tensor_shape() };
Gian Marco	36a0a46	2018-01-12 10:21:40 +0000	[diff] [blame]	116	const size_t transpose_width = (16 / b.element_size()) * mult_transpose1xW_width;
Georgios Pinitas	358ca20	2017-12-07 16:47:52 +0000	[diff] [blame]	117	shape_transposed1xW_b.set(0, b.dimension(1) * transpose_width);
				118	shape_transposed1xW_b.set(1, static_cast<size_t>(std::ceil(b.dimension(0) / static_cast<float>(transpose_width))));
				119
				120	return shape_transposed1xW_b;
				121	}
				122	inline TensorShape compute_reductionA_shape(const ITensorInfo &b)
				123	{
				124	TensorShape shape_vector_sum_col{ b.tensor_shape() };
				125	if(shape_vector_sum_col.num_dimensions() > 1)
				126	{
				127	shape_vector_sum_col.remove_dimension(1);
				128	}
				129
				130	return shape_vector_sum_col;
				131	}
				132	inline TensorShape compute_reductionB_shape(const ITensorInfo &a)
				133	{
				134	TensorShape shape_vector_sum_row{ a.tensor_shape() };
				135	shape_vector_sum_row.set(Window::DimX, a.dimension(1));
				136	if(a.num_dimensions() > 1)
				137	{
				138	shape_vector_sum_row.remove_dimension(1);
				139	}
				140
				141	return shape_vector_sum_row;
				142	}
Michele Di Giorgio	980002b	2018-08-08 09:25:51 +0100	[diff] [blame]	143	inline TensorShape compute_col2im_shape(const ITensorInfo &input, std::pair<unsigned int, unsigned int> convolved_dims, unsigned int num_groups = 1)
Georgios Pinitas	78c0090	2018-01-09 17:33:11 +0000	[diff] [blame]	144	{
Michele Di Giorgio	980002b	2018-08-08 09:25:51 +0100	[diff] [blame]	145	ARM_COMPUTE_ERROR_ON(num_groups == 0);
				146	ARM_COMPUTE_ERROR_ON(input.tensor_shape()[1] != (convolved_dims.first * convolved_dims.second));
				147	ARM_COMPUTE_ERROR_ON((num_groups > 1) && input.tensor_shape()[2] != num_groups);
				148
Georgios Pinitas	78c0090	2018-01-09 17:33:11 +0000	[diff] [blame]	149	TensorShape col2im_shape{ input.tensor_shape() };
				150	col2im_shape.set(0, convolved_dims.first);
				151	col2im_shape.set(1, convolved_dims.second);
Michele Di Giorgio	980002b	2018-08-08 09:25:51 +0100	[diff] [blame]	152	col2im_shape.set(2, input.tensor_shape()[0] * num_groups);
				153
				154	const unsigned int batch_idx = (num_groups == 1) ? 2 : 3;
				155	col2im_shape.set(3, input.tensor_shape()[batch_idx]);
Georgios Pinitas	78c0090	2018-01-09 17:33:11 +0000	[diff] [blame]	156
				157	return col2im_shape;
				158	}
Georgios Pinitas	358ca20	2017-12-07 16:47:52 +0000	[diff] [blame]	159	inline TensorShape compute_transposed_shape(const ITensorInfo &input)
				160	{
				161	TensorShape shape_transposed{ input.tensor_shape() };
				162
				163	shape_transposed.set(0, input.dimension(1));
				164	shape_transposed.set(1, input.dimension(0));
				165
				166	return shape_transposed;
				167	}
Giorgio Arena	7657224	2018-04-04 17:44:26 +0100	[diff] [blame]	168	inline TensorShape compute_depthwise_convolution_shape(const ITensorInfo &input, const ITensorInfo &weights, PadStrideInfo conv_info, unsigned int depth_multiplier)
Georgios Pinitas	1250a5a	2018-01-02 13:27:37 +0000	[diff] [blame]	169	{
				170	const TensorShape input_shape{ input.tensor_shape() };
				171	const TensorShape weights_shape{ weights.tensor_shape() };
				172
Giorgio Arena	dfca60b	2018-01-31 10:30:59 +0000	[diff] [blame]	173	const DataLayout data_layout = input.data_layout();
				174	const int width_idx = get_data_layout_dimension_index(data_layout, DataLayoutDimension::WIDTH);
				175	const int height_idx = get_data_layout_dimension_index(data_layout, DataLayoutDimension::HEIGHT);
Giorgio Arena	7657224	2018-04-04 17:44:26 +0100	[diff] [blame]	176	const int channel_idx = get_data_layout_dimension_index(data_layout, DataLayoutDimension::CHANNEL);
Giorgio Arena	dfca60b	2018-01-31 10:30:59 +0000	[diff] [blame]	177
Georgios Pinitas	1250a5a	2018-01-02 13:27:37 +0000	[diff] [blame]	178	unsigned int output_width = 0;
				179	unsigned int output_height = 0;
Giorgio Arena	dfca60b	2018-01-31 10:30:59 +0000	[diff] [blame]	180	std::tie(output_width, output_height) = scaled_dimensions(input_shape[width_idx], input_shape[height_idx],
				181	weights_shape[width_idx], weights_shape[height_idx],
Georgios Pinitas	d05dce4	2018-01-22 16:29:17 +0000	[diff] [blame]	182	conv_info);
Georgios Pinitas	1250a5a	2018-01-02 13:27:37 +0000	[diff] [blame]	183
				184	TensorShape output_shape{ input_shape };
Giorgio Arena	dfca60b	2018-01-31 10:30:59 +0000	[diff] [blame]	185	output_shape.set(width_idx, output_width);
				186	output_shape.set(height_idx, output_height);
Giorgio Arena	7657224	2018-04-04 17:44:26 +0100	[diff] [blame]	187	output_shape.set(channel_idx, input_shape[channel_idx] * depth_multiplier);
Georgios Pinitas	1250a5a	2018-01-02 13:27:37 +0000	[diff] [blame]	188
				189	return output_shape;
				190	}
Michalis Spyrou	780db4e	2017-11-23 09:49:51 +0000	[diff] [blame]	191	inline TensorShape compute_deconvolution_shape(const ITensorInfo &input, unsigned int sx, unsigned int sy, unsigned int inner_border_right, unsigned int inner_border_top, const PadStrideInfo &info)
				192	{
				193	TensorShape scale_out_shape(input.tensor_shape());
				194	const unsigned int out_x = input.dimension(0) + (input.dimension(0) - 1) * (sx - 1) + inner_border_right + 2 * info.pad().first;
				195	const unsigned int out_y = input.dimension(1) + (input.dimension(1) - 1) * (sy - 1) + inner_border_top + 2 * info.pad().second;
				196	scale_out_shape.set(0, out_x);
				197	scale_out_shape.set(1, out_y);
				198
				199	return scale_out_shape;
				200	}
Giorgio Arena	0f17039	2018-07-18 16:13:12 +0100	[diff] [blame]	201	inline TensorShape compute_im2col_conv_shape(const ITensorInfo *input, const Size2D &kernel_dims, const PadStrideInfo &conv_info, bool has_bias, const Size2D &dilation, bool batch_size_on_z,
				202	unsigned int num_groups = 1)
Giorgio Arena	156fcf3	2018-03-09 15:30:43 +0000	[diff] [blame]	203	{
Giorgio Arena	0f17039	2018-07-18 16:13:12 +0100	[diff] [blame]	204	// The output shape will be the 3D shape [ out_channels * kernel_area, num_elems_per_out_channel, batches ] if batch_size_on_z == true
				205	// or the 4D shape [ out_channels * kernel_area / num_groups, num_elems_per_out_channel, num_groups, batches ] if batch_size_on_z == false
				206
				207	ARM_COMPUTE_ERROR_ON(num_groups == 0);
				208	ARM_COMPUTE_ERROR_ON(num_groups > 1 && input->data_layout() != DataLayout::NCHW);
				209	ARM_COMPUTE_ERROR_ON(num_groups > 1 && batch_size_on_z);
Giorgio Arena	156fcf3	2018-03-09 15:30:43 +0000	[diff] [blame]	210
				211	TensorShape output_shape{ input->tensor_shape() };
				212
				213	const DataLayout data_layout = input->data_layout();
				214	const int width_idx = get_data_layout_dimension_index(data_layout, DataLayoutDimension::WIDTH);
				215	const int height_idx = get_data_layout_dimension_index(data_layout, DataLayoutDimension::HEIGHT);
				216	const int channel_idx = get_data_layout_dimension_index(data_layout, DataLayoutDimension::CHANNEL);
				217
				218	std::pair<unsigned int, unsigned int> out_dims = scaled_dimensions(output_shape[width_idx], output_shape[height_idx], kernel_dims.width, kernel_dims.height, conv_info, dilation);
Giorgio Arena	0f17039	2018-07-18 16:13:12 +0100	[diff] [blame]	219	output_shape.set(0, (output_shape[channel_idx] / num_groups * kernel_dims.area() + (has_bias ? 1 : 0))); // NOLINT
Giorgio Arena	f485a10	2018-04-20 16:06:21 +0100	[diff] [blame]	220	output_shape.set(1, (out_dims.first * out_dims.second));
Gian Marco Iodice	597a856	2018-08-01 15:06:06 +0100	[diff] [blame]	221	if(batch_size_on_z && output_shape.num_dimensions() >= 3)
				222	{
				223	output_shape.remove_dimension(2);
				224	}
				225	else
				226	{
Giorgio Arena	0f17039	2018-07-18 16:13:12 +0100	[diff] [blame]	227	output_shape.set(2, num_groups);
Gian Marco Iodice	597a856	2018-08-01 15:06:06 +0100	[diff] [blame]	228	}
Giorgio Arena	156fcf3	2018-03-09 15:30:43 +0000	[diff] [blame]	229
				230	return output_shape;
				231	}
Gian Marco Iodice	215b4ea	2018-06-28 16:29:29 +0100	[diff] [blame]	232	inline TensorShape compute_flatten_shape(const ITensorInfo *input)
Ioan-Cristian Szabo	b4e3e1c	2017-11-30 17:17:17 +0000	[diff] [blame]	233	{
Gian Marco Iodice	215b4ea	2018-06-28 16:29:29 +0100	[diff] [blame]	234	// The output shape will be the flatten version of the input (i.e. [ width * height * channels, num_batches, ... ] ). Used for FlattenLayer and FullyConnectedLayer.
				235
Ioan-Cristian Szabo	b4e3e1c	2017-11-30 17:17:17 +0000	[diff] [blame]	236	TensorShape output_shape{ input->tensor_shape() };
				237
Gian Marco Iodice	215b4ea	2018-06-28 16:29:29 +0100	[diff] [blame]	238	output_shape.collapse(3);
Giorgio Arena	156fcf3	2018-03-09 15:30:43 +0000	[diff] [blame]	239
				240	return output_shape;
				241	}
Ioan-Cristian Szabo	b4e3e1c	2017-11-30 17:17:17 +0000	[diff] [blame]	242	inline TensorShape compute_interleave_custom_shape(const TensorShape &input, const int x_interleave, const int y_interleave)
				243	{
				244	TensorShape output_shape{ input };
				245
				246	output_shape.set(0, output_shape.x() * x_interleave);
				247	output_shape.set(1, std::ceil(output_shape.y() / static_cast<float>(y_interleave)));
				248
				249	return output_shape;
				250	}
Ioan-Cristian Szabo	b4e3e1c	2017-11-30 17:17:17 +0000	[diff] [blame]	251	inline TensorShape compute_fully_connected_reshaped_weights_shape(const ITensorInfo *input, bool transpose_weights, bool is_batched_fc_layer, const int interleave)
				252	{
				253	TensorShape output_shape{ input->tensor_shape() };
				254
				255	// Transpose weights if the user hasn't done it
				256	if(transpose_weights)
				257	{
				258	output_shape = compute_transposed_shape(*input);
				259	}
				260
Gian Marco Iodice	7e4b239	2018-02-22 16:17:20 +0000	[diff] [blame]	261	// If we run multiple batches we need 1xW transpose, too.
Ioan-Cristian Szabo	b4e3e1c	2017-11-30 17:17:17 +0000	[diff] [blame]	262	if(is_batched_fc_layer)
				263	{
				264	output_shape = compute_transposed_shape(input->clone()->set_tensor_shape(output_shape));
				265	output_shape = compute_interleave_custom_shape(output_shape, interleave, interleave);
				266	}
				267
				268	return output_shape;
				269	}
Gian Marco Iodice	7e4b239	2018-02-22 16:17:20 +0000	[diff] [blame]	270
Gian Marco Iodice	247f52c	2018-03-22 11:24:56 +0000	[diff] [blame]	271	inline TensorShape compute_winograd_filter_transform_shape(const ITensorInfo &input, const WinogradInfo &winograd_info)
Gian Marco Iodice	7e4b239	2018-02-22 16:17:20 +0000	[diff] [blame]	272	{
Gian Marco Iodice	7e4b239	2018-02-22 16:17:20 +0000	[diff] [blame]	273	TensorShape tensor_shape{ input.tensor_shape() };
				274
Gian Marco Iodice	247f52c	2018-03-22 11:24:56 +0000	[diff] [blame]	275	const Size2D kernel_size = winograd_info.kernel_size;
				276	const Size2D output_tile_size = winograd_info.output_tile_size;
				277	const Size2D input_tile_size = Size2D(output_tile_size.width + kernel_size.width - 1, output_tile_size.height + kernel_size.height - 1);
Giorgio Arena	2d9de0a	2018-03-15 17:58:20 +0000	[diff] [blame]	278
Gian Marco Iodice	247f52c	2018-03-22 11:24:56 +0000	[diff] [blame]	279	tensor_shape.remove_dimension(get_data_layout_dimension_index(input.data_layout(), DataLayoutDimension::WIDTH));
				280	tensor_shape.set(Window::DimX, input.dimension(3));
				281	tensor_shape.set(Window::DimY, input.dimension(get_data_layout_dimension_index(input.data_layout(), DataLayoutDimension::CHANNEL)));
				282	tensor_shape.set(Window::DimZ, input_tile_size.area());
Gian Marco Iodice	7e4b239	2018-02-22 16:17:20 +0000	[diff] [blame]	283
				284	return tensor_shape;
				285	}
Gian Marco Iodice	247f52c	2018-03-22 11:24:56 +0000	[diff] [blame]	286	inline TensorShape compute_winograd_input_transform_shape(const ITensorInfo &input, const WinogradInfo &winograd_info)
Giorgio Arena	1f9ca1d	2018-03-01 11:13:45 +0000	[diff] [blame]	287	{
Gian Marco Iodice	247f52c	2018-03-22 11:24:56 +0000	[diff] [blame]	288	const PadStrideInfo conv_info = winograd_info.convolution_info;
				289	const Size2D kernel_size = winograd_info.kernel_size;
				290	const Size2D output_tile_size = winograd_info.output_tile_size;
				291	const Size2D input_tile_size = Size2D(output_tile_size.width + kernel_size.width - 1, output_tile_size.height + kernel_size.height - 1);
				292
Giorgio Arena	c42f28d	2018-04-26 11:33:05 +0100	[diff] [blame]	293	const size_t idx_w = get_data_layout_dimension_index(input.data_layout(), DataLayoutDimension::WIDTH);
				294	const size_t idx_h = get_data_layout_dimension_index(input.data_layout(), DataLayoutDimension::HEIGHT);
				295	const size_t idx_c = get_data_layout_dimension_index(input.data_layout(), DataLayoutDimension::CHANNEL);
Giorgio Arena	1f9ca1d	2018-03-01 11:13:45 +0000	[diff] [blame]	296
Gian Marco Iodice	f1c2bf0	2018-06-13 14:05:54 +0100	[diff] [blame]	297	// Compute the number of output tiles along the x and y direction of size "output_tile_size"
				298	const Size2D num_tiles = compute_winograd_convolution_tiles(Size2D(input.tensor_shape()[idx_w], input.tensor_shape()[idx_h]),
				299	kernel_size,
				300	output_tile_size,
				301	conv_info);
Giorgio Arena	c42f28d	2018-04-26 11:33:05 +0100	[diff] [blame]	302
				303	const unsigned int width = input.tensor_shape()[idx_c];
Gian Marco Iodice	f1c2bf0	2018-06-13 14:05:54 +0100	[diff] [blame]	304	const unsigned int height = num_tiles.area();
Gian Marco Iodice	247f52c	2018-03-22 11:24:56 +0000	[diff] [blame]	305	const unsigned int depth = input_tile_size.area();
Giorgio Arena	1f9ca1d	2018-03-01 11:13:45 +0000	[diff] [blame]	306
				307	TensorShape output_shape{ input.tensor_shape() };
				308	output_shape.set(0, width);
				309	output_shape.set(1, height);
				310	output_shape.set(2, depth);
				311
				312	return output_shape;
				313	}
Gian Marco Iodice	247f52c	2018-03-22 11:24:56 +0000	[diff] [blame]	314	inline TensorShape compute_winograd_output_transform_shape(const ITensorInfo &input, const WinogradInfo &winograd_info)
Gian Marco Iodice	d2fab73	2018-03-02 11:18:12 +0000	[diff] [blame]	315	{
Gian Marco Iodice	247f52c	2018-03-22 11:24:56 +0000	[diff] [blame]	316	const PadStrideInfo conv_info = winograd_info.convolution_info;
				317	const Size2D kernel_size = winograd_info.kernel_size;
				318	const Size2D input_dimensions = winograd_info.input_dimensions;
				319	const DataLayout data_layout = winograd_info.output_data_layout;
				320
				321	// Compute output shape
				322	unsigned int output_width = 0;
				323	unsigned int output_height = 0;
				324	std::tie(output_width, output_height) = scaled_dimensions(input_dimensions.width, input_dimensions.height,
				325	kernel_size.width, kernel_size.height, conv_info);
				326
Gian Marco Iodice	d2fab73	2018-03-02 11:18:12 +0000	[diff] [blame]	327	TensorShape tensor_shape{ input.tensor_shape() };
				328
				329	// Output dimension
Gian Marco Iodice	247f52c	2018-03-22 11:24:56 +0000	[diff] [blame]	330	const unsigned int out_w = output_width;
				331	const unsigned int out_h = output_height;
Gian Marco Iodice	d2fab73	2018-03-02 11:18:12 +0000	[diff] [blame]	332	const unsigned int out_c = input.dimension(0);
				333
				334	tensor_shape.set(get_data_layout_dimension_index(data_layout, DataLayoutDimension::WIDTH), out_w);
				335	tensor_shape.set(get_data_layout_dimension_index(data_layout, DataLayoutDimension::HEIGHT), out_h);
				336	tensor_shape.set(get_data_layout_dimension_index(data_layout, DataLayoutDimension::CHANNEL), out_c);
				337
				338	return tensor_shape;
				339	}
Georgios Pinitas	d8734b5	2017-12-22 15:27:52 +0000	[diff] [blame]	340	inline TensorShape compute_deep_convolution_shape(const ITensorInfo &input, const ITensorInfo &weights, PadStrideInfo conv_info)
				341	{
				342	const TensorShape input_shape{ input.tensor_shape() };
				343	const TensorShape weights_shape{ weights.tensor_shape() };
				344
Gian Marco Iodice	d2fab73	2018-03-02 11:18:12 +0000	[diff] [blame]	345	const size_t idx_width = get_data_layout_dimension_index(input.data_layout(), DataLayoutDimension::WIDTH);
				346	const size_t idx_height = get_data_layout_dimension_index(input.data_layout(), DataLayoutDimension::HEIGHT);
				347	const size_t idx_channel = get_data_layout_dimension_index(input.data_layout(), DataLayoutDimension::CHANNEL);
				348
Giorgio Arena	c0f5443	2018-03-16 14:02:34 +0000	[diff] [blame]	349	const unsigned int input_width = input_shape[idx_width];
				350	const unsigned int input_height = input_shape[idx_height];
				351	const unsigned int weights_width = weights_shape[idx_width];
				352	const unsigned int weights_height = weights_shape[idx_height];
				353	const unsigned int weights_out_channel = weights_shape[3];
				354	unsigned int output_width = 0;
				355	unsigned int output_height = 0;
Gian Marco Iodice	d2fab73	2018-03-02 11:18:12 +0000	[diff] [blame]	356	std::tie(output_width, output_height) = scaled_dimensions(input_width, input_height, weights_width, weights_height, conv_info);
Georgios Pinitas	d8734b5	2017-12-22 15:27:52 +0000	[diff] [blame]	357
				358	TensorShape output_shape{ input_shape };
Gian Marco Iodice	d2fab73	2018-03-02 11:18:12 +0000	[diff] [blame]	359	output_shape.set(idx_width, output_width);
				360	output_shape.set(idx_height, output_height);
Giorgio Arena	c0f5443	2018-03-16 14:02:34 +0000	[diff] [blame]	361	output_shape.set(idx_channel, weights_out_channel);
Georgios Pinitas	d8734b5	2017-12-22 15:27:52 +0000	[diff] [blame]	362
				363	return output_shape;
				364	}
Alex Gilday	60954c6	2018-03-05 16:22:48 +0000	[diff] [blame]	365	inline TensorShape compute_min_max_shape(const ITensorInfo *input)
				366	{
				367	TensorShape output_shape{ input->tensor_shape() };
				368	output_shape.set(Window::DimX, 2);
				369	output_shape.remove_dimension(1);
				370	output_shape.remove_dimension(1);
				371
				372	return output_shape;
				373	}
				374
Michalis Spyrou	e74b201	2018-04-18 09:49:16 +0100	[diff] [blame]	375	inline TensorShape compute_pool_shape(const ITensorInfo &input, PoolingLayerInfo pool_info)
				376	{
				377	unsigned int pooled_w = 0;
				378	unsigned int pooled_h = 0;
				379
Giorgio Arena	3c520c5	2018-05-01 11:47:24 +0100	[diff] [blame]	380	TensorShape output_shape{ input.tensor_shape() };
Michalis Spyrou	e74b201	2018-04-18 09:49:16 +0100	[diff] [blame]	381
Giorgio Arena	3c520c5	2018-05-01 11:47:24 +0100	[diff] [blame]	382	const bool is_global_pooling = pool_info.is_global_pooling();
				383	const unsigned int idx_width = get_data_layout_dimension_index(input.data_layout(), DataLayoutDimension::WIDTH);
				384	const unsigned int idx_height = get_data_layout_dimension_index(input.data_layout(), DataLayoutDimension::HEIGHT);
				385	const unsigned int pool_size_x = is_global_pooling ? output_shape[idx_width] : pool_info.pool_size().width;
				386	const unsigned int pool_size_y = is_global_pooling ? output_shape[idx_height] : pool_info.pool_size().height;
				387
				388	std::tie(pooled_w, pooled_h) = scaled_dimensions(output_shape[idx_width],
				389	output_shape[idx_height],
Michalis Spyrou	e74b201	2018-04-18 09:49:16 +0100	[diff] [blame]	390	pool_size_x,
				391	pool_size_y,
				392	pool_info.pad_stride_info());
				393
Giorgio Arena	3c520c5	2018-05-01 11:47:24 +0100	[diff] [blame]	394	output_shape.set(idx_width, pooled_w);
				395	output_shape.set(idx_height, pooled_h);
Michalis Spyrou	e74b201	2018-04-18 09:49:16 +0100	[diff] [blame]	396
				397	return output_shape;
				398	}
				399
Michalis Spyrou	36a559e	2018-03-20 10:30:58 +0000	[diff] [blame]	400	inline TensorShape compute_rnn_shape(const ITensorInfo *input, const unsigned int batch_size)
				401	{
				402	TensorShape output_shape{ input->tensor_shape() };
				403	output_shape.set(1, batch_size);
				404
				405	return output_shape;
				406	}
Gian Marco Iodice	750641d	2018-05-08 12:01:57 +0100	[diff] [blame]	407	inline TensorShape compute_mm_shape(const ITensorInfo &input0, const ITensorInfo &input1, bool is_interleaved_transposed, const GEMMReshapeInfo &reshape_info)
				408	{
Isabella Gottardi	8e74f44	2018-03-01 16:42:00 +0000	[diff] [blame]	409	ARM_COMPUTE_ERROR_ON_MSG(input0.num_dimensions() > 4, "The number of dimensions for the matrix A must be <= 4");
Gian Marco Iodice	68a3f56	2018-07-26 11:44:03 +0100	[diff] [blame]	410	ARM_COMPUTE_ERROR_ON_MSG(is_interleaved_transposed && reshape_info.reinterpret_input_as_3d(), "The first input tensor cannot be reinterpreted as 3D if is_interleaved_transposed is true");
Gian Marco Iodice	750641d	2018-05-08 12:01:57 +0100	[diff] [blame]	411
Gian Marco Iodice	68a3f56	2018-07-26 11:44:03 +0100	[diff] [blame]	412	const bool reinterpret_input_as_3d = reshape_info.reinterpret_input_as_3d();
				413	const bool reinterpret_output_as_3d = reshape_info.depth_output_gemm3d() != 1;
				414	const int m = reshape_info.reinterpret_input_as_3d() ? input0.dimension(1) * input0.dimension(2) : input0.dimension(1);
Isabella Gottardi	8e74f44	2018-03-01 16:42:00 +0000	[diff] [blame]	415
				416	// If the output of GEMM has to be reinterpreted as 3D, the number of input0 rows (M) is obtained collapsing the second and third
				417	// dimension of the output tensor
				418	const int dim0 = is_interleaved_transposed ? reshape_info.n() : input1.dimension(0);
Gian Marco Iodice	68a3f56	2018-07-26 11:44:03 +0100	[diff] [blame]	419	const int dim1 = is_interleaved_transposed ? reshape_info.m() / reshape_info.depth_output_gemm3d() : m / reshape_info.depth_output_gemm3d();
				420	const int dim2 = reinterpret_input_as_3d ? input0.tensor_shape()[3] : input0.tensor_shape()[2];
				421	const int dim3 = reinterpret_input_as_3d ? 1 : input0.tensor_shape()[3];
Isabella Gottardi	8e74f44	2018-03-01 16:42:00 +0000	[diff] [blame]	422
				423	TensorShape output_shape{ input0.tensor_shape() };
				424
				425	output_shape.set(0, dim0);
				426	output_shape.set(1, dim1);
Gian Marco Iodice	68a3f56	2018-07-26 11:44:03 +0100	[diff] [blame]	427	output_shape.set(2, reinterpret_output_as_3d ? reshape_info.depth_output_gemm3d() : dim2);
				428	output_shape.set(3, reinterpret_output_as_3d ? dim2 : dim3);
				429	output_shape.set(4, reinterpret_output_as_3d ? dim3 : 1);
Isabella Gottardi	8e74f44	2018-03-01 16:42:00 +0000	[diff] [blame]	430
				431	return output_shape;
Gian Marco Iodice	750641d	2018-05-08 12:01:57 +0100	[diff] [blame]	432	}
Michalis Spyrou	55b3d12	2018-05-09 09:59:23 +0100	[diff] [blame]	433
				434	template <typename T>
Georgios Pinitas	e222055	2018-07-20 13:23:44 +0100	[diff] [blame]	435	inline TensorShape extract_shape(T *data)
Michalis Spyrou	55b3d12	2018-05-09 09:59:23 +0100	[diff] [blame]	436	{
Georgios Pinitas	e222055	2018-07-20 13:23:44 +0100	[diff] [blame]	437	return data->info()->tensor_shape();
Michalis Spyrou	55b3d12	2018-05-09 09:59:23 +0100	[diff] [blame]	438	}
				439
Georgios Pinitas	e222055	2018-07-20 13:23:44 +0100	[diff] [blame]	440	inline TensorShape extract_shape(ITensorInfo *data)
Michalis Spyrou	55b3d12	2018-05-09 09:59:23 +0100	[diff] [blame]	441	{
Georgios Pinitas	e222055	2018-07-20 13:23:44 +0100	[diff] [blame]	442	return data->tensor_shape();
				443	}
				444
				445	inline TensorShape extract_shape(const TensorShape *data)
				446	{
				447	return *data;
Michalis Spyrou	55b3d12	2018-05-09 09:59:23 +0100	[diff] [blame]	448	}
				449
				450	template <typename T>
Georgios Pinitas	e29acf1	2018-07-16 14:40:09 +0100	[diff] [blame]	451	inline TensorShape calculate_depth_concatenate_shape(const std::vector<T *> &inputs_vector)
				452	{
Georgios Pinitas	e222055	2018-07-20 13:23:44 +0100	[diff] [blame]	453	TensorShape out_shape = extract_shape(inputs_vector[0]);
Georgios Pinitas	e29acf1	2018-07-16 14:40:09 +0100	[diff] [blame]	454
				455	size_t max_x = 0;
				456	size_t max_y = 0;
				457	size_t depth = 0;
				458
				459	for(const auto &tensor : inputs_vector)
				460	{
				461	ARM_COMPUTE_ERROR_ON(tensor == nullptr);
Georgios Pinitas	e222055	2018-07-20 13:23:44 +0100	[diff] [blame]	462	const TensorShape shape = extract_shape(tensor);
Georgios Pinitas	e29acf1	2018-07-16 14:40:09 +0100	[diff] [blame]	463	max_x = std::max(shape.x(), max_x);
				464	max_y = std::max(shape.y(), max_y);
				465	depth += shape.z();
				466	}
				467
				468	out_shape.set(0, max_x);
				469	out_shape.set(1, max_y);
				470	out_shape.set(2, depth);
				471
				472	return out_shape;
				473	}
				474
				475	template <typename T>
Michalis Spyrou	55b3d12	2018-05-09 09:59:23 +0100	[diff] [blame]	476	inline TensorShape calculate_width_concatenate_shape(const std::vector<T *> &inputs_vector)
				477	{
Georgios Pinitas	e222055	2018-07-20 13:23:44 +0100	[diff] [blame]	478	TensorShape out_shape = extract_shape(inputs_vector[0]);
Michalis Spyrou	55b3d12	2018-05-09 09:59:23 +0100	[diff] [blame]	479
				480	size_t width = 0;
				481	for(const auto &tensor : inputs_vector)
				482	{
				483	ARM_COMPUTE_ERROR_ON(tensor == nullptr);
Georgios Pinitas	e222055	2018-07-20 13:23:44 +0100	[diff] [blame]	484	const TensorShape shape = extract_shape(tensor);
Michalis Spyrou	55b3d12	2018-05-09 09:59:23 +0100	[diff] [blame]	485	width += shape.x();
				486	}
				487
				488	out_shape.set(0, width);
				489
				490	return out_shape;
				491	}
Georgios Pinitas	358ca20	2017-12-07 16:47:52 +0000	[diff] [blame]	492	} // namespace shape_calculator
				493	} // namespace misc
				494	} // namespace arm_compute
				495	#endif /* __ARM_COMPUTE_MISC_SHAPE_CALCULATOR_H__ */