Blame - arm_compute/core/KernelDescriptors.h - ml/ComputeLibrary

blob: 4b04bebdeffe66258743a9c38d62fb7ec144c74c [file] [log] [blame]

Georgios Pinitas	0bc7849	2019-03-18 20:07:37 +0000	[diff] [blame]	1	/*
Michele Di Giorgio	4536193	2019-12-19 13:53:44 +0000	[diff] [blame]	2	* Copyright (c) 2019-2020 ARM Limited.
Georgios Pinitas	0bc7849	2019-03-18 20:07:37 +0000	[diff] [blame]	3	*
				4	* SPDX-License-Identifier: MIT
				5	*
				6	* Permission is hereby granted, free of charge, to any person obtaining a copy
				7	* of this software and associated documentation files (the "Software"), to
				8	* deal in the Software without restriction, including without limitation the
				9	* rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
				10	* sell copies of the Software, and to permit persons to whom the Software is
				11	* furnished to do so, subject to the following conditions:
				12	*
				13	* The above copyright notice and this permission notice shall be included in all
				14	* copies or substantial portions of the Software.
				15	*
				16	* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
				17	* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
				18	* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
				19	* AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
				20	* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
				21	* OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
				22	* SOFTWARE.
				23	*/
Michalis Spyrou	f464337	2019-11-29 16:17:13 +0000	[diff] [blame]	24	#ifndef ARM_COMPUTE_CORE_KERNEL_DESCRIPTORS_H
				25	#define ARM_COMPUTE_CORE_KERNEL_DESCRIPTORS_H
Georgios Pinitas	0bc7849	2019-03-18 20:07:37 +0000	[diff] [blame]	26
Gian Marco Iodice	ca1f460	2019-07-16 15:46:48 +0100	[diff] [blame]	27	#include "arm_compute/core/Types.h"
				28
Georgios Pinitas	0bc7849	2019-03-18 20:07:37 +0000	[diff] [blame]	29	namespace arm_compute
				30	{
/** Descriptor for FFT scale kernels */
struct FFTScaleKernelInfo
{
    /** Scale value. Defaults to 0.
     *
     * NOTE(review): the previous comment described this member as an axis, which
     * matches neither its name nor its type; confirm the exact semantics against
     * the kernel that consumes it.
     */
    float scale{ 0.f };
    bool  conjugate{ true }; /**< Flag to conjugate the output. Defaults to true. */
};
				37
				38	/** Descriptor for FFT digit reverse kernels */
				39	struct FFTDigitReverseKernelInfo
				40	{
				41	unsigned int axis{ 0 }; /*< Axis to perform the kernel on. /
				42	bool conjugate{ false }; /*< Flag to conjugate the output/ /
				43	};
				44
				45	/** Descriptor used by the FFT core kernels */
				46	struct FFTRadixStageKernelInfo
				47	{
				48	unsigned int axis{ 0 }; /*< Axis to run the kernel on. /
Georgios Pinitas	0bc7849	2019-03-18 20:07:37 +0000	[diff] [blame]	49	unsigned int radix{ 0 }; /*< Radix to use. /
				50	unsigned int Nx{ 0 }; /*< Nx coefficient. /
				51	bool is_first_stage{ false }; /*< Flags if the FFT kernels is the first stage of a decomposed FFT. /
				52	};
Gian Marco Iodice	7026b30	2019-06-26 17:18:11 +0100	[diff] [blame]	53
				54	/** Descriptor used by the GEMM kernels */
				55	struct GEMMKernelInfo
				56	{
Gian Marco Iodice	ca1f460	2019-07-16 15:46:48 +0100	[diff] [blame]	57	unsigned int m{ 0 }; /*< Number of LHS rows/
				58	unsigned int n{ 0 }; /*< Number of RHS columns/
				59	unsigned int k{ 0 }; /*< Number of LHS columns or RHS rows /
				60	unsigned int depth_output_gemm3d{ 0 }; /*< Depth of the output tensor in case is reinterpreted as 3D /
				61	bool reinterpret_input_as_3d{ false }; /*< Flag used to reinterpret the input as 3D /
				62	bool broadcast_bias{ false }; /*< Flag used to broadcase the bias addition /
Georgios Pinitas	c370c75	2019-09-12 12:26:11 +0100	[diff] [blame]	63	bool fp_mixed_precision{ false }; /*< Flag used to indicate wider accumulators (32 bit instead of 16 for FP16). /
Gian Marco Iodice	ca1f460	2019-07-16 15:46:48 +0100	[diff] [blame]	64	ActivationLayerInfo activation_info{}; /*< Activation function to perform after the matrix multiplication /
Gian Marco Iodice	7026b30	2019-06-26 17:18:11 +0100	[diff] [blame]	65	};
Gian Marco Iodice	9285adb	2019-09-05 16:10:27 +0100	[diff] [blame]	66
				67	/** Descriptor used by the depthwise convolution kernels */
				68	struct DWCKernelInfo
				69	{
				70	ActivationLayerInfo activation_info{}; /*< Activation function to perform after the depthwise convolution /
				71	};
				72
				73	/** Descriptor used by the depthwise convolution kernels to retrieve the number of output elements processed by each thread */
				74	struct DWCWeightsKernelInfo
				75	{
				76	unsigned int n0{ 0 }; /*< Number of columns processed by each thread /
				77	};
Sang-Hoon Park	62eeb53	2019-10-29 13:13:19 +0000	[diff] [blame]	78
				79	/** Descriptor used by the softmax kernels */
				80	struct SoftmaxKernelInfo
				81	{
Sang-Hoon Park	0779fec	2019-11-13 17:08:12 +0000	[diff] [blame]	82	float beta{ 1.f }; /*< A scaling factor for the exponent with default value 1.0 /
				83	bool is_log{ false }; /*< Flag used to perform Log Softmax operation /
				84	DataType input_data_type{ DataType::UNKNOWN }; /*< Input tensor data type /
Sang-Hoon Park	62eeb53	2019-10-29 13:13:19 +0000	[diff] [blame]	85	};
Michele Di Giorgio	4536193	2019-12-19 13:53:44 +0000	[diff] [blame]	86
				87	/** Descriptor used by the direct convolution layer output stage kernels */
				88	struct DirectConvolutionLayerOutputStageKernelInfo
				89	{
				90	int32_t result_fixedpoint_multiplier{ 0 }; /*< Result output stage multiplier used for quantizing /
				91	int32_t result_shift{ 0 }; /*< Result output stage shift used for quantizing /
				92	int32_t result_offset_after_shift{ 0 }; /*< Result offset used for quantizing /
				93	DataType output_data_type{ DataType::UNKNOWN }; /*< Output tensor data type to use if the output is not initialized /
				94	};
Georgios Pinitas	55a687d	2020-01-30 12:00:23 +0000	[diff] [blame^]	95
				96	struct InstanceNormalizationLayerKernelInfo
				97	{
				98	/** Default constructor */
				99	InstanceNormalizationLayerKernelInfo()
				100	: InstanceNormalizationLayerKernelInfo(1.f, 0.f, 1e-12, true)
				101	{
				102	}
				103	/** Constructor
				104	*
				105	* @param[in] gamma The scale scalar value applied to the normalized tensor.
				106	* @param[in] beta The offset scalar value applied to the normalized tensor
				107	* @param[in] epsilon Lower bound value for the normalization.
				108	* @param[in] use_mixed_precision Use mixed precision in case of FP16 execution.
				109	*/
				110	InstanceNormalizationLayerKernelInfo(float gamma, float beta, float epsilon, bool use_mixed_precision)
				111	: gamma(gamma), beta(beta), epsilon(epsilon), use_mixed_precision(use_mixed_precision)
				112	{
				113	}
				114
				115	float gamma; /*< The scale scalar value applied to the normalized tensor. Defaults to 1.0 /
				116	float beta; /*< The offset scalar value applied to the normalized tensor. Defaults to 0.0 /
				117	float epsilon; /*< Lower bound value for the normalization. Defaults to 1e-12 /
				118	bool use_mixed_precision; /*< Use mixed precision in case of FP16 execution. Defaults to true /
				119	};
Georgios Pinitas	0bc7849	2019-03-18 20:07:37 +0000	[diff] [blame]	120	} // namespace arm_compute
Michalis Spyrou	f464337	2019-11-29 16:17:13 +0000	[diff] [blame]	121	#endif /* ARM_COMPUTE_CORE_KERNEL_DESCRIPTORS_H */