blob: 588c45294a4f2e6408633adde38db6dffa2b7833 [file] [log] [blame]
Anthony Barbier71d9b572018-07-06 17:05:59 +01001/*
Mohammed Suhail Munshia1b1e412023-03-23 22:21:31 +00002 * Copyright (c) 2018-2023 Arm Limited.
Anthony Barbier71d9b572018-07-06 17:05:59 +01003 *
4 * SPDX-License-Identifier: MIT
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a copy
7 * of this software and associated documentation files (the "Software"), to
8 * deal in the Software without restriction, including without limitation the
9 * rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
10 * sell copies of the Software, and to permit persons to whom the Software is
11 * furnished to do so, subject to the following conditions:
12 *
13 * The above copyright notice and this permission notice shall be included in all
14 * copies or substantial portions of the Software.
15 *
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
19 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
21 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
22 * SOFTWARE.
23 */
Sang-Hoon Parkd89e2fa2021-05-17 17:04:50 +010024#ifndef ARM_COMPUTE_CPU_INTERNAL_CPU_GEMM_ASSEMBLY_DISPATCH_H
25#define ARM_COMPUTE_CPU_INTERNAL_CPU_GEMM_ASSEMBLY_DISPATCH_H
Anthony Barbier71d9b572018-07-06 17:05:59 +010026
Sang-Hoon Parkd89e2fa2021-05-17 17:04:50 +010027#include "src/core/common/Macros.h"
Georgios Pinitas7891a732021-08-20 21:39:25 +010028#include "src/cpu/ICpuOperator.h"
Anthony Barbier71d9b572018-07-06 17:05:59 +010029
Anthony Barbier71d9b572018-07-06 17:05:59 +010030namespace arm_compute
31{
Sang-Hoon Park4f7693d2021-05-12 13:59:10 +010032namespace cpu
33{
Georgios Pinitasc0b6f762020-11-02 01:37:17 +000034/* Convolution method supported by the assembly gemm interface */
35enum class AsmConvMethod
36{
37 Im2Col,
38 Indirect,
39 Conv
40};
41
/** Meta-data describing how the assembly GEMM should be configured.
 *
 * Aggregates both pure-GEMM options (output stage, 3d reinterpretation, ...)
 * and convolution-lowering options (method, padding) consumed by
 * CpuGemmAssemblyDispatch::configure()/validate().
 */
struct AsmGemmInfo
{
    AsmConvMethod             method{ AsmConvMethod::Im2Col };       /**< How a convolution is lowered onto the GEMM (ignored for plain GEMM) */
    PadStrideInfo             ps_info{};                             /**< Padding/stride information of the originating convolution */
    ActivationLayerInfo       activation_info{};                     /**< Activation to fuse into the kernel, if supported (see is_activation_supported()) */
    GEMMLowpOutputStageInfo   output_stage{};                        /**< Quantized (GEMMLowp) output stage parameters */
    bool                      negated_offsets{ true };               /**< Whether quantization offsets are passed already negated to the kernel */
    bool                      reinterpret_input_as_3d{ false };      /**< Reinterpret the 2D input as 3D (e.g. when fed from an im2col-free conv) */
    bool                      depth_output_gemm3d{ false };          /**< Produce a 3D output where depth comes from the GEMM's M dimension */
    int64_t                   padding_top{ 0 };                      /**< Top padding, used by the indirect/conv methods */
    int64_t                   padding_left{ 0 };                     /**< Left padding, used by the indirect/conv methods */
    float                     padding_value{ 0.f };                  /**< Value used to fill padded input elements */
    bool                      fast_mode{ false };                    /**< Allow faster, possibly lower-precision kernels (e.g. bf16 accumulation) — TODO confirm exact guarantee */
    bool                      fixed_format{ false };                 /**< Weights are provided in a kernel-specific fixed format */
    arm_compute::WeightFormat weight_format{ arm_compute::WeightFormat::UNSPECIFIED }; /**< Requested/queried weight format for fixed-format kernels */
    bool                      reshape_b_only_on_first_run{ true };   /**< Reshape/pretranspose B once at first run instead of on every run */
};
59
Anthony Barbier71d9b572018-07-06 17:05:59 +010060/** Assembly kernel glue */
Sang-Hoon Parkd89e2fa2021-05-17 17:04:50 +010061class CpuGemmAssemblyDispatch : public ICpuOperator
Anthony Barbier71d9b572018-07-06 17:05:59 +010062{
63public:
Michalis Spyrou1a569a32019-09-10 17:20:34 +010064 /** Constructor */
Michele Di Giorgiod7316eb2021-06-16 11:14:41 +010065 CpuGemmAssemblyDispatch();
Sang-Hoon Park4f7693d2021-05-12 13:59:10 +010066 /** Defautl destructor */
67 ~CpuGemmAssemblyDispatch() = default;
Anthony Barbiereaefd002018-07-20 17:49:35 +010068
Sang-Hoon Parkd89e2fa2021-05-17 17:04:50 +010069 ARM_COMPUTE_DISALLOW_COPY_ALLOW_MOVE(CpuGemmAssemblyDispatch);
70
Anthony Barbiereaefd002018-07-20 17:49:35 +010071 class IFallback
72 {
73 public:
Ramy Elgammal91780022022-07-20 14:57:37 +010074 virtual void run(ITensorPack &tensors) = 0;
75 virtual void prepare(ITensorPack &tensors) = 0;
76 virtual experimental::MemoryRequirements workspace() const = 0;
77 virtual bool is_configured() const = 0;
78 virtual bool isVarWeightsKernel() const = 0;
79 virtual ~IFallback() = default;
Anthony Barbiereaefd002018-07-20 17:49:35 +010080 };
Anthony Barbier71d9b572018-07-06 17:05:59 +010081
Anthony Barbier71d9b572018-07-06 17:05:59 +010082public:
Michele Di Giorgio57f30a92020-09-08 14:03:51 +010083 /** If supported create a Compute Library function else fallback to the arm_gemm function.
Anthony Barbierc8e84b52018-07-17 16:48:42 +010084 *
Mohammed Suhail Munshia1b1e412023-03-23 22:21:31 +000085 * @note Configuring "batches"
86 * The shapes of @p a @p b and @p d are arranged as follows:
87 * Lowest dimension <-> Highest dimension
88 * a: [K, M, Batch, Multi]
89 * b: [N, K, Multi]
90 * d: [N, M, Batch, Multi]
91 *
92 * The "Batch" refers to where "Batch" number of MxK slices of tensor a multiplies with a single KxN slice of b
93 * The "Multi" refers to where "Multi" number of individual multiplication of a with b
94 *
95 * E.g. the following are some example input shape configurations
96 *
97 * (1) Normal 2D gemm
98 * a: [K=3, M=4]
99 * b: [N=5, K=3]
100 * d: [N=5, M=4]
101 *
102 * (2) Batches of a sharing b (e.g. gemm-based batched convolution where b is the shared )
103 * a: [K=3, M=4, Batch=9]
104 * b: [N=5, K=3]
105 * d: [N=5, M=4, Batch=9]
106 *
107 * (3) "Batches" of independent gemm (e.g. batched matmul)
108 * a: [K=3, M=4, Batch=1, Multi=7]
109 * b: [N=5, K=3, Multi=7]
110 * d: [N=5, M=4, Batch=1, Multi=7]
111 *
112 * (4) "Batches" of independent gemm where b is also shared
113 * a: [K=3, M=4, Batch=4, Multi=7]
114 * b: [N=5, K=3, Multi=7]
115 * d: [N=5, M=4, Batch=4, Multi=7]
116 *
Georgios Pinitasc0b6f762020-11-02 01:37:17 +0000117 * @param[in] a Input tensor (Matrix A)
118 * @param[in] b Input tensor (Matrix B)
119 * @param[in] c Input tensor (Matrix C) used to pass the bias for quantized calculations
120 * @param[out] d Output tensor to store the result of matrix multiplication. Data type supported: same as @p input0.
121 * @param[in] info GEMM meta-data
Anthony Barbierc8e84b52018-07-17 16:48:42 +0100122 */
Sang-Hoon Parkd89e2fa2021-05-17 17:04:50 +0100123 void configure(const ITensorInfo *a, const ITensorInfo *b, const ITensorInfo *c, ITensorInfo *d, const AsmGemmInfo &info);
Anthony Barbiereaefd002018-07-20 17:49:35 +0100124
125 /** Indicates whether or not this function can be used to process the given parameters.
126 *
Georgios Pinitasc0b6f762020-11-02 01:37:17 +0000127 * @param[in] a Input tensor info (Matrix A)
128 * @param[in] b Input tensor info (Matrix B)
129 * @param[in] c Input tensor info (Matrix C) used to pass the bias for quantized calculations
130 * @param[in] d Output tensor to store the result of matrix multiplication. Data type supported: same as @p input0.
131 * @param[in] info GEMM meta-data
Anthony Barbiereaefd002018-07-20 17:49:35 +0100132 *
133 * @return a status.
134 */
Georgios Pinitasc0b6f762020-11-02 01:37:17 +0000135 static Status validate(const ITensorInfo *a, const ITensorInfo *b, const ITensorInfo *c, const ITensorInfo *d, const AsmGemmInfo &info);
Francesco.Petrogalli@arm.come33c5562022-03-31 17:55:35 +0000136
137 /** Indicates whether or not there is an optimal assembly implementation that can be used to process the given parameters.
138 *
Francesco Petrogalli553f6952022-06-30 10:22:01 +0000139 * This method has the same use of @ref
140 * NEGEMMConvolutionLayer::has_opt_impl, with the only caveat that
Ramy Elgammal91780022022-07-20 14:57:37 +0100141 * the value of arm_compute::WeightFormat need to be passed via the
Francesco Petrogalli553f6952022-06-30 10:22:01 +0000142 * parameter info.
Francesco.Petrogalli@arm.come33c5562022-03-31 17:55:35 +0000143 *
144 * @return a status.
145 */
Ramy Elgammal91780022022-07-20 14:57:37 +0100146 static Status has_opt_impl(arm_compute::WeightFormat &weight_format, const ITensorInfo *a, const ITensorInfo *b, const ITensorInfo *c, const ITensorInfo *d, const AsmGemmInfo &info);
Georgios Pinitas48b3ef82019-10-14 19:03:09 +0100147 /** Checks if activation is supported by the gemm assembly dispatcher
148 *
149 * @param[in] activation Activation to check
150 *
151 * @return True if activation is supported else false
152 */
153 static bool is_activation_supported(const ActivationLayerInfo &activation);
Anthony Barbierc8e84b52018-07-17 16:48:42 +0100154 /** Was the function successfully configured ?
155 *
156 * @return True if the function is configured and ready to run
157 */
Anthony Barbier71d9b572018-07-06 17:05:59 +0100158 bool is_configured() const;
Francesco Petrogalli553f6952022-06-30 10:22:01 +0000159 /** Indicates if the convolution executes in variable weights mode.
160 *
161 * Similar to @ref CpuGemm::isVarWeightsKernel
162 */
163 bool isVarWeightsKernel() const
164 {
165 return _arm_gemm && _arm_gemm->isVarWeightsKernel();
166 }
Georgios Pinitasc0b6f762020-11-02 01:37:17 +0000167
Anthony Barbier71d9b572018-07-06 17:05:59 +0100168 // Inherited methods overridden:
Ramy Elgammal91780022022-07-20 14:57:37 +0100169 void prepare(ITensorPack &tensors) override;
170 void run(ITensorPack &tensors) override;
Michele Di Giorgiod7316eb2021-06-16 11:14:41 +0100171 experimental::MemoryRequirements workspace() const override;
Georgios Pinitasc0b6f762020-11-02 01:37:17 +0000172
173private:
Michele Di Giorgiod7316eb2021-06-16 11:14:41 +0100174 std::unique_ptr<IFallback> _arm_gemm; /**< Interface for the arm_gemm fallback */
Anthony Barbier71d9b572018-07-06 17:05:59 +0100175};
Sang-Hoon Park4f7693d2021-05-12 13:59:10 +0100176} // namespace cpu
Anthony Barbierc8e84b52018-07-17 16:48:42 +0100177} // namespace arm_compute
Sang-Hoon Parkd89e2fa2021-05-17 17:04:50 +0100178#endif /* ARM_COMPUTE_CPU_INTERNAL_CPU_GEMM_ASSEMBLY_DISPATCH_H */