// blob: 6ba5b1db93c875f5e61406278ba1219c9956758b [file] [log] [blame]
/*
* Copyright (c) 2023 Arm Limited.
*
* SPDX-License-Identifier: MIT
*
* Permission is hereby granted, free of charge, to any person obtaining a copy
* of this software and associated documentation files (the "Software"), to
* deal in the Software without restriction, including without limitation the
* rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
* sell copies of the Software, and to permit persons to whom the Software is
* furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in all
* copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
* AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
* OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
* SOFTWARE.
*/
#ifndef ACL_ARM_COMPUTE_DYNAMIC_FUSION_SKETCH_GPU_OPERATORS_GPUMATMUL_H
#define ACL_ARM_COMPUTE_DYNAMIC_FUSION_SKETCH_GPU_OPERATORS_GPUMATMUL_H
#include "arm_compute/core/Error.h"
#include "arm_compute/core/KernelDescriptors.h"
#include "arm_compute/dynamic_fusion/sketch/attributes/MatMulAttributes.h"
namespace arm_compute
{
namespace experimental
{
namespace dynamic_fusion
{
/** Forward declarations */
class GpuWorkloadContext;
class GpuWorkloadSketch;
/** Backend-specific settings for the GPU MatMul operator.
 *
 * Stores the three block sizes N0, M0 and K0. Each one is 0 until a setter is called.
 */
class GpuMatMulSettings
{
public:
    /** Set N0, the number of columns processed by each work-item.
     *
     * @param[in] n0 Number of columns processed by each work-item
     *
     * @return Reference to a settings object (presumably this one, to allow chaining; the definition is not in this header)
     */
    GpuMatMulSettings &n0(int n0);
    /** Set M0, the number of rows processed by each work-item.
     *
     * @param[in] m0 Number of rows processed by each work-item
     *
     * @return Reference to a settings object (presumably this one, to allow chaining; the definition is not in this header)
     */
    GpuMatMulSettings &m0(int m0);
    /** Set K0, the number of inner accumulations.
     *
     * @param[in] k0 Number of inner accumulations
     *
     * @return Reference to a settings object (presumably this one, to allow chaining; the definition is not in this header)
     */
    GpuMatMulSettings &k0(int k0);

    /** Get N0.
     *
     * @return Number of columns processed by each work-item
     */
    int n0() const;
    /** Get M0.
     *
     * @return Number of rows processed by each work-item
     */
    int m0() const;
    /** Get K0.
     *
     * @return Number of inner accumulations
     */
    int k0() const;

private:
    int _n0 = 0; /**< N0: columns processed by each work-item */
    int _m0 = 0; /**< M0: rows processed by each work-item */
    int _k0 = 0; /**< K0: inner accumulations */
};
/** Operator interface.
*
* Groups the static entry points used to check a matrix multiplication
* operator and to fuse it into a @ref GpuWorkloadSketch. The class declares
* only type aliases and static member functions.
*/
class GpuMatMul final
{
public:
/** Attributes are a set of backend-agnostic parameters that define what an operator does */
using Attributes = MatMulAttributes;
/** Settings are a set of backend-specific parameters that influence the implementation of an operator */
using Settings = GpuMatMulSettings;
/** Create an operator and fuse it into the workload sketch.
* @note If @ref validate_op() fails, the creation also fails and may throw an error.
* @note If @ref validate_op() fails, @p sketch remains unchanged and valid.
*
* Valid data type configurations:
* |LHS |RHS |dst |
* |:--------------|:--------------|:--------------|
* |F16 |F16 |F16 |
* |F32 |F32 |F32 |
*
*
* @param[in,out] sketch Workload sketch into which the operator will be fused
* @param[in] lhs Input tensor info for the LHS matrix. Data type supported: F32/F16. Dimensions above 2 are collapsed onto dimension 2 and represent the batch.
* @param[in] rhs Input tensor info for the RHS matrix. Data type supported: same as @p lhs. Dimensions above 2 are collapsed onto dimension 2 and represent the batch.
* @param[in] attributes Operator attributes
* @param[in] settings Operator settings
*
* @return Pointer to the destination tensor info
*/
static ITensorInfo *create_op(GpuWorkloadSketch &sketch,
ITensorInfo *lhs,
ITensorInfo *rhs,
const Attributes &attributes,
const Settings &settings);
/** Check if the operator configuration is supported, irrespective of fusion
*
* @param[in] context Workload context within which the operator is running
* @param[in] lhs Input tensor info for the LHS matrix.
* @param[in] rhs Input tensor info for the RHS matrix.
* @param[in] attributes Operator attributes
* @param[in] settings Operator settings
*
* @return Status
*/
static Status is_supported_op(const GpuWorkloadContext &context,
const ITensorInfo *lhs,
const ITensorInfo *rhs,
const Attributes &attributes,
const Settings &settings);
/** Check if the operator configuration is supported and if it can be fused into the workload sketch.
*
* Parameters are similar to @ref GpuMatMul::create_op()
*
* @param[in] sketch Workload sketch against which the fusion is checked
* @param[in] lhs Input tensor info for the LHS matrix.
* @param[in] rhs Input tensor info for the RHS matrix.
* @param[in] attributes Operator attributes
* @param[in] settings Operator settings
*
* @return Status
*/
static Status validate_op(const GpuWorkloadSketch &sketch,
const ITensorInfo *lhs,
const ITensorInfo *rhs,
const Attributes &attributes,
const Settings &settings);
};
} // namespace dynamic_fusion
} // namespace experimental
} // namespace arm_compute
#endif // ACL_ARM_COMPUTE_DYNAMIC_FUSION_SKETCH_GPU_OPERATORS_GPUMATMUL_H