src/dynamic_fusion/sketch/gpu/components/cl/ClComponentMatMul.cpp - ml/ComputeLibrary - Gitiles

 /*
  * Copyright (c) 2023-2024 Arm Limited.
  *
  * SPDX-License-Identifier: MIT
  *
  * Permission is hereby granted, free of charge, to any person obtaining a copy
  * of this software and associated documentation files (the "Software"), to
  * deal in the Software without restriction, including without limitation the
  * rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
  * sell copies of the Software, and to permit persons to whom the Software is
  * furnished to do so, subject to the following conditions:
  *
  * The above copyright notice and this permission notice shall be included in all
  * copies or substantial portions of the Software.
  *
  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
  * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
  * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
  * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
  * SOFTWARE.
  */

 #include "src/dynamic_fusion/sketch/gpu/components/cl/ClComponentMatMul.h"

 #include "arm_compute/core/utils/misc/ShapeCalculator.h"
 #include "arm_compute/core/Validate.h"
 #include "arm_compute/dynamic_fusion/sketch/attributes/MatMulAttributes.h"

 #include "src/core/CL/CLValidate.h"
 #include "src/dynamic_fusion/sketch/gpu/ckw_driver/components/GpuCkwMatMul.h"
 #include "src/gpu/cl/kernels/helpers/MatMulKernelHelpers.h"

 namespace arm_compute
 {
 namespace experimental
 {
 namespace dynamic_fusion
 {
 namespace
 {
 using Attributes = MatMulAttributes;
 using Settings   = GpuMatMulSettings;

 Status validate_matmul_kernel_info(Attributes attributes, Settings settings)
 {
     const bool adj_lhs = attributes.adj_lhs();
     const bool adj_rhs = attributes.adj_rhs();
     const int  m0      = settings.m0();
     const int  n0      = settings.n0();
     const int  k0      = settings.k0();

     // Validate M0
     ARM_COMPUTE_RETURN_ERROR_ON_MSG(m0 < 1, "Only positive integers are supported for M0");

     if (adj_lhs)
     {
         ARM_COMPUTE_RETURN_ERROR_ON_MSG(((m0 & (m0 - 1)) && (m0 != 3)) || (m0 > 16),
                                         "Only 1,2,3,4,8,16 are supported for M0 for Lhs transposed");
     }

     // Validate N0
     ARM_COMPUTE_RETURN_ERROR_ON_MSG(n0 < 1, "Only positive integers are supported for N0");
     ARM_COMPUTE_RETURN_ERROR_ON_MSG(((n0 & (n0 - 1)) && (n0 != 3)) || (n0 > 16),
                                     "Only 1,2,3,4,8,16 are supported for N0");

     // Validate K0
     ARM_COMPUTE_RETURN_ERROR_ON_MSG(k0 < 1, "Only positive integers are supported for K0");
     if (!adj_lhs || adj_rhs)
     {
         ARM_COMPUTE_RETURN_ERROR_ON_MSG(((k0 & (k0 - 1)) && (k0 != 3)) || (k0 > 16),
                                         "Only 1,2,3,4,8,16 are supported for K0");
     }

     return Status{};
 }

 } // namespace

 Status ClComponentMatMul::validate(const Properties                &properties,
                                    const ArgumentPack<ITensorInfo> &tensors,
                                    const Attributes                &attributes,
                                    const Settings                  &settings)
 {
     ARM_COMPUTE_UNUSED(properties);
     ARM_COMPUTE_UNUSED(attributes);

     const auto lhs = tensors.get_const_tensor(TensorType::ACL_SRC_0);
     const auto rhs = tensors.get_const_tensor(TensorType::ACL_SRC_1);
     const auto dst = tensors.get_const_tensor(TensorType::ACL_DST_0);

     // Currently, the only supported case is when adj_lhs = false and adj_rhs = true
     ARM_COMPUTE_RETURN_ERROR_ON((attributes.adj_lhs() != false) && (attributes.adj_rhs() != true));

     // Check if Matching data type
     ARM_COMPUTE_RETURN_ERROR_ON_MISMATCHING_DATA_TYPES(lhs, rhs);
     ARM_COMPUTE_RETURN_ERROR_ON_MISMATCHING_DATA_TYPES(lhs, dst);

     // Data type
     ARM_COMPUTE_RETURN_ERROR_ON_DATA_TYPE_CHANNEL_NOT_IN(lhs, 1, DataType::F16, DataType::F32);
     ARM_COMPUTE_RETURN_ERROR_ON_MISMATCHING_DATA_TYPES(lhs, dst);

     // All tensor infos are initialized
     ARM_COMPUTE_RETURN_ERROR_ON(lhs->tensor_shape().total_size() == 0);
     ARM_COMPUTE_RETURN_ERROR_ON(rhs->tensor_shape().total_size() == 0);
     ARM_COMPUTE_RETURN_ERROR_ON(dst->tensor_shape().total_size() == 0);

     // Device requirements are met
     ARM_COMPUTE_RETURN_ERROR_ON_F16_UNSUPPORTED(lhs);

     // Check if block sizes are supported
     MatMulKernelInfo matmul_kernel_info =
         MatMulKernelInfo(attributes.adj_lhs(), attributes.adj_rhs(), settings.m0(), settings.n0(), settings.k0());
     ARM_COMPUTE_RETURN_ON_ERROR(validate_matmul_kernel_info(attributes, settings));
     ARM_COMPUTE_RETURN_ON_ERROR(
         opencl::kernels::validate_matmul_input_shapes(lhs->tensor_shape(), rhs->tensor_shape(), matmul_kernel_info));

     // Check if dst shape is correct
     const auto expected_dst_shape =
         misc::shape_calculator::compute_matmul_shape(lhs->tensor_shape(), rhs->tensor_shape(), matmul_kernel_info);
     ARM_COMPUTE_RETURN_ERROR_ON_MISMATCHING_DIMENSIONS(dst->tensor_shape(), expected_dst_shape);

     return Status{};
 }

 ClComponentMatMul::ClComponentMatMul(ComponentId                      id,
                                      const Properties                &properties,
                                      const ArgumentPack<ITensorInfo> &tensors,
                                      const Attributes                &attributes,
                                      const Settings                  &settings)
     : IGpuKernelComponent{id, properties, tensors},
       _component_writer{std::make_unique<GpuCkwMatMul>(id, tensors, attributes, settings)}
 {
 }

 ClComponentMatMul::~ClComponentMatMul()
 {
 }

 const IGpuCkwComponentDriver *ClComponentMatMul::ckw_component_driver() const
 {
     return _component_writer.get();
 }

 } // namespace dynamic_fusion
 } // namespace experimental
 } // namespace arm_compute
	/*
	* Copyright (c) 2023-2024 Arm Limited.
	*
	* SPDX-License-Identifier: MIT
	*
	* Permission is hereby granted, free of charge, to any person obtaining a copy
	* of this software and associated documentation files (the "Software"), to
	* deal in the Software without restriction, including without limitation the
	* rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
	* sell copies of the Software, and to permit persons to whom the Software is
	* furnished to do so, subject to the following conditions:
	*
	* The above copyright notice and this permission notice shall be included in all
	* copies or substantial portions of the Software.
	*
	* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
	* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
	* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
	* AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
	* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
	* OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
	* SOFTWARE.
	*/

	#include "src/dynamic_fusion/sketch/gpu/components/cl/ClComponentMatMul.h"

	#include "arm_compute/core/utils/misc/ShapeCalculator.h"
	#include "arm_compute/core/Validate.h"
	#include "arm_compute/dynamic_fusion/sketch/attributes/MatMulAttributes.h"

	#include "src/core/CL/CLValidate.h"
	#include "src/dynamic_fusion/sketch/gpu/ckw_driver/components/GpuCkwMatMul.h"
	#include "src/gpu/cl/kernels/helpers/MatMulKernelHelpers.h"

	namespace arm_compute
	{
	namespace experimental
	{
	namespace dynamic_fusion
	{
	namespace
	{
	using Attributes = MatMulAttributes;
	using Settings = GpuMatMulSettings;

	Status validate_matmul_kernel_info(Attributes attributes, Settings settings)
	{
	const bool adj_lhs = attributes.adj_lhs();
	const bool adj_rhs = attributes.adj_rhs();
	const int m0 = settings.m0();
	const int n0 = settings.n0();
	const int k0 = settings.k0();

	// Validate M0
	ARM_COMPUTE_RETURN_ERROR_ON_MSG(m0 < 1, "Only positive integers are supported for M0");

	if (adj_lhs)
	{
	ARM_COMPUTE_RETURN_ERROR_ON_MSG(((m0 & (m0 - 1)) && (m0 != 3)) \|\| (m0 > 16),
	"Only 1,2,3,4,8,16 are supported for M0 for Lhs transposed");
	}

	// Validate N0
	ARM_COMPUTE_RETURN_ERROR_ON_MSG(n0 < 1, "Only positive integers are supported for N0");
	ARM_COMPUTE_RETURN_ERROR_ON_MSG(((n0 & (n0 - 1)) && (n0 != 3)) \|\| (n0 > 16),
	"Only 1,2,3,4,8,16 are supported for N0");

	// Validate K0
	ARM_COMPUTE_RETURN_ERROR_ON_MSG(k0 < 1, "Only positive integers are supported for K0");
	if (!adj_lhs \|\| adj_rhs)
	{
	ARM_COMPUTE_RETURN_ERROR_ON_MSG(((k0 & (k0 - 1)) && (k0 != 3)) \|\| (k0 > 16),
	"Only 1,2,3,4,8,16 are supported for K0");
	}

	return Status{};
	}

	} // namespace

	Status ClComponentMatMul::validate(const Properties &properties,
	const ArgumentPack<ITensorInfo> &tensors,
	const Attributes &attributes,
	const Settings &settings)
	{
	ARM_COMPUTE_UNUSED(properties);
	ARM_COMPUTE_UNUSED(attributes);

	const auto lhs = tensors.get_const_tensor(TensorType::ACL_SRC_0);
	const auto rhs = tensors.get_const_tensor(TensorType::ACL_SRC_1);
	const auto dst = tensors.get_const_tensor(TensorType::ACL_DST_0);

	// Currently, the only supported case is when adj_lhs = false and adj_rhs = true
	ARM_COMPUTE_RETURN_ERROR_ON((attributes.adj_lhs() != false) && (attributes.adj_rhs() != true));

	// Check if Matching data type
	ARM_COMPUTE_RETURN_ERROR_ON_MISMATCHING_DATA_TYPES(lhs, rhs);
	ARM_COMPUTE_RETURN_ERROR_ON_MISMATCHING_DATA_TYPES(lhs, dst);

	// Data type
	ARM_COMPUTE_RETURN_ERROR_ON_DATA_TYPE_CHANNEL_NOT_IN(lhs, 1, DataType::F16, DataType::F32);
	ARM_COMPUTE_RETURN_ERROR_ON_MISMATCHING_DATA_TYPES(lhs, dst);

	// All tensor infos are initialized
	ARM_COMPUTE_RETURN_ERROR_ON(lhs->tensor_shape().total_size() == 0);
	ARM_COMPUTE_RETURN_ERROR_ON(rhs->tensor_shape().total_size() == 0);
	ARM_COMPUTE_RETURN_ERROR_ON(dst->tensor_shape().total_size() == 0);

	// Device requirements are met
	ARM_COMPUTE_RETURN_ERROR_ON_F16_UNSUPPORTED(lhs);

	// Check if block sizes are supported
	MatMulKernelInfo matmul_kernel_info =
	MatMulKernelInfo(attributes.adj_lhs(), attributes.adj_rhs(), settings.m0(), settings.n0(), settings.k0());
	ARM_COMPUTE_RETURN_ON_ERROR(validate_matmul_kernel_info(attributes, settings));
	ARM_COMPUTE_RETURN_ON_ERROR(
	opencl::kernels::validate_matmul_input_shapes(lhs->tensor_shape(), rhs->tensor_shape(), matmul_kernel_info));

	// Check if dst shape is correct
	const auto expected_dst_shape =
	misc::shape_calculator::compute_matmul_shape(lhs->tensor_shape(), rhs->tensor_shape(), matmul_kernel_info);
	ARM_COMPUTE_RETURN_ERROR_ON_MISMATCHING_DIMENSIONS(dst->tensor_shape(), expected_dst_shape);

	return Status{};
	}

	ClComponentMatMul::ClComponentMatMul(ComponentId id,
	const Properties &properties,
	const ArgumentPack<ITensorInfo> &tensors,
	const Attributes &attributes,
	const Settings &settings)
	: IGpuKernelComponent{id, properties, tensors},
	_component_writer{std::make_unique<GpuCkwMatMul>(id, tensors, attributes, settings)}
	{
	}

	ClComponentMatMul::~ClComponentMatMul()
	{
	}

	const IGpuCkwComponentDriver *ClComponentMatMul::ckw_component_driver() const
	{
	return _component_writer.get();
	}

	} // namespace dynamic_fusion
	} // namespace experimental
	} // namespace arm_compute