tests/validation/NEON/ArithmeticAddition.cpp - ml/ComputeLibrary - Gitiles

 /*
  * Copyright (c) 2017-2023 Arm Limited.
  *
  * SPDX-License-Identifier: MIT
  *
  * Permission is hereby granted, free of charge, to any person obtaining a copy
  * of this software and associated documentation files (the "Software"), to
  * deal in the Software without restriction, including without limitation the
  * rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
  * sell copies of the Software, and to permit persons to whom the Software is
  * furnished to do so, subject to the following conditions:
  *
  * The above copyright notice and this permission notice shall be included in all
  * copies or substantial portions of the Software.
  *
  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
  * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
  * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
  * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
  * SOFTWARE.
  */
 #include "arm_compute/core/Types.h"
 #include "arm_compute/core/utils/StringUtils.h"
 #include "arm_compute/runtime/NEON/functions/NEArithmeticAddition.h"
 #include "arm_compute/runtime/Tensor.h"
 #include "arm_compute/runtime/TensorAllocator.h"
 #include "src/common/cpuinfo/CpuIsaInfo.h"
 #include "src/cpu/kernels/CpuAddKernel.h"
 #include "tests/NEON/Accessor.h"
 #include "tests/PaddingCalculator.h"
 #include "tests/datasets/ConvertPolicyDataset.h"
 #include "tests/datasets/ShapeDatasets.h"
 #include "tests/framework/Asserts.h"
 #include "tests/framework/Macros.h"
 #include "tests/framework/datasets/Datasets.h"
 #include "tests/validation/Validation.h"
 #include "tests/validation/fixtures/ArithmeticOperationsFixture.h"

 namespace arm_compute
 {
 namespace test
 {
 namespace validation
 {
 namespace
 {
 // File-local constants shared by the test cases below.
 // tolerance_quant is the absolute tolerance passed to validate() by the quantized test cases:
 // 1 when not building for aarch64 or when ENABLE_SVE is defined, 0 otherwise.
 #if !defined(__aarch64__) || defined(ENABLE_SVE)
 constexpr AbsoluteTolerance<float> tolerance_quant(1); /**< Tolerance value for comparing reference's output against implementation's output for quantized data types */
 #else                                                  // !defined(__aarch64__) || defined(ENABLE_SVE)
 constexpr AbsoluteTolerance<float> tolerance_quant(0);
 #endif                                                 // !defined(__aarch64__) || defined(ENABLE_SVE)
 // "InPlace" dataset holding both false and true. NOTE(review): no test case visible in this file references it.
 const auto InPlaceDataSet    = framework::dataset::make("InPlace", { false, true });
 // "InPlace" dataset holding only false; this is the one every fixture test case below combines in.
 const auto OutOfPlaceDataSet = framework::dataset::make("InPlace", { false });
 } // namespace

 TEST_SUITE(NEON)
 TEST_SUITE(ArithmeticAddition)

 // Alias of ArithmeticAdditionValidationFixture bound to Tensor, Accessor and NEArithmeticAddition;
 // T is forwarded as the fixture's last template argument.
 template <typename T>
 using NEArithmeticAdditionFixture = ArithmeticAdditionValidationFixture<Tensor, Accessor, NEArithmeticAddition, T>;

 // *INDENT-OFF*
 // clang-format off
 // Runs NEArithmeticAddition::validate() on four zipped rows of (Input1Info, Input2Info, OutputInfo)
 // and compares the boolean outcome with the matching "Expected" entry. Only the first row is expected to pass.
 DATA_TEST_CASE(Validate, framework::DatasetMode::ALL,
     zip(zip(zip(
         framework::dataset::make("Input1Info", { TensorInfo(TensorShape(32U, 13U, 2U), 1, DataType::F32),
                                                  TensorInfo(TensorShape(27U, 13U, 2U), 1, DataType::U8),   // Unsupported broadcast
                                                  TensorInfo(TensorShape(32U, 13U, 2U), 1, DataType::U8),   // Invalid data type combination
                                                  TensorInfo(TensorShape(32U, 13U, 2U), 1, DataType::F32) }), // Mismatching shapes
         framework::dataset::make("Input2Info", { TensorInfo(TensorShape(32U, 13U, 2U), 1, DataType::F32),
                                                  TensorInfo(TensorShape(1U, 13U, 2U), 1, DataType::S16),
                                                  TensorInfo(TensorShape(32U, 13U, 2U), 1, DataType::S16),
                                                  TensorInfo(TensorShape(48U, 11U, 2U), 1, DataType::F32) })),
         framework::dataset::make("OutputInfo", { TensorInfo(TensorShape(32U, 13U, 2U), 1, DataType::F32),
                                                  TensorInfo(TensorShape(27U, 13U, 2U), 1, DataType::S16),
                                                  TensorInfo(TensorShape(32U, 13U, 2U), 1, DataType::U8),
                                                  TensorInfo(TensorShape(48U, 11U, 2U), 1, DataType::F32) })),
         framework::dataset::make("Expected", { true, false, false, false })),
     input1_info, input2_info, output_info, expected)
 {
     // Work on clones of the three descriptors, each marked as non-resizable.
     const auto src0_info = input1_info.clone();
     const auto src1_info = input2_info.clone();
     const auto dst_info  = output_info.clone();
     src0_info->set_is_resizable(false);
     src1_info->set_is_resizable(false);
     dst_info->set_is_resizable(false);

     Status s = NEArithmeticAddition::validate(src0_info.get(), src1_info.get(), dst_info.get(), ConvertPolicy::WRAP);
     ARM_COMPUTE_EXPECT(bool(s) == expected, framework::LogLevel::ERRORS);
 }

 // For each (CpuExt, DataType, CanUseFixedpoint) row, asks CpuAddKernel for its preferred implementation
 // and checks the implementation's name against the name built from the row.
 DATA_TEST_CASE(KernelSelection, framework::DatasetMode::ALL,
     concat(concat(
         // Rows for "NEON"
         combine(combine(
             framework::dataset::make("CpuExt", std::string("NEON")),
             framework::dataset::make("DataType", { DataType::F32, DataType::F16, DataType::U8, DataType::S16, DataType::S32,
                                                    DataType::QASYMM8, DataType::QASYMM8_SIGNED, DataType::QSYMM16 })),
             framework::dataset::make("CanUseFixedpoint", { true, false })),
         // Rows for "SVE"
         combine(combine(
             framework::dataset::make("CpuExt", std::string("SVE")),
             framework::dataset::make("DataType", { DataType::F32, DataType::F16, DataType::U8, DataType::S16, DataType::S32 })),
             framework::dataset::make("CanUseFixedpoint", { true, false }))),
         // Rows for "SVE2"
         combine(combine(
             framework::dataset::make("CpuExt", std::string("SVE2")),
             framework::dataset::make("DataType", { DataType::QASYMM8, DataType::QASYMM8_SIGNED, DataType::QSYMM16 })),
             framework::dataset::make("CanUseFixedpoint", { true, false }))),
     cpu_ext, data_type, can_use_fixedpoint)
 {
     using namespace cpu::kernels;

     // Start from a value-initialized ISA description; of neon/sve/sve2 only the flag matching cpu_ext
     // becomes true, and fp16 is set only for F16 rows.
     cpuinfo::CpuIsaInfo isa{};
     isa.neon = (cpu_ext == "NEON");
     isa.sve  = (cpu_ext == "SVE");
     isa.sve2 = (cpu_ext == "SVE2");
     isa.fp16 = (data_type == DataType::F16);

     const CpuAddKernelDataTypeISASelectorData selector{ data_type, isa, can_use_fixedpoint };
     const auto *selected_impl = CpuAddKernel::get_implementation(selector, cpu::KernelSelectionType::Preferred);

     // NOTE(review): confirm this check is active in every build configuration, since the pointer is dereferenced below.
     ARM_COMPUTE_ERROR_ON_NULLPTR(selected_impl);

     // QASYMM8 / QASYMM8_SIGNED rows with fixed-point allowed expect the "neon_..._add_fixedpoint" name whatever
     // cpu_ext is; every other row expects "<lower-cased cpu_ext>_<type>_add".
     const bool        is_qasymm8 = (data_type == DataType::QASYMM8) || (data_type == DataType::QASYMM8_SIGNED);
     const std::string expected   = (is_qasymm8 && can_use_fixedpoint) ?
                                    "neon_" + cpu_impl_dt(data_type) + "_add_fixedpoint" :
                                    lower_string(cpu_ext) + "_" + cpu_impl_dt(data_type) + "_add";
     const std::string actual     = selected_impl->name;

     ARM_COMPUTE_EXPECT_EQUAL(expected, actual, framework::LogLevel::ERRORS);
 }
 // clang-format on
 // *INDENT-ON*

 // Configures a 15x15 + 15x1 F32 addition and checks that the padding of all three tensors
 // still equals a default-constructed PaddingSize afterwards.
 TEST_CASE(NoPaddingAdded, framework::DatasetMode::PRECOMMIT)
 {
     const TensorShape full_shape(15U, 15U);
     const TensorShape row_shape(15U, 1U);

     Tensor input1 = create_tensor<Tensor>(full_shape, DataType::F32);
     Tensor input2 = create_tensor<Tensor>(row_shape, DataType::F32);
     Tensor output = create_tensor<Tensor>(full_shape, DataType::F32);

     NEArithmeticAddition add;
     add.configure(&input1, &input2, &output, ConvertPolicy::WRAP);

     // Same order as the tensors were created: input1, input2, output.
     const PaddingSize no_padding{};
     for(const Tensor *tensor : { &input1, &input2, &output })
     {
         validate(tensor->info()->padding(), no_padding);
     }
 }

 TEST_SUITE(Integer)
 TEST_SUITE(U8)
 // PRECOMMIT: datasets::SmallShapes() x DataType::U8 x { SATURATE, WRAP } x OutOfPlaceDataSet.
 FIXTURE_DATA_TEST_CASE(RunSmall, NEArithmeticAdditionFixture<uint8_t>, framework::DatasetMode::PRECOMMIT,
     combine(combine(combine(
         datasets::SmallShapes(),
         framework::dataset::make("DataType", DataType::U8)),
         framework::dataset::make("ConvertPolicy", { ConvertPolicy::SATURATE, ConvertPolicy::WRAP })),
         OutOfPlaceDataSet))
 {
     // Check the fixture's _target, read through an Accessor, against its _reference.
     const Accessor target_view(_target);
     validate(target_view, _reference);
 }
 TEST_SUITE_END() // U8

 TEST_SUITE(S16)
 // PRECOMMIT: datasets::SmallShapes() x DataType::S16 x { SATURATE, WRAP } x OutOfPlaceDataSet.
 FIXTURE_DATA_TEST_CASE(RunSmall, NEArithmeticAdditionFixture<int16_t>, framework::DatasetMode::PRECOMMIT,
     combine(combine(combine(
         datasets::SmallShapes(),
         framework::dataset::make("DataType", DataType::S16)),
         framework::dataset::make("ConvertPolicy", { ConvertPolicy::SATURATE, ConvertPolicy::WRAP })),
         OutOfPlaceDataSet))
 {
     // Check the fixture's _target, read through an Accessor, against its _reference.
     const Accessor target_view(_target);
     validate(target_view, _reference);
 }

 // NIGHTLY: datasets::LargeShapes() x DataType::S16 x { SATURATE, WRAP } x OutOfPlaceDataSet.
 FIXTURE_DATA_TEST_CASE(RunLarge, NEArithmeticAdditionFixture<int16_t>, framework::DatasetMode::NIGHTLY,
     combine(combine(combine(
         datasets::LargeShapes(),
         framework::dataset::make("DataType", DataType::S16)),
         framework::dataset::make("ConvertPolicy", { ConvertPolicy::SATURATE, ConvertPolicy::WRAP })),
         OutOfPlaceDataSet))
 {
     // Check the fixture's _target, read through an Accessor, against its _reference.
     const Accessor target_view(_target);
     validate(target_view, _reference);
 }
 TEST_SUITE_END() // S16

 TEST_SUITE(S32)
 // ALL modes: datasets::SmallShapes() x DataType::S32 x { SATURATE, WRAP } x OutOfPlaceDataSet.
 FIXTURE_DATA_TEST_CASE(RunSmall, NEArithmeticAdditionFixture<int32_t>, framework::DatasetMode::ALL,
     combine(combine(combine(
         datasets::SmallShapes(),
         framework::dataset::make("DataType", DataType::S32)),
         framework::dataset::make("ConvertPolicy", { ConvertPolicy::SATURATE, ConvertPolicy::WRAP })),
         OutOfPlaceDataSet))
 {
     // Check the fixture's _target, read through an Accessor, against its _reference.
     const Accessor target_view(_target);
     validate(target_view, _reference);
 }
 TEST_SUITE_END() // S32
 TEST_SUITE_END() // Integer

 TEST_SUITE(Float)
 #ifdef __ARM_FEATURE_FP16_VECTOR_ARITHMETIC
 TEST_SUITE(F16)
 // ALL modes: datasets::SmallShapes() x DataType::F16 x { SATURATE, WRAP } x OutOfPlaceDataSet.
 FIXTURE_DATA_TEST_CASE(RunSmall, NEArithmeticAdditionFixture<half>, framework::DatasetMode::ALL,
     combine(combine(combine(
         datasets::SmallShapes(),
         framework::dataset::make("DataType", DataType::F16)),
         framework::dataset::make("ConvertPolicy", { ConvertPolicy::SATURATE, ConvertPolicy::WRAP })),
         OutOfPlaceDataSet))
 {
     // Check the fixture's _target, read through an Accessor, against its _reference.
     const Accessor target_view(_target);
     validate(target_view, _reference);
 }
 TEST_SUITE_END() // F16
 #endif           /* __ARM_FEATURE_FP16_VECTOR_ARITHMETIC */

 TEST_SUITE(F32)
 // PRECOMMIT: datasets::SmallShapes() x DataType::F32 x { SATURATE, WRAP } x OutOfPlaceDataSet.
 FIXTURE_DATA_TEST_CASE(RunSmall, NEArithmeticAdditionFixture<float>, framework::DatasetMode::PRECOMMIT,
     combine(combine(combine(
         datasets::SmallShapes(),
         framework::dataset::make("DataType", DataType::F32)),
         framework::dataset::make("ConvertPolicy", { ConvertPolicy::SATURATE, ConvertPolicy::WRAP })),
         OutOfPlaceDataSet))
 {
     // Check the fixture's _target, read through an Accessor, against its _reference.
     const Accessor target_view(_target);
     validate(target_view, _reference);
 }

 // NIGHTLY: datasets::LargeShapes() x DataType::F32 x { SATURATE, WRAP } x OutOfPlaceDataSet.
 FIXTURE_DATA_TEST_CASE(RunLarge, NEArithmeticAdditionFixture<float>, framework::DatasetMode::NIGHTLY,
     combine(combine(combine(
         datasets::LargeShapes(),
         framework::dataset::make("DataType", DataType::F32)),
         framework::dataset::make("ConvertPolicy", { ConvertPolicy::SATURATE, ConvertPolicy::WRAP })),
         OutOfPlaceDataSet))
 {
     // Check the fixture's _target, read through an Accessor, against its _reference.
     const Accessor target_view(_target);
     validate(target_view, _reference);
 }

 // Alias of ArithmeticAdditionBroadcastValidationFixture bound to Tensor, Accessor and NEArithmeticAddition;
 // used by the broadcast test cases that follow.
 template <typename T>
 using NEArithmeticAdditionBroadcastFixture = ArithmeticAdditionBroadcastValidationFixture<Tensor, Accessor, NEArithmeticAddition, T>;

 // PRECOMMIT: datasets::SmallShapesBroadcast() x DataType::F32 x { SATURATE, WRAP } x OutOfPlaceDataSet.
 FIXTURE_DATA_TEST_CASE(RunSmallBroadcast, NEArithmeticAdditionBroadcastFixture<float>, framework::DatasetMode::PRECOMMIT,
     combine(combine(combine(
         datasets::SmallShapesBroadcast(),
         framework::dataset::make("DataType", DataType::F32)),
         framework::dataset::make("ConvertPolicy", { ConvertPolicy::SATURATE, ConvertPolicy::WRAP })),
         OutOfPlaceDataSet))
 {
     // Check the fixture's _target, read through an Accessor, against its _reference.
     const Accessor target_view(_target);
     validate(target_view, _reference);
 }

 // NIGHTLY: datasets::LargeShapesBroadcast() x DataType::F32 x { SATURATE, WRAP } x OutOfPlaceDataSet.
 FIXTURE_DATA_TEST_CASE(RunLargeBroadcast, NEArithmeticAdditionBroadcastFixture<float>, framework::DatasetMode::NIGHTLY,
     combine(combine(combine(
         datasets::LargeShapesBroadcast(),
         framework::dataset::make("DataType", DataType::F32)),
         framework::dataset::make("ConvertPolicy", { ConvertPolicy::SATURATE, ConvertPolicy::WRAP })),
         OutOfPlaceDataSet))
 {
     // Check the fixture's _target, read through an Accessor, against its _reference.
     const Accessor target_view(_target);
     validate(target_view, _reference);
 }
 TEST_SUITE_END() // F32
 TEST_SUITE_END() // Float

 // Alias of ArithmeticAdditionValidationQuantizedFixture bound to Tensor, Accessor and NEArithmeticAddition.
 template <typename T>
 using NEArithmeticAdditionQuantizedFixture = ArithmeticAdditionValidationQuantizedFixture<Tensor, Accessor, NEArithmeticAddition, T>;

 // Alias of ArithmeticAdditionValidationQuantizedBroadcastFixture bound to Tensor, Accessor and NEArithmeticAddition.
 template <typename T>
 using NEArithmeticAdditionQuantizedBroadcastFixture = ArithmeticAdditionValidationQuantizedBroadcastFixture<Tensor, Accessor, NEArithmeticAddition, T>;

 TEST_SUITE(Quantized)
 TEST_SUITE(QASYMM8)
 // PRECOMMIT: datasets::SmallShapes() x DataType::QASYMM8 x SATURATE, with one quantization info per operand,
 // combined with OutOfPlaceDataSet.
 FIXTURE_DATA_TEST_CASE(RunSmall, NEArithmeticAdditionQuantizedFixture<uint8_t>, framework::DatasetMode::PRECOMMIT,
     combine(combine(combine(combine(combine(combine(
         datasets::SmallShapes(),
         framework::dataset::make("DataType", DataType::QASYMM8)),
         framework::dataset::make("ConvertPolicy", { ConvertPolicy::SATURATE })),
         framework::dataset::make("Src0QInfo", { QuantizationInfo(5.f / 255.f, 20) })),
         framework::dataset::make("Src1QInfo", { QuantizationInfo(2.f / 255.f, 10) })),
         framework::dataset::make("OutQInfo", { QuantizationInfo(1.f / 255.f, 5) })),
         OutOfPlaceDataSet))
 {
     // Check the fixture's _target against its _reference, allowing tolerance_quant.
     const Accessor target_view(_target);
     validate(target_view, _reference, tolerance_quant);
 }
 TEST_SUITE_END() // QASYMM8

 TEST_SUITE(QASYMM8_SIGNED)
 // ALL modes: datasets::SmallShapes() x DataType::QASYMM8_SIGNED x SATURATE, with one quantization info per operand,
 // combined with OutOfPlaceDataSet.
 FIXTURE_DATA_TEST_CASE(RunSmall, NEArithmeticAdditionQuantizedFixture<int8_t>, framework::DatasetMode::ALL,
     combine(combine(combine(combine(combine(combine(
         datasets::SmallShapes(),
         framework::dataset::make("DataType", DataType::QASYMM8_SIGNED)),
         framework::dataset::make("ConvertPolicy", { ConvertPolicy::SATURATE })),
         framework::dataset::make("Src0QInfo", { QuantizationInfo(0.5f, 20) })),
         framework::dataset::make("Src1QInfo", { QuantizationInfo(0.5f, 10) })),
         framework::dataset::make("OutQInfo", { QuantizationInfo(0.5f, 5) })),
         OutOfPlaceDataSet))
 {
     // Check the fixture's _target against its _reference, allowing tolerance_quant.
     const Accessor target_view(_target);
     validate(target_view, _reference, tolerance_quant);
 }

 // ALL modes: datasets::SmallShapesBroadcast() x DataType::QASYMM8_SIGNED x SATURATE, with one quantization info
 // per operand, combined with OutOfPlaceDataSet.
 FIXTURE_DATA_TEST_CASE(RunSmallBroadcast, NEArithmeticAdditionQuantizedBroadcastFixture<int8_t>, framework::DatasetMode::ALL,
     combine(combine(combine(combine(combine(combine(
         datasets::SmallShapesBroadcast(),
         framework::dataset::make("DataType", DataType::QASYMM8_SIGNED)),
         framework::dataset::make("ConvertPolicy", { ConvertPolicy::SATURATE })),
         framework::dataset::make("Src0QInfo", { QuantizationInfo(0.5f, 20) })),
         framework::dataset::make("Src1QInfo", { QuantizationInfo(0.5f, 10) })),
         framework::dataset::make("OutQInfo", { QuantizationInfo(0.5f, 5) })),
         OutOfPlaceDataSet))
 {
     // Check the fixture's _target against its _reference, allowing tolerance_quant.
     const Accessor target_view(_target);
     validate(target_view, _reference, tolerance_quant);
 }
 TEST_SUITE_END() // QASYMM8_SIGNED

 TEST_SUITE(QSYMM16)
 // PRECOMMIT: datasets::SmallShapes() x DataType::QSYMM16 x SATURATE, with two quantization infos for each input
 // and one for the output, combined with OutOfPlaceDataSet.
 FIXTURE_DATA_TEST_CASE(RunSmall, NEArithmeticAdditionQuantizedFixture<int16_t>, framework::DatasetMode::PRECOMMIT,
     combine(combine(combine(combine(combine(combine(
         datasets::SmallShapes(),
         framework::dataset::make("DataType", DataType::QSYMM16)),
         framework::dataset::make("ConvertPolicy", { ConvertPolicy::SATURATE })),
         framework::dataset::make("Src0QInfo", { QuantizationInfo(1.f / 32768.f, 0), QuantizationInfo(5.f / 32768.f, 0) })),
         framework::dataset::make("Src1QInfo", { QuantizationInfo(2.f / 32768.f, 0), QuantizationInfo(5.f / 32768.f, 0) })),
         framework::dataset::make("OutQInfo", { QuantizationInfo(5.f / 32768.f, 0) })),
         OutOfPlaceDataSet))
 {
     // Check the fixture's _target against its _reference, allowing tolerance_quant.
     const Accessor target_view(_target);
     validate(target_view, _reference, tolerance_quant);
 }
 TEST_SUITE_END() // QSYMM16
 TEST_SUITE_END() // Quantized

 TEST_SUITE_END() // ArithmeticAddition
 TEST_SUITE_END() // Neon
 } // namespace validation
 } // namespace test
 } // namespace arm_compute
	/*
	* Copyright (c) 2017-2023 Arm Limited.
	*
	* SPDX-License-Identifier: MIT
	*
	* Permission is hereby granted, free of charge, to any person obtaining a copy
	* of this software and associated documentation files (the "Software"), to
	* deal in the Software without restriction, including without limitation the
	* rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
	* sell copies of the Software, and to permit persons to whom the Software is
	* furnished to do so, subject to the following conditions:
	*
	* The above copyright notice and this permission notice shall be included in all
	* copies or substantial portions of the Software.
	*
	* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
	* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
	* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
	* AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
	* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
	* OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
	* SOFTWARE.
	*/
	#include "arm_compute/core/Types.h"
	#include "arm_compute/core/utils/StringUtils.h"
	#include "arm_compute/runtime/NEON/functions/NEArithmeticAddition.h"
	#include "arm_compute/runtime/Tensor.h"
	#include "arm_compute/runtime/TensorAllocator.h"
	#include "src/common/cpuinfo/CpuIsaInfo.h"
	#include "src/cpu/kernels/CpuAddKernel.h"
	#include "tests/NEON/Accessor.h"
	#include "tests/PaddingCalculator.h"
	#include "tests/datasets/ConvertPolicyDataset.h"
	#include "tests/datasets/ShapeDatasets.h"
	#include "tests/framework/Asserts.h"
	#include "tests/framework/Macros.h"
	#include "tests/framework/datasets/Datasets.h"
	#include "tests/validation/Validation.h"
	#include "tests/validation/fixtures/ArithmeticOperationsFixture.h"

	namespace arm_compute
	{
	namespace test
	{
	namespace validation
	{
	namespace
	{
	#if !defined(__aarch64__) \|\| defined(ENABLE_SVE)
	constexpr AbsoluteTolerance<float> tolerance_quant(1); /*< Tolerance value for comparing reference's output against implementation's output for quantized data types /
	#else // !defined(__aarch64__) \|\| defined(ENABLE_SVE)
	constexpr AbsoluteTolerance<float> tolerance_quant(0);
	#endif // !defined(__aarch64__) \|\| defined(ENABLE_SVE)
	const auto InPlaceDataSet = framework::dataset::make("InPlace", { false, true });
	const auto OutOfPlaceDataSet = framework::dataset::make("InPlace", { false });
	} // namespace

	TEST_SUITE(NEON)
	TEST_SUITE(ArithmeticAddition)

	// Alias of ArithmeticAdditionValidationFixture bound to Tensor, Accessor and NEArithmeticAddition;
	// T is forwarded as the fixture's last template argument.
	template <typename T>
	using NEArithmeticAdditionFixture = ArithmeticAdditionValidationFixture<Tensor, Accessor, NEArithmeticAddition, T>;

	// *INDENT-OFF*
	// clang-format off
	// Runs NEArithmeticAddition::validate() on four zipped rows of (Input1Info, Input2Info, OutputInfo)
	// and compares the boolean outcome with the matching "Expected" entry. Only the first row is expected to pass.
	DATA_TEST_CASE(Validate, framework::DatasetMode::ALL,
	    zip(zip(zip(
	        framework::dataset::make("Input1Info", { TensorInfo(TensorShape(32U, 13U, 2U), 1, DataType::F32),
	                                                 TensorInfo(TensorShape(27U, 13U, 2U), 1, DataType::U8),   // Unsupported broadcast
	                                                 TensorInfo(TensorShape(32U, 13U, 2U), 1, DataType::U8),   // Invalid data type combination
	                                                 TensorInfo(TensorShape(32U, 13U, 2U), 1, DataType::F32) }), // Mismatching shapes
	        framework::dataset::make("Input2Info", { TensorInfo(TensorShape(32U, 13U, 2U), 1, DataType::F32),
	                                                 TensorInfo(TensorShape(1U, 13U, 2U), 1, DataType::S16),
	                                                 TensorInfo(TensorShape(32U, 13U, 2U), 1, DataType::S16),
	                                                 TensorInfo(TensorShape(48U, 11U, 2U), 1, DataType::F32) })),
	        framework::dataset::make("OutputInfo", { TensorInfo(TensorShape(32U, 13U, 2U), 1, DataType::F32),
	                                                 TensorInfo(TensorShape(27U, 13U, 2U), 1, DataType::S16),
	                                                 TensorInfo(TensorShape(32U, 13U, 2U), 1, DataType::U8),
	                                                 TensorInfo(TensorShape(48U, 11U, 2U), 1, DataType::F32) })),
	        framework::dataset::make("Expected", { true, false, false, false })),
	    input1_info, input2_info, output_info, expected)
	{
	    // Work on clones of the three descriptors, each marked as non-resizable.
	    const auto src0_info = input1_info.clone();
	    const auto src1_info = input2_info.clone();
	    const auto dst_info  = output_info.clone();
	    src0_info->set_is_resizable(false);
	    src1_info->set_is_resizable(false);
	    dst_info->set_is_resizable(false);

	    Status s = NEArithmeticAddition::validate(src0_info.get(), src1_info.get(), dst_info.get(), ConvertPolicy::WRAP);
	    ARM_COMPUTE_EXPECT(bool(s) == expected, framework::LogLevel::ERRORS);
	}

	// For each (CpuExt, DataType, CanUseFixedpoint) row, asks CpuAddKernel for its preferred implementation
	// and checks the implementation's name against the name built from the row.
	DATA_TEST_CASE(KernelSelection, framework::DatasetMode::ALL, concat(concat(
	    combine(combine(framework::dataset::make("CpuExt", std::string("NEON")),
	                    framework::dataset::make("DataType", { DataType::F32,
	                                                           DataType::F16,
	                                                           DataType::U8,
	                                                           DataType::S16,
	                                                           DataType::S32,
	                                                           DataType::QASYMM8,
	                                                           DataType::QASYMM8_SIGNED,
	                                                           DataType::QSYMM16
	                                                         })),
	            framework::dataset::make("CanUseFixedpoint", {true, false})),
	    combine(combine(framework::dataset::make("CpuExt", std::string("SVE")),
	                    framework::dataset::make("DataType", { DataType::F32,
	                                                           DataType::F16,
	                                                           DataType::U8,
	                                                           DataType::S16,
	                                                           DataType::S32
	                                                         })),
	            framework::dataset::make("CanUseFixedpoint", {true, false}))),
	    combine(combine(framework::dataset::make("CpuExt", std::string("SVE2")),
	                    framework::dataset::make("DataType", { DataType::QASYMM8,
	                                                           DataType::QASYMM8_SIGNED,
	                                                           DataType::QSYMM16
	                                                         })),
	            framework::dataset::make("CanUseFixedpoint", {true, false}))),
	    cpu_ext, data_type, can_use_fixedpoint)
	{
	    using namespace cpu::kernels;

	    // Start from a value-initialized ISA description; of neon/sve/sve2 only the flag matching cpu_ext
	    // becomes true, and fp16 is set only for F16 rows.
	    cpuinfo::CpuIsaInfo cpu_isa{};
	    cpu_isa.neon = (cpu_ext == "NEON");
	    cpu_isa.sve  = (cpu_ext == "SVE");
	    cpu_isa.sve2 = (cpu_ext == "SVE2");
	    cpu_isa.fp16 = (data_type == DataType::F16);

	    const auto *selected_impl = CpuAddKernel::get_implementation(CpuAddKernelDataTypeISASelectorData{data_type, cpu_isa, can_use_fixedpoint}, cpu::KernelSelectionType::Preferred);

	    ARM_COMPUTE_ERROR_ON_NULLPTR(selected_impl);

	    // Fix: the logical OR had been escaped as "\|\|", which does not compile.
	    bool qasymm8_any = (data_type == DataType::QASYMM8 || data_type == DataType::QASYMM8_SIGNED);

	    // QASYMM8 / QASYMM8_SIGNED rows with fixed-point allowed expect the "neon_..._add_fixedpoint" name whatever
	    // cpu_ext is; every other row expects "<lower-cased cpu_ext>_<type>_add".
	    std::string expected;
	    if(qasymm8_any && can_use_fixedpoint)
	    {
	        expected = "neon_" + cpu_impl_dt(data_type) + "_add_fixedpoint";
	    }
	    else
	    {
	        expected = lower_string(cpu_ext) + "_" + cpu_impl_dt(data_type) + "_add";
	    }

	    std::string actual = selected_impl->name;

	    ARM_COMPUTE_EXPECT_EQUAL(expected, actual, framework::LogLevel::ERRORS);
	}
	// clang-format on
	// *INDENT-ON*

	// Configures a 15x15 + 15x1 F32 addition and checks that the padding of all three tensors
	// still equals a default-constructed PaddingSize afterwards.
	TEST_CASE(NoPaddingAdded, framework::DatasetMode::PRECOMMIT)
	{
	    const TensorShape full_shape(15U, 15U);
	    const TensorShape row_shape(15U, 1U);

	    Tensor input1 = create_tensor<Tensor>(full_shape, DataType::F32);
	    Tensor input2 = create_tensor<Tensor>(row_shape, DataType::F32);
	    Tensor output = create_tensor<Tensor>(full_shape, DataType::F32);

	    NEArithmeticAddition add;
	    add.configure(&input1, &input2, &output, ConvertPolicy::WRAP);

	    // Same order as the tensors were created: input1, input2, output.
	    const PaddingSize no_padding{};
	    for(const Tensor *tensor : { &input1, &input2, &output })
	    {
	        validate(tensor->info()->padding(), no_padding);
	    }
	}

	TEST_SUITE(Integer)
	TEST_SUITE(U8)
	// PRECOMMIT: datasets::SmallShapes() x DataType::U8 x { SATURATE, WRAP } x OutOfPlaceDataSet.
	FIXTURE_DATA_TEST_CASE(RunSmall, NEArithmeticAdditionFixture<uint8_t>, framework::DatasetMode::PRECOMMIT,
	    combine(combine(combine(
	        datasets::SmallShapes(),
	        framework::dataset::make("DataType", DataType::U8)),
	        framework::dataset::make("ConvertPolicy", { ConvertPolicy::SATURATE, ConvertPolicy::WRAP })),
	        OutOfPlaceDataSet))
	{
	    // Check the fixture's _target, read through an Accessor, against its _reference.
	    const Accessor target_view(_target);
	    validate(target_view, _reference);
	}
	TEST_SUITE_END() // U8

	TEST_SUITE(S16)
	// PRECOMMIT: datasets::SmallShapes() x DataType::S16 x { SATURATE, WRAP } x OutOfPlaceDataSet.
	FIXTURE_DATA_TEST_CASE(RunSmall, NEArithmeticAdditionFixture<int16_t>, framework::DatasetMode::PRECOMMIT,
	    combine(combine(combine(
	        datasets::SmallShapes(),
	        framework::dataset::make("DataType", DataType::S16)),
	        framework::dataset::make("ConvertPolicy", { ConvertPolicy::SATURATE, ConvertPolicy::WRAP })),
	        OutOfPlaceDataSet))
	{
	    // Check the fixture's _target, read through an Accessor, against its _reference.
	    const Accessor target_view(_target);
	    validate(target_view, _reference);
	}

	// NIGHTLY: datasets::LargeShapes() x DataType::S16 x { SATURATE, WRAP } x OutOfPlaceDataSet.
	FIXTURE_DATA_TEST_CASE(RunLarge, NEArithmeticAdditionFixture<int16_t>, framework::DatasetMode::NIGHTLY,
	    combine(combine(combine(
	        datasets::LargeShapes(),
	        framework::dataset::make("DataType", DataType::S16)),
	        framework::dataset::make("ConvertPolicy", { ConvertPolicy::SATURATE, ConvertPolicy::WRAP })),
	        OutOfPlaceDataSet))
	{
	    // Check the fixture's _target, read through an Accessor, against its _reference.
	    const Accessor target_view(_target);
	    validate(target_view, _reference);
	}
	TEST_SUITE_END() // S16

	TEST_SUITE(S32)
	// ALL modes: datasets::SmallShapes() x DataType::S32 x { SATURATE, WRAP } x OutOfPlaceDataSet.
	FIXTURE_DATA_TEST_CASE(RunSmall, NEArithmeticAdditionFixture<int32_t>, framework::DatasetMode::ALL,
	    combine(combine(combine(
	        datasets::SmallShapes(),
	        framework::dataset::make("DataType", DataType::S32)),
	        framework::dataset::make("ConvertPolicy", { ConvertPolicy::SATURATE, ConvertPolicy::WRAP })),
	        OutOfPlaceDataSet))
	{
	    // Check the fixture's _target, read through an Accessor, against its _reference.
	    const Accessor target_view(_target);
	    validate(target_view, _reference);
	}
	TEST_SUITE_END() // S32
	TEST_SUITE_END() // Integer

	TEST_SUITE(Float)
	#ifdef __ARM_FEATURE_FP16_VECTOR_ARITHMETIC
	TEST_SUITE(F16)
	// ALL modes: datasets::SmallShapes() x DataType::F16 x { SATURATE, WRAP } x OutOfPlaceDataSet.
	FIXTURE_DATA_TEST_CASE(RunSmall, NEArithmeticAdditionFixture<half>, framework::DatasetMode::ALL,
	    combine(combine(combine(
	        datasets::SmallShapes(),
	        framework::dataset::make("DataType", DataType::F16)),
	        framework::dataset::make("ConvertPolicy", { ConvertPolicy::SATURATE, ConvertPolicy::WRAP })),
	        OutOfPlaceDataSet))
	{
	    // Check the fixture's _target, read through an Accessor, against its _reference.
	    const Accessor target_view(_target);
	    validate(target_view, _reference);
	}
	TEST_SUITE_END() // F16
	#endif /* __ARM_FEATURE_FP16_VECTOR_ARITHMETIC */

	TEST_SUITE(F32)
	// PRECOMMIT: datasets::SmallShapes() x DataType::F32 x { SATURATE, WRAP } x OutOfPlaceDataSet.
	FIXTURE_DATA_TEST_CASE(RunSmall, NEArithmeticAdditionFixture<float>, framework::DatasetMode::PRECOMMIT,
	    combine(combine(combine(
	        datasets::SmallShapes(),
	        framework::dataset::make("DataType", DataType::F32)),
	        framework::dataset::make("ConvertPolicy", { ConvertPolicy::SATURATE, ConvertPolicy::WRAP })),
	        OutOfPlaceDataSet))
	{
	    // Check the fixture's _target, read through an Accessor, against its _reference.
	    const Accessor target_view(_target);
	    validate(target_view, _reference);
	}

	// NIGHTLY: datasets::LargeShapes() x DataType::F32 x { SATURATE, WRAP } x OutOfPlaceDataSet.
	FIXTURE_DATA_TEST_CASE(RunLarge, NEArithmeticAdditionFixture<float>, framework::DatasetMode::NIGHTLY,
	    combine(combine(combine(
	        datasets::LargeShapes(),
	        framework::dataset::make("DataType", DataType::F32)),
	        framework::dataset::make("ConvertPolicy", { ConvertPolicy::SATURATE, ConvertPolicy::WRAP })),
	        OutOfPlaceDataSet))
	{
	    // Check the fixture's _target, read through an Accessor, against its _reference.
	    const Accessor target_view(_target);
	    validate(target_view, _reference);
	}

	// Alias of ArithmeticAdditionBroadcastValidationFixture bound to Tensor, Accessor and NEArithmeticAddition;
	// used by the broadcast test cases that follow.
	template <typename T>
	using NEArithmeticAdditionBroadcastFixture = ArithmeticAdditionBroadcastValidationFixture<Tensor, Accessor, NEArithmeticAddition, T>;

	// PRECOMMIT: datasets::SmallShapesBroadcast() x DataType::F32 x { SATURATE, WRAP } x OutOfPlaceDataSet.
	FIXTURE_DATA_TEST_CASE(RunSmallBroadcast, NEArithmeticAdditionBroadcastFixture<float>, framework::DatasetMode::PRECOMMIT,
	    combine(combine(combine(
	        datasets::SmallShapesBroadcast(),
	        framework::dataset::make("DataType", DataType::F32)),
	        framework::dataset::make("ConvertPolicy", { ConvertPolicy::SATURATE, ConvertPolicy::WRAP })),
	        OutOfPlaceDataSet))
	{
	    // Check the fixture's _target, read through an Accessor, against its _reference.
	    const Accessor target_view(_target);
	    validate(target_view, _reference);
	}

	// NIGHTLY: datasets::LargeShapesBroadcast() x DataType::F32 x { SATURATE, WRAP } x OutOfPlaceDataSet.
	FIXTURE_DATA_TEST_CASE(RunLargeBroadcast, NEArithmeticAdditionBroadcastFixture<float>, framework::DatasetMode::NIGHTLY,
	    combine(combine(combine(
	        datasets::LargeShapesBroadcast(),
	        framework::dataset::make("DataType", DataType::F32)),
	        framework::dataset::make("ConvertPolicy", { ConvertPolicy::SATURATE, ConvertPolicy::WRAP })),
	        OutOfPlaceDataSet))
	{
	    // Check the fixture's _target, read through an Accessor, against its _reference.
	    const Accessor target_view(_target);
	    validate(target_view, _reference);
	}
	TEST_SUITE_END() // F32
	TEST_SUITE_END() // Float

	// Alias of ArithmeticAdditionValidationQuantizedFixture bound to Tensor, Accessor and NEArithmeticAddition.
	template <typename T>
	using NEArithmeticAdditionQuantizedFixture = ArithmeticAdditionValidationQuantizedFixture<Tensor, Accessor, NEArithmeticAddition, T>;

	// Alias of ArithmeticAdditionValidationQuantizedBroadcastFixture bound to Tensor, Accessor and NEArithmeticAddition.
	template <typename T>
	using NEArithmeticAdditionQuantizedBroadcastFixture = ArithmeticAdditionValidationQuantizedBroadcastFixture<Tensor, Accessor, NEArithmeticAddition, T>;

	TEST_SUITE(Quantized)
	TEST_SUITE(QASYMM8)
	// PRECOMMIT: datasets::SmallShapes() x DataType::QASYMM8 x SATURATE, with one quantization info per operand,
	// combined with OutOfPlaceDataSet.
	FIXTURE_DATA_TEST_CASE(RunSmall, NEArithmeticAdditionQuantizedFixture<uint8_t>, framework::DatasetMode::PRECOMMIT,
	    combine(combine(combine(combine(combine(combine(
	        datasets::SmallShapes(),
	        framework::dataset::make("DataType", DataType::QASYMM8)),
	        framework::dataset::make("ConvertPolicy", { ConvertPolicy::SATURATE })),
	        framework::dataset::make("Src0QInfo", { QuantizationInfo(5.f / 255.f, 20) })),
	        framework::dataset::make("Src1QInfo", { QuantizationInfo(2.f / 255.f, 10) })),
	        framework::dataset::make("OutQInfo", { QuantizationInfo(1.f / 255.f, 5) })),
	        OutOfPlaceDataSet))
	{
	    // Check the fixture's _target against its _reference, allowing tolerance_quant.
	    const Accessor target_view(_target);
	    validate(target_view, _reference, tolerance_quant);
	}
	TEST_SUITE_END() // QASYMM8

	TEST_SUITE(QASYMM8_SIGNED)
	// ALL modes: datasets::SmallShapes() x DataType::QASYMM8_SIGNED x SATURATE, with one quantization info per operand,
	// combined with OutOfPlaceDataSet.
	FIXTURE_DATA_TEST_CASE(RunSmall, NEArithmeticAdditionQuantizedFixture<int8_t>, framework::DatasetMode::ALL,
	    combine(combine(combine(combine(combine(combine(
	        datasets::SmallShapes(),
	        framework::dataset::make("DataType", DataType::QASYMM8_SIGNED)),
	        framework::dataset::make("ConvertPolicy", { ConvertPolicy::SATURATE })),
	        framework::dataset::make("Src0QInfo", { QuantizationInfo(0.5f, 20) })),
	        framework::dataset::make("Src1QInfo", { QuantizationInfo(0.5f, 10) })),
	        framework::dataset::make("OutQInfo", { QuantizationInfo(0.5f, 5) })),
	        OutOfPlaceDataSet))
	{
	    // Check the fixture's _target against its _reference, allowing tolerance_quant.
	    const Accessor target_view(_target);
	    validate(target_view, _reference, tolerance_quant);
	}

	// ALL modes: datasets::SmallShapesBroadcast() x DataType::QASYMM8_SIGNED x SATURATE, with one quantization info
	// per operand, combined with OutOfPlaceDataSet.
	FIXTURE_DATA_TEST_CASE(RunSmallBroadcast, NEArithmeticAdditionQuantizedBroadcastFixture<int8_t>, framework::DatasetMode::ALL,
	    combine(combine(combine(combine(combine(combine(
	        datasets::SmallShapesBroadcast(),
	        framework::dataset::make("DataType", DataType::QASYMM8_SIGNED)),
	        framework::dataset::make("ConvertPolicy", { ConvertPolicy::SATURATE })),
	        framework::dataset::make("Src0QInfo", { QuantizationInfo(0.5f, 20) })),
	        framework::dataset::make("Src1QInfo", { QuantizationInfo(0.5f, 10) })),
	        framework::dataset::make("OutQInfo", { QuantizationInfo(0.5f, 5) })),
	        OutOfPlaceDataSet))
	{
	    // Check the fixture's _target against its _reference, allowing tolerance_quant.
	    const Accessor target_view(_target);
	    validate(target_view, _reference, tolerance_quant);
	}
	TEST_SUITE_END() // QASYMM8_SIGNED

	TEST_SUITE(QSYMM16)
	// PRECOMMIT: datasets::SmallShapes() x DataType::QSYMM16 x SATURATE, with two quantization infos for each input
	// and one for the output, combined with OutOfPlaceDataSet.
	FIXTURE_DATA_TEST_CASE(RunSmall, NEArithmeticAdditionQuantizedFixture<int16_t>, framework::DatasetMode::PRECOMMIT,
	    combine(combine(combine(combine(combine(combine(
	        datasets::SmallShapes(),
	        framework::dataset::make("DataType", DataType::QSYMM16)),
	        framework::dataset::make("ConvertPolicy", { ConvertPolicy::SATURATE })),
	        framework::dataset::make("Src0QInfo", { QuantizationInfo(1.f / 32768.f, 0), QuantizationInfo(5.f / 32768.f, 0) })),
	        framework::dataset::make("Src1QInfo", { QuantizationInfo(2.f / 32768.f, 0), QuantizationInfo(5.f / 32768.f, 0) })),
	        framework::dataset::make("OutQInfo", { QuantizationInfo(5.f / 32768.f, 0) })),
	        OutOfPlaceDataSet))
	{
	    // Check the fixture's _target against its _reference, allowing tolerance_quant.
	    const Accessor target_view(_target);
	    validate(target_view, _reference, tolerance_quant);
	}
	TEST_SUITE_END() // QSYMM16
	TEST_SUITE_END() // Quantized

	TEST_SUITE_END() // ArithmeticAddition
	TEST_SUITE_END() // Neon
	} // namespace validation
	} // namespace test
	} // namespace arm_compute