blob: 166847ed66fc289a3097081f8c7f596b219aa8ff [file] [log] [blame]
/*
 * Copyright (c) 2019-2023 Arm Limited.
 *
 * SPDX-License-Identifier: MIT
 *
 * Permission is hereby granted, free of charge, to any person obtaining a copy
 * of this software and associated documentation files (the "Software"), to
 * deal in the Software without restriction, including without limitation the
 * rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
 * sell copies of the Software, and to permit persons to whom the Software is
 * furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in all
 * copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
 * SOFTWARE.
 */
24#include "arm_compute/core/Types.h"
Matthew Bentham314d3e22023-06-23 10:53:52 +000025#include "arm_compute/core/utils/StringUtils.h"
Usama Arif9e631c22019-05-14 17:10:40 +010026#include "arm_compute/runtime/NEON/functions/NECast.h"
27#include "arm_compute/runtime/Tensor.h"
28#include "arm_compute/runtime/TensorAllocator.h"
Yair Schwarzbaum298b2c02022-02-01 08:55:56 +020029#include "src/common/cpuinfo/CpuIsaInfo.h"
30#include "src/cpu/kernels/CpuCastKernel.h"
Usama Arif9e631c22019-05-14 17:10:40 +010031#include "tests/NEON/Accessor.h"
32#include "tests/PaddingCalculator.h"
33#include "tests/datasets/ConvertPolicyDataset.h"
34#include "tests/datasets/ShapeDatasets.h"
35#include "tests/framework/Asserts.h"
36#include "tests/framework/Macros.h"
37#include "tests/framework/datasets/Datasets.h"
38#include "tests/validation/Validation.h"
39#include "tests/validation/fixtures/CastFixture.h"
Usama Arif9e631c22019-05-14 17:10:40 +010040namespace arm_compute
41{
42namespace test
43{
44namespace validation
45{
46namespace
47{
48// Tolerance
49constexpr AbsoluteTolerance<float> one_tolerance(1);
50constexpr AbsoluteTolerance<float> zero_tolerance(0);
51
/*
 * The cast under test ignores the scale and zero point of quantized tensors,
 * so QASYMM8 input is treated as plain uint8 values.
 */
55
56/** Input data sets **/
Luca Foschianidaa3aba2020-01-08 15:55:08 +000057
58// QASYMM8_SIGNED
59const auto CastQASYMM8_SIGNEDtoS16Dataset = combine(framework::dataset::make("DataType", DataType::QASYMM8_SIGNED), framework::dataset::make("DataType", DataType::S16));
60const auto CastQASYMM8_SIGNEDtoS32Dataset = combine(framework::dataset::make("DataType", DataType::QASYMM8_SIGNED), framework::dataset::make("DataType", DataType::S32));
61const auto CastQASYMM8_SIGNEDtoF32Dataset = combine(framework::dataset::make("DataType", DataType::QASYMM8_SIGNED), framework::dataset::make("DataType", DataType::F32));
62const auto CastQASYMM8_SIGNEDtoF16Dataset = combine(framework::dataset::make("DataType", DataType::QASYMM8_SIGNED), framework::dataset::make("DataType", DataType::F16));
63
Usama Arif9e631c22019-05-14 17:10:40 +010064// QASYMM8
Luca Foschianidaa3aba2020-01-08 15:55:08 +000065const auto CastQASYMM8toF16Dataset = combine(framework::dataset::make("DataType", DataType::QASYMM8), framework::dataset::make("DataType", DataType::F16));
66const auto CastQASYMM8toF32Dataset = combine(framework::dataset::make("DataType", DataType::QASYMM8), framework::dataset::make("DataType", DataType::F32));
67const auto CastQASYMM8toS32Dataset = combine(framework::dataset::make("DataType", DataType::QASYMM8), framework::dataset::make("DataType", DataType::S32));
Usama Arif9e631c22019-05-14 17:10:40 +010068
69// U8
70const auto CastU8toU16Dataset = combine(framework::dataset::make("DataType", DataType::U8), framework::dataset::make("DataType", DataType::U16));
71const auto CastU8toS16Dataset = combine(framework::dataset::make("DataType", DataType::U8), framework::dataset::make("DataType", DataType::S16));
72const auto CastU8toS32Dataset = combine(framework::dataset::make("DataType", DataType::U8), framework::dataset::make("DataType", DataType::S32));
73const auto CastU8toF32Dataset = combine(framework::dataset::make("DataType", DataType::U8), framework::dataset::make("DataType", DataType::F32));
74
75// U16
76const auto CastU16toU8Dataset = combine(framework::dataset::make("DataType", DataType::U16), framework::dataset::make("DataType", DataType::U8));
77const auto CastU16toU32Dataset = combine(framework::dataset::make("DataType", DataType::U16), framework::dataset::make("DataType", DataType::U32));
78
79// S16
Luca Foschianidaa3aba2020-01-08 15:55:08 +000080const auto CastS16toQASYMM8_SIGNEDDataset = combine(framework::dataset::make("DataType", DataType::S16), framework::dataset::make("DataType", DataType::QASYMM8_SIGNED));
81const auto CastS16toU8Dataset = combine(framework::dataset::make("DataType", DataType::S16), framework::dataset::make("DataType", DataType::U8));
82const auto CastS16toS32Dataset = combine(framework::dataset::make("DataType", DataType::S16), framework::dataset::make("DataType", DataType::S32));
Usama Arif9e631c22019-05-14 17:10:40 +010083
84//S32
Luca Foschianidaa3aba2020-01-08 15:55:08 +000085const auto CastS32toF16Dataset = combine(framework::dataset::make("DataType", DataType::S32), framework::dataset::make("DataType", DataType::F16));
86const auto CastS32toU8Dataset = combine(framework::dataset::make("DataType", DataType::S32), framework::dataset::make("DataType", DataType::U8));
87const auto CastS32toF32Dataset = combine(framework::dataset::make("DataType", DataType::S32), framework::dataset::make("DataType", DataType::F32));
88const auto CastS32toQASYMM8Dataset = combine(framework::dataset::make("DataType", DataType::S32), framework::dataset::make("DataType", DataType::QASYMM8));
89const auto CastS32toQASYMM8_SIGNEDDataset = combine(framework::dataset::make("DataType", DataType::S32), framework::dataset::make("DataType", DataType::QASYMM8_SIGNED));
Usama Arif9e631c22019-05-14 17:10:40 +010090
91// F16
Luca Foschianidaa3aba2020-01-08 15:55:08 +000092const auto CastF16toF32Dataset = combine(framework::dataset::make("DataType", DataType::F16), framework::dataset::make("DataType", DataType::F32));
93const auto CastF16toS32Dataset = combine(framework::dataset::make("DataType", DataType::F16), framework::dataset::make("DataType", DataType::S32));
94const auto CastF16toQASYMM8Dataset = combine(framework::dataset::make("DataType", DataType::F16), framework::dataset::make("DataType", DataType::QASYMM8));
95const auto CastF16toQASYMM8_SIGNEDDataset = combine(framework::dataset::make("DataType", DataType::F16), framework::dataset::make("DataType", DataType::QASYMM8_SIGNED));
Usama Arif9e631c22019-05-14 17:10:40 +010096
97// F32
Luca Foschianidaa3aba2020-01-08 15:55:08 +000098const auto CastF32toU8Dataset = combine(framework::dataset::make("DataType", DataType::F32), framework::dataset::make("DataType", DataType::U8));
99const auto CastF32toF16Dataset = combine(framework::dataset::make("DataType", DataType::F32), framework::dataset::make("DataType", DataType::F16));
100const auto CastF32toS32Dataset = combine(framework::dataset::make("DataType", DataType::F32), framework::dataset::make("DataType", DataType::S32));
101const auto CastF32toQASYMM8Dataset = combine(framework::dataset::make("DataType", DataType::F32), framework::dataset::make("DataType", DataType::QASYMM8));
102const auto CastF32toQASYMM8_SIGNEDDataset = combine(framework::dataset::make("DataType", DataType::F32), framework::dataset::make("DataType", DataType::QASYMM8_SIGNED));
Usama Arif9e631c22019-05-14 17:10:40 +0100103
104} // namespace
105
106TEST_SUITE(NEON)
107TEST_SUITE(Cast)
108template <typename T>
109using NECastToU8Fixture = CastValidationFixture<Tensor, Accessor, NECast, T, uint8_t>;
110template <typename T>
111using NECastToU16Fixture = CastValidationFixture<Tensor, Accessor, NECast, T, uint16_t>;
112template <typename T>
113using NECastToS16Fixture = CastValidationFixture<Tensor, Accessor, NECast, T, int16_t>;
114template <typename T>
115using NECastToU32Fixture = CastValidationFixture<Tensor, Accessor, NECast, T, uint32_t>;
116template <typename T>
117using NECastToS32Fixture = CastValidationFixture<Tensor, Accessor, NECast, T, int32_t>;
118template <typename T>
119using NECastToF16Fixture = CastValidationFixture<Tensor, Accessor, NECast, T, half>;
120template <typename T>
121using NECastToF32Fixture = CastValidationFixture<Tensor, Accessor, NECast, T, float>;
122template <typename T>
123using NECastToQASYMM8Fixture = CastValidationFixture<Tensor, Accessor, NECast, T, uint8_t>;
Luca Foschianidaa3aba2020-01-08 15:55:08 +0000124template <typename T>
125using NECastToQASYMM8_SIGNEDFixture = CastValidationFixture<Tensor, Accessor, NECast, T, int8_t>;
Usama Arif9e631c22019-05-14 17:10:40 +0100126
/** Declares a test suite NAME containing a single RunSmall precommit case.
 *
 * The case runs fixture `type` over the combination of datasets::SmallShapes(),
 * `dataset` and datasets::ConvertPolicies(), then validates the fixture's
 * target against its reference using `tolerance`.
 *
 * @note `idt` and `odt` are not referenced by the expansion. The data types
 *       actually exercised are determined by `type` and `dataset`, so those
 *       two arguments must agree with the suite name.
 */
#define CAST_SUITE(NAME, idt, odt, type, dataset, tolerance) \
    TEST_SUITE(NAME) \
    FIXTURE_DATA_TEST_CASE(RunSmall, type, framework::DatasetMode::PRECOMMIT, combine(combine(datasets::SmallShapes(), dataset), \
                                                                                      datasets::ConvertPolicies())) \
    { \
        validate(Accessor(_target), _reference, tolerance); \
    } \
    TEST_SUITE_END()
135
Luca Foschianidaa3aba2020-01-08 15:55:08 +0000136//QASYMM8_SIGNED
137CAST_SUITE(QASYMM8_SIGNED_to_S16, DataType::QASYMM8_SIGNED, DataType::S16, NECastToS16Fixture<int8_t>, CastQASYMM8_SIGNEDtoS16Dataset, one_tolerance)
138CAST_SUITE(QASYMM8_SIGNED_to_S32, DataType::QASYMM8_SIGNED, DataType::S32, NECastToS32Fixture<int8_t>, CastQASYMM8_SIGNEDtoS32Dataset, one_tolerance)
139CAST_SUITE(QASYMM8_SIGNED_to_F32, DataType::QASYMM8_SIGNED, DataType::F32, NECastToF32Fixture<int8_t>, CastQASYMM8_SIGNEDtoF32Dataset, one_tolerance)
140#ifdef __ARM_FEATURE_FP16_VECTOR_ARITHMETIC
141CAST_SUITE(QASYMM8_SIGNED_to_F16, DataType::QASYMM8_SIGNED, DataType::F16, NECastToF16Fixture<int8_t>, CastQASYMM8_SIGNEDtoF16Dataset, one_tolerance)
142#endif // __ARM_FEATURE_FP16_VECTOR_ARITHMETIC
143
Usama Arif9e631c22019-05-14 17:10:40 +0100144//QASYMM8
145#ifdef __ARM_FEATURE_FP16_VECTOR_ARITHMETIC
146CAST_SUITE(QASYMM8_to_F16, DataType::QASYMM8, DataType::F16, NECastToF16Fixture<uint8_t>, CastQASYMM8toF16Dataset, one_tolerance)
147#endif // __ARM_FEATURE_FP16_VECTOR_ARITHMETIC
148CAST_SUITE(QASYMM8_to_F32, DataType::QASYMM8, DataType::F32, NECastToF32Fixture<uint8_t>, CastQASYMM8toF32Dataset, one_tolerance)
149CAST_SUITE(QASYMM8_to_S32, DataType::QASYMM8, DataType::S32, NECastToS32Fixture<uint8_t>, CastQASYMM8toS32Dataset, one_tolerance)
150
151// U8
152CAST_SUITE(U8_to_U16, DataType::U8, DataType::U16, NECastToU16Fixture<uint8_t>, CastU8toU16Dataset, zero_tolerance)
153CAST_SUITE(U8_to_S16, DataType::U8, DataType::S16, NECastToS16Fixture<uint8_t>, CastU8toS16Dataset, zero_tolerance)
154CAST_SUITE(U8_to_S32, DataType::U8, DataType::S32, NECastToS32Fixture<uint8_t>, CastU8toS32Dataset, zero_tolerance)
155CAST_SUITE(U8_to_F32, DataType::U8, DataType::F32, NECastToF32Fixture<uint8_t>, CastU8toF32Dataset, zero_tolerance)
156
157// U16
158CAST_SUITE(U16_to_U8, DataType::U16, DataType::U8, NECastToU8Fixture<uint16_t>, CastU16toU8Dataset, zero_tolerance)
159CAST_SUITE(U16_to_U32, DataType::U16, DataType::U32, NECastToU32Fixture<uint16_t>, CastU16toU32Dataset, zero_tolerance)
160
161// S16
Luca Foschianidaa3aba2020-01-08 15:55:08 +0000162CAST_SUITE(S16_to_QASYMM8_SIGNED, DataType::S16, DataType::QASYMM8_SIGNED, NECastToQASYMM8_SIGNEDFixture<int16_t>, CastS16toQASYMM8_SIGNEDDataset, zero_tolerance)
Usama Arif9e631c22019-05-14 17:10:40 +0100163CAST_SUITE(S16_to_U8, DataType::S16, DataType::U8, NECastToU8Fixture<int16_t>, CastS16toU8Dataset, zero_tolerance)
164CAST_SUITE(S16_to_S32, DataType::S16, DataType::S32, NECastToS32Fixture<int16_t>, CastS16toS32Dataset, zero_tolerance)
165
166// S32
Luca Foschianidaa3aba2020-01-08 15:55:08 +0000167CAST_SUITE(S32_to_QASYMM8_SIGNED, DataType::S32, DataType::QASYMM8_SIGNED, NECastToQASYMM8_SIGNEDFixture<int32_t>, CastS32toQASYMM8_SIGNEDDataset, one_tolerance)
Usama Arif9e631c22019-05-14 17:10:40 +0100168CAST_SUITE(S32_to_QASYMM8, DataType::S32, DataType::QASYMM8, NECastToQASYMM8Fixture<int32_t>, CastS32toQASYMM8Dataset, one_tolerance)
169#ifdef __ARM_FEATURE_FP16_VECTOR_ARITHMETIC
170CAST_SUITE(S32_to_F16, DataType::S32, DataType::F16, NECastToF16Fixture<int32_t>, CastS32toF16Dataset, zero_tolerance)
171#endif // __ARM_FEATURE_FP16_VECTOR_ARITHMETIC
172CAST_SUITE(S32_to_F32, DataType::S32, DataType::F32, NECastToF32Fixture<int32_t>, CastS32toF32Dataset, one_tolerance)
173CAST_SUITE(S32_to_U8, DataType::S32, DataType::U8, NECastToU8Fixture<int32_t>, CastS32toU8Dataset, one_tolerance)
174
175// F16
176#ifdef __ARM_FEATURE_FP16_VECTOR_ARITHMETIC
Luca Foschianidaa3aba2020-01-08 15:55:08 +0000177CAST_SUITE(F16_to_QASYMM8_SIGNED, DataType::F16, DataType::QASYMM8_SIGNED, NECastToQASYMM8_SIGNEDFixture<half>, CastF16toQASYMM8_SIGNEDDataset, one_tolerance)
Usama Arif9e631c22019-05-14 17:10:40 +0100178CAST_SUITE(F16_to_QASYMM8, DataType::F16, DataType::QASYMM8, NECastToQASYMM8Fixture<half>, CastF16toQASYMM8Dataset, one_tolerance)
179CAST_SUITE(F16_to_F32, DataType::F16, DataType::F32, NECastToF32Fixture<half>, CastF16toF32Dataset, zero_tolerance)
180CAST_SUITE(F16_to_S32, DataType::F16, DataType::S32, NECastToS32Fixture<half>, CastF16toS32Dataset, one_tolerance)
181#endif // __ARM_FEATURE_FP16_VECTOR_ARITHMETIC
182
183// F32
Luca Foschianidaa3aba2020-01-08 15:55:08 +0000184CAST_SUITE(F32_to_QASYMM8_SIGNED, DataType::F32, DataType::QASYMM8_SIGNED, NECastToQASYMM8_SIGNEDFixture<float>, CastF32toQASYMM8_SIGNEDDataset, one_tolerance)
Usama Arif9e631c22019-05-14 17:10:40 +0100185CAST_SUITE(F32_to_QASYMM8, DataType::F32, DataType::QASYMM8, NECastToQASYMM8Fixture<float>, CastF32toQASYMM8Dataset, one_tolerance)
186#ifdef __ARM_FEATURE_FP16_VECTOR_ARITHMETIC
187CAST_SUITE(F32_to_F16, DataType::F32, DataType::F16, NECastToF16Fixture<float>, CastF32toF16Dataset, zero_tolerance)
188#endif // __ARM_FEATURE_FP16_VECTOR_ARITHMETIC
189CAST_SUITE(F32_to_S32, DataType::F32, DataType::S32, NECastToS32Fixture<float>, CastF32toS32Dataset, one_tolerance)
190CAST_SUITE(F32_to_U8, DataType::F32, DataType::S32, NECastToS32Fixture<float>, CastF32toS32Dataset, one_tolerance)
191
Yair Schwarzbaum298b2c02022-02-01 08:55:56 +0200192DATA_TEST_CASE(KernelSelectionDstFP16, framework::DatasetMode::ALL,
193 combine(framework::dataset::make("CpuExt", std::string("NEON")),
194 framework::dataset::make("DataType",
195{
196 DataType::F16,
197 DataType::U8,
198 DataType::S32,
199 DataType::QASYMM8,
200 DataType::QASYMM8_SIGNED,
201 DataType::BFLOAT16,
202})),
203cpu_ext, data_type)
204{
205 using namespace cpu::kernels;
206 const CpuCastKernel::CastKernel *selected_impl;
207
208 cpuinfo::CpuIsaInfo cpu_isa{};
209 cpu_isa.neon = (cpu_ext == "NEON");
210
211 cpu_isa.bf16 = (data_type == DataType::BFLOAT16);
212
213 /* bf16 cast is different from all the others being converted to fp32 and not to fp16 */
214 if(cpu_isa.bf16)
215 {
216 cpu_isa.fp16 = false;
217 selected_impl = CpuCastKernel::get_implementation(CastDataTypeISASelectorData{ data_type, DataType::F32, cpu_isa }, cpu::KernelSelectionType::Preferred);
218 }
219 else
220 {
221 cpu_isa.fp16 = true;
222 selected_impl = CpuCastKernel::get_implementation(CastDataTypeISASelectorData{ data_type, DataType::F16, cpu_isa }, cpu::KernelSelectionType::Preferred);
223 }
224
225 ARM_COMPUTE_ERROR_ON_NULLPTR(selected_impl);
226
227 std::string expected = lower_string(cpu_ext) + "_" + cpu_impl_dt(data_type) + "_cast";
228 std::string actual = selected_impl->name;
229
230 ARM_COMPUTE_EXPECT_EQUAL(expected, actual, framework::LogLevel::ERRORS);
231}
232
233DATA_TEST_CASE(KernelSelectionSrcFP32, framework::DatasetMode::ALL,
234 combine(framework::dataset::make("CpuExt", std::string("NEON")),
235 framework::dataset::make("DataType",
236{
237 DataType::F16,
238 DataType::BFLOAT16,
239})),
240cpu_ext, data_type)
241{
242 using namespace cpu::kernels;
243
244 cpuinfo::CpuIsaInfo cpu_isa{};
245 cpu_isa.neon = (cpu_ext == "NEON");
246 cpu_isa.fp16 = (data_type == DataType::F16);
247 cpu_isa.bf16 = (data_type == DataType::BFLOAT16);
248
249 const auto *selected_impl = CpuCastKernel::get_implementation(CastDataTypeISASelectorData{ DataType::F32, data_type, cpu_isa }, cpu::KernelSelectionType::Preferred);
250
251 ARM_COMPUTE_ERROR_ON_NULLPTR(selected_impl);
252
253 std::string expected = lower_string(cpu_ext) + "_fp32_to_" + cpu_impl_dt(data_type) + "_cast";
254 std::string actual = selected_impl->name;
255
256 ARM_COMPUTE_EXPECT_EQUAL(expected, actual, framework::LogLevel::ERRORS);
257}
258
Usama Arif9e631c22019-05-14 17:10:40 +0100259TEST_SUITE_END() // Cast
Sheri Zhangac6499a2021-02-10 15:32:38 +0000260TEST_SUITE_END() // Neon
Usama Arif9e631c22019-05-14 17:10:40 +0100261} // namespace validation
262} // namespace test
263} // namespace arm_compute