blob: 3a77106a42f241c5120e3c12d27b5ec378d8ec91 [file] [log] [blame]
Usama Arif9e631c22019-05-14 17:10:40 +01001/*
Yair Schwarzbaum298b2c02022-02-01 08:55:56 +02002 * Copyright (c) 2019-2022 Arm Limited.
Usama Arif9e631c22019-05-14 17:10:40 +01003 *
4 * SPDX-License-Identifier: MIT
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a copy
7 * of this software and associated documentation files (the "Software"), to
8 * deal in the Software without restriction, including without limitation the
9 * rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
10 * sell copies of the Software, and to permit persons to whom the Software is
11 * furnished to do so, subject to the following conditions:
12 *
13 * The above copyright notice and this permission notice shall be included in all
14 * copies or substantial portions of the Software.
15 *
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
19 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
21 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
22 * SOFTWARE.
23 */
24#include "arm_compute/core/Types.h"
25#include "arm_compute/runtime/NEON/functions/NECast.h"
26#include "arm_compute/runtime/Tensor.h"
27#include "arm_compute/runtime/TensorAllocator.h"
Yair Schwarzbaum298b2c02022-02-01 08:55:56 +020028#include "src/common/cpuinfo/CpuIsaInfo.h"
29#include "src/cpu/kernels/CpuCastKernel.h"
Usama Arif9e631c22019-05-14 17:10:40 +010030#include "tests/NEON/Accessor.h"
31#include "tests/PaddingCalculator.h"
32#include "tests/datasets/ConvertPolicyDataset.h"
33#include "tests/datasets/ShapeDatasets.h"
34#include "tests/framework/Asserts.h"
35#include "tests/framework/Macros.h"
36#include "tests/framework/datasets/Datasets.h"
37#include "tests/validation/Validation.h"
38#include "tests/validation/fixtures/CastFixture.h"
Usama Arif9e631c22019-05-14 17:10:40 +010039namespace arm_compute
40{
41namespace test
42{
43namespace validation
44{
45namespace
46{
47// Tolerance
48constexpr AbsoluteTolerance<float> one_tolerance(1);
49constexpr AbsoluteTolerance<float> zero_tolerance(0);
50
/*
 * This function ignores the scale and zero point of quantized tensors, so QASYMM8 input is treated as uint8 values.
 */
54
55/** Input data sets **/
Luca Foschianidaa3aba2020-01-08 15:55:08 +000056
57// QASYMM8_SIGNED
58const auto CastQASYMM8_SIGNEDtoS16Dataset = combine(framework::dataset::make("DataType", DataType::QASYMM8_SIGNED), framework::dataset::make("DataType", DataType::S16));
59const auto CastQASYMM8_SIGNEDtoS32Dataset = combine(framework::dataset::make("DataType", DataType::QASYMM8_SIGNED), framework::dataset::make("DataType", DataType::S32));
60const auto CastQASYMM8_SIGNEDtoF32Dataset = combine(framework::dataset::make("DataType", DataType::QASYMM8_SIGNED), framework::dataset::make("DataType", DataType::F32));
61const auto CastQASYMM8_SIGNEDtoF16Dataset = combine(framework::dataset::make("DataType", DataType::QASYMM8_SIGNED), framework::dataset::make("DataType", DataType::F16));
62
Usama Arif9e631c22019-05-14 17:10:40 +010063// QASYMM8
Luca Foschianidaa3aba2020-01-08 15:55:08 +000064const auto CastQASYMM8toF16Dataset = combine(framework::dataset::make("DataType", DataType::QASYMM8), framework::dataset::make("DataType", DataType::F16));
65const auto CastQASYMM8toF32Dataset = combine(framework::dataset::make("DataType", DataType::QASYMM8), framework::dataset::make("DataType", DataType::F32));
66const auto CastQASYMM8toS32Dataset = combine(framework::dataset::make("DataType", DataType::QASYMM8), framework::dataset::make("DataType", DataType::S32));
Usama Arif9e631c22019-05-14 17:10:40 +010067
68// U8
69const auto CastU8toU16Dataset = combine(framework::dataset::make("DataType", DataType::U8), framework::dataset::make("DataType", DataType::U16));
70const auto CastU8toS16Dataset = combine(framework::dataset::make("DataType", DataType::U8), framework::dataset::make("DataType", DataType::S16));
71const auto CastU8toS32Dataset = combine(framework::dataset::make("DataType", DataType::U8), framework::dataset::make("DataType", DataType::S32));
72const auto CastU8toF32Dataset = combine(framework::dataset::make("DataType", DataType::U8), framework::dataset::make("DataType", DataType::F32));
73
74// U16
75const auto CastU16toU8Dataset = combine(framework::dataset::make("DataType", DataType::U16), framework::dataset::make("DataType", DataType::U8));
76const auto CastU16toU32Dataset = combine(framework::dataset::make("DataType", DataType::U16), framework::dataset::make("DataType", DataType::U32));
77
78// S16
Luca Foschianidaa3aba2020-01-08 15:55:08 +000079const auto CastS16toQASYMM8_SIGNEDDataset = combine(framework::dataset::make("DataType", DataType::S16), framework::dataset::make("DataType", DataType::QASYMM8_SIGNED));
80const auto CastS16toU8Dataset = combine(framework::dataset::make("DataType", DataType::S16), framework::dataset::make("DataType", DataType::U8));
81const auto CastS16toS32Dataset = combine(framework::dataset::make("DataType", DataType::S16), framework::dataset::make("DataType", DataType::S32));
Usama Arif9e631c22019-05-14 17:10:40 +010082
83//S32
Luca Foschianidaa3aba2020-01-08 15:55:08 +000084const auto CastS32toF16Dataset = combine(framework::dataset::make("DataType", DataType::S32), framework::dataset::make("DataType", DataType::F16));
85const auto CastS32toU8Dataset = combine(framework::dataset::make("DataType", DataType::S32), framework::dataset::make("DataType", DataType::U8));
86const auto CastS32toF32Dataset = combine(framework::dataset::make("DataType", DataType::S32), framework::dataset::make("DataType", DataType::F32));
87const auto CastS32toQASYMM8Dataset = combine(framework::dataset::make("DataType", DataType::S32), framework::dataset::make("DataType", DataType::QASYMM8));
88const auto CastS32toQASYMM8_SIGNEDDataset = combine(framework::dataset::make("DataType", DataType::S32), framework::dataset::make("DataType", DataType::QASYMM8_SIGNED));
Usama Arif9e631c22019-05-14 17:10:40 +010089
90// F16
Luca Foschianidaa3aba2020-01-08 15:55:08 +000091const auto CastF16toF32Dataset = combine(framework::dataset::make("DataType", DataType::F16), framework::dataset::make("DataType", DataType::F32));
92const auto CastF16toS32Dataset = combine(framework::dataset::make("DataType", DataType::F16), framework::dataset::make("DataType", DataType::S32));
93const auto CastF16toQASYMM8Dataset = combine(framework::dataset::make("DataType", DataType::F16), framework::dataset::make("DataType", DataType::QASYMM8));
94const auto CastF16toQASYMM8_SIGNEDDataset = combine(framework::dataset::make("DataType", DataType::F16), framework::dataset::make("DataType", DataType::QASYMM8_SIGNED));
Usama Arif9e631c22019-05-14 17:10:40 +010095
96// F32
Luca Foschianidaa3aba2020-01-08 15:55:08 +000097const auto CastF32toU8Dataset = combine(framework::dataset::make("DataType", DataType::F32), framework::dataset::make("DataType", DataType::U8));
98const auto CastF32toF16Dataset = combine(framework::dataset::make("DataType", DataType::F32), framework::dataset::make("DataType", DataType::F16));
99const auto CastF32toS32Dataset = combine(framework::dataset::make("DataType", DataType::F32), framework::dataset::make("DataType", DataType::S32));
100const auto CastF32toQASYMM8Dataset = combine(framework::dataset::make("DataType", DataType::F32), framework::dataset::make("DataType", DataType::QASYMM8));
101const auto CastF32toQASYMM8_SIGNEDDataset = combine(framework::dataset::make("DataType", DataType::F32), framework::dataset::make("DataType", DataType::QASYMM8_SIGNED));
Usama Arif9e631c22019-05-14 17:10:40 +0100102
103} // namespace
104
105TEST_SUITE(NEON)
106TEST_SUITE(Cast)
107template <typename T>
108using NECastToU8Fixture = CastValidationFixture<Tensor, Accessor, NECast, T, uint8_t>;
109template <typename T>
110using NECastToU16Fixture = CastValidationFixture<Tensor, Accessor, NECast, T, uint16_t>;
111template <typename T>
112using NECastToS16Fixture = CastValidationFixture<Tensor, Accessor, NECast, T, int16_t>;
113template <typename T>
114using NECastToU32Fixture = CastValidationFixture<Tensor, Accessor, NECast, T, uint32_t>;
115template <typename T>
116using NECastToS32Fixture = CastValidationFixture<Tensor, Accessor, NECast, T, int32_t>;
117template <typename T>
118using NECastToF16Fixture = CastValidationFixture<Tensor, Accessor, NECast, T, half>;
119template <typename T>
120using NECastToF32Fixture = CastValidationFixture<Tensor, Accessor, NECast, T, float>;
121template <typename T>
122using NECastToQASYMM8Fixture = CastValidationFixture<Tensor, Accessor, NECast, T, uint8_t>;
Luca Foschianidaa3aba2020-01-08 15:55:08 +0000123template <typename T>
124using NECastToQASYMM8_SIGNEDFixture = CastValidationFixture<Tensor, Accessor, NECast, T, int8_t>;
Usama Arif9e631c22019-05-14 17:10:40 +0100125
/** Declare a test suite containing a single PRECOMMIT "RunSmall" fixture test case.
 *
 * The case runs over SmallShapes x dataset x ConvertPolicies and validates the
 * fixture's target output against its reference output.
 *
 * NAME      - name of the generated test suite
 * idt, odt  - input/output data types; not used by the expansion, they only
 *             annotate the call site
 * type      - fixture type used for the test case
 * dataset   - dataset combined with the shapes and convert policies
 * tolerance - tolerance forwarded to validate()
 */
#define CAST_SUITE(NAME, idt, odt, type, dataset, tolerance)                      \
    TEST_SUITE(NAME)                                                              \
    FIXTURE_DATA_TEST_CASE(RunSmall, type, framework::DatasetMode::PRECOMMIT,     \
                           combine(combine(datasets::SmallShapes(), dataset),     \
                                   datasets::ConvertPolicies()))                  \
    {                                                                             \
        validate(Accessor(_target), _reference, tolerance);                       \
    }                                                                             \
    TEST_SUITE_END()
134
Luca Foschianidaa3aba2020-01-08 15:55:08 +0000135//QASYMM8_SIGNED
136CAST_SUITE(QASYMM8_SIGNED_to_S16, DataType::QASYMM8_SIGNED, DataType::S16, NECastToS16Fixture<int8_t>, CastQASYMM8_SIGNEDtoS16Dataset, one_tolerance)
137CAST_SUITE(QASYMM8_SIGNED_to_S32, DataType::QASYMM8_SIGNED, DataType::S32, NECastToS32Fixture<int8_t>, CastQASYMM8_SIGNEDtoS32Dataset, one_tolerance)
138CAST_SUITE(QASYMM8_SIGNED_to_F32, DataType::QASYMM8_SIGNED, DataType::F32, NECastToF32Fixture<int8_t>, CastQASYMM8_SIGNEDtoF32Dataset, one_tolerance)
139#ifdef __ARM_FEATURE_FP16_VECTOR_ARITHMETIC
140CAST_SUITE(QASYMM8_SIGNED_to_F16, DataType::QASYMM8_SIGNED, DataType::F16, NECastToF16Fixture<int8_t>, CastQASYMM8_SIGNEDtoF16Dataset, one_tolerance)
141#endif // __ARM_FEATURE_FP16_VECTOR_ARITHMETIC
142
Usama Arif9e631c22019-05-14 17:10:40 +0100143//QASYMM8
144#ifdef __ARM_FEATURE_FP16_VECTOR_ARITHMETIC
145CAST_SUITE(QASYMM8_to_F16, DataType::QASYMM8, DataType::F16, NECastToF16Fixture<uint8_t>, CastQASYMM8toF16Dataset, one_tolerance)
146#endif // __ARM_FEATURE_FP16_VECTOR_ARITHMETIC
147CAST_SUITE(QASYMM8_to_F32, DataType::QASYMM8, DataType::F32, NECastToF32Fixture<uint8_t>, CastQASYMM8toF32Dataset, one_tolerance)
148CAST_SUITE(QASYMM8_to_S32, DataType::QASYMM8, DataType::S32, NECastToS32Fixture<uint8_t>, CastQASYMM8toS32Dataset, one_tolerance)
149
150// U8
151CAST_SUITE(U8_to_U16, DataType::U8, DataType::U16, NECastToU16Fixture<uint8_t>, CastU8toU16Dataset, zero_tolerance)
152CAST_SUITE(U8_to_S16, DataType::U8, DataType::S16, NECastToS16Fixture<uint8_t>, CastU8toS16Dataset, zero_tolerance)
153CAST_SUITE(U8_to_S32, DataType::U8, DataType::S32, NECastToS32Fixture<uint8_t>, CastU8toS32Dataset, zero_tolerance)
154CAST_SUITE(U8_to_F32, DataType::U8, DataType::F32, NECastToF32Fixture<uint8_t>, CastU8toF32Dataset, zero_tolerance)
155
156// U16
157CAST_SUITE(U16_to_U8, DataType::U16, DataType::U8, NECastToU8Fixture<uint16_t>, CastU16toU8Dataset, zero_tolerance)
158CAST_SUITE(U16_to_U32, DataType::U16, DataType::U32, NECastToU32Fixture<uint16_t>, CastU16toU32Dataset, zero_tolerance)
159
160// S16
Luca Foschianidaa3aba2020-01-08 15:55:08 +0000161CAST_SUITE(S16_to_QASYMM8_SIGNED, DataType::S16, DataType::QASYMM8_SIGNED, NECastToQASYMM8_SIGNEDFixture<int16_t>, CastS16toQASYMM8_SIGNEDDataset, zero_tolerance)
Usama Arif9e631c22019-05-14 17:10:40 +0100162CAST_SUITE(S16_to_U8, DataType::S16, DataType::U8, NECastToU8Fixture<int16_t>, CastS16toU8Dataset, zero_tolerance)
163CAST_SUITE(S16_to_S32, DataType::S16, DataType::S32, NECastToS32Fixture<int16_t>, CastS16toS32Dataset, zero_tolerance)
164
165// S32
Luca Foschianidaa3aba2020-01-08 15:55:08 +0000166CAST_SUITE(S32_to_QASYMM8_SIGNED, DataType::S32, DataType::QASYMM8_SIGNED, NECastToQASYMM8_SIGNEDFixture<int32_t>, CastS32toQASYMM8_SIGNEDDataset, one_tolerance)
Usama Arif9e631c22019-05-14 17:10:40 +0100167CAST_SUITE(S32_to_QASYMM8, DataType::S32, DataType::QASYMM8, NECastToQASYMM8Fixture<int32_t>, CastS32toQASYMM8Dataset, one_tolerance)
168#ifdef __ARM_FEATURE_FP16_VECTOR_ARITHMETIC
169CAST_SUITE(S32_to_F16, DataType::S32, DataType::F16, NECastToF16Fixture<int32_t>, CastS32toF16Dataset, zero_tolerance)
170#endif // __ARM_FEATURE_FP16_VECTOR_ARITHMETIC
171CAST_SUITE(S32_to_F32, DataType::S32, DataType::F32, NECastToF32Fixture<int32_t>, CastS32toF32Dataset, one_tolerance)
172CAST_SUITE(S32_to_U8, DataType::S32, DataType::U8, NECastToU8Fixture<int32_t>, CastS32toU8Dataset, one_tolerance)
173
174// F16
175#ifdef __ARM_FEATURE_FP16_VECTOR_ARITHMETIC
Luca Foschianidaa3aba2020-01-08 15:55:08 +0000176CAST_SUITE(F16_to_QASYMM8_SIGNED, DataType::F16, DataType::QASYMM8_SIGNED, NECastToQASYMM8_SIGNEDFixture<half>, CastF16toQASYMM8_SIGNEDDataset, one_tolerance)
Usama Arif9e631c22019-05-14 17:10:40 +0100177CAST_SUITE(F16_to_QASYMM8, DataType::F16, DataType::QASYMM8, NECastToQASYMM8Fixture<half>, CastF16toQASYMM8Dataset, one_tolerance)
178CAST_SUITE(F16_to_F32, DataType::F16, DataType::F32, NECastToF32Fixture<half>, CastF16toF32Dataset, zero_tolerance)
179CAST_SUITE(F16_to_S32, DataType::F16, DataType::S32, NECastToS32Fixture<half>, CastF16toS32Dataset, one_tolerance)
180#endif // __ARM_FEATURE_FP16_VECTOR_ARITHMETIC
181
182// F32
Luca Foschianidaa3aba2020-01-08 15:55:08 +0000183CAST_SUITE(F32_to_QASYMM8_SIGNED, DataType::F32, DataType::QASYMM8_SIGNED, NECastToQASYMM8_SIGNEDFixture<float>, CastF32toQASYMM8_SIGNEDDataset, one_tolerance)
Usama Arif9e631c22019-05-14 17:10:40 +0100184CAST_SUITE(F32_to_QASYMM8, DataType::F32, DataType::QASYMM8, NECastToQASYMM8Fixture<float>, CastF32toQASYMM8Dataset, one_tolerance)
185#ifdef __ARM_FEATURE_FP16_VECTOR_ARITHMETIC
186CAST_SUITE(F32_to_F16, DataType::F32, DataType::F16, NECastToF16Fixture<float>, CastF32toF16Dataset, zero_tolerance)
187#endif // __ARM_FEATURE_FP16_VECTOR_ARITHMETIC
188CAST_SUITE(F32_to_S32, DataType::F32, DataType::S32, NECastToS32Fixture<float>, CastF32toS32Dataset, one_tolerance)
189CAST_SUITE(F32_to_U8, DataType::F32, DataType::S32, NECastToS32Fixture<float>, CastF32toS32Dataset, one_tolerance)
190
Yair Schwarzbaum298b2c02022-02-01 08:55:56 +0200191DATA_TEST_CASE(KernelSelectionDstFP16, framework::DatasetMode::ALL,
192 combine(framework::dataset::make("CpuExt", std::string("NEON")),
193 framework::dataset::make("DataType",
194{
195 DataType::F16,
196 DataType::U8,
197 DataType::S32,
198 DataType::QASYMM8,
199 DataType::QASYMM8_SIGNED,
200 DataType::BFLOAT16,
201})),
202cpu_ext, data_type)
203{
204 using namespace cpu::kernels;
205 const CpuCastKernel::CastKernel *selected_impl;
206
207 cpuinfo::CpuIsaInfo cpu_isa{};
208 cpu_isa.neon = (cpu_ext == "NEON");
209
210 cpu_isa.bf16 = (data_type == DataType::BFLOAT16);
211
212 /* bf16 cast is different from all the others being converted to fp32 and not to fp16 */
213 if(cpu_isa.bf16)
214 {
215 cpu_isa.fp16 = false;
216 selected_impl = CpuCastKernel::get_implementation(CastDataTypeISASelectorData{ data_type, DataType::F32, cpu_isa }, cpu::KernelSelectionType::Preferred);
217 }
218 else
219 {
220 cpu_isa.fp16 = true;
221 selected_impl = CpuCastKernel::get_implementation(CastDataTypeISASelectorData{ data_type, DataType::F16, cpu_isa }, cpu::KernelSelectionType::Preferred);
222 }
223
224 ARM_COMPUTE_ERROR_ON_NULLPTR(selected_impl);
225
226 std::string expected = lower_string(cpu_ext) + "_" + cpu_impl_dt(data_type) + "_cast";
227 std::string actual = selected_impl->name;
228
229 ARM_COMPUTE_EXPECT_EQUAL(expected, actual, framework::LogLevel::ERRORS);
230}
231
232DATA_TEST_CASE(KernelSelectionSrcFP32, framework::DatasetMode::ALL,
233 combine(framework::dataset::make("CpuExt", std::string("NEON")),
234 framework::dataset::make("DataType",
235{
236 DataType::F16,
237 DataType::BFLOAT16,
238})),
239cpu_ext, data_type)
240{
241 using namespace cpu::kernels;
242
243 cpuinfo::CpuIsaInfo cpu_isa{};
244 cpu_isa.neon = (cpu_ext == "NEON");
245 cpu_isa.fp16 = (data_type == DataType::F16);
246 cpu_isa.bf16 = (data_type == DataType::BFLOAT16);
247
248 const auto *selected_impl = CpuCastKernel::get_implementation(CastDataTypeISASelectorData{ DataType::F32, data_type, cpu_isa }, cpu::KernelSelectionType::Preferred);
249
250 ARM_COMPUTE_ERROR_ON_NULLPTR(selected_impl);
251
252 std::string expected = lower_string(cpu_ext) + "_fp32_to_" + cpu_impl_dt(data_type) + "_cast";
253 std::string actual = selected_impl->name;
254
255 ARM_COMPUTE_EXPECT_EQUAL(expected, actual, framework::LogLevel::ERRORS);
256}
257
Usama Arif9e631c22019-05-14 17:10:40 +0100258TEST_SUITE_END() // Cast
Sheri Zhangac6499a2021-02-10 15:32:38 +0000259TEST_SUITE_END() // Neon
Usama Arif9e631c22019-05-14 17:10:40 +0100260} // namespace validation
261} // namespace test
262} // namespace arm_compute