blob: b42f13ae4753c7a45e4d814b3032ffde43dd6dc1 [file] [log] [blame]
Anthony Barbier6ff3b192017-09-04 18:44:23 +01001/*
2 * Copyright (c) 2017 ARM Limited.
3 *
4 * SPDX-License-Identifier: MIT
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a copy
7 * of this software and associated documentation files (the "Software"), to
8 * deal in the Software without restriction, including without limitation the
9 * rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
10 * sell copies of the Software, and to permit persons to whom the Software is
11 * furnished to do so, subject to the following conditions:
12 *
13 * The above copyright notice and this permission notice shall be included in all
14 * copies or substantial portions of the Software.
15 *
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
19 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
21 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
22 * SOFTWARE.
23 */
24#include "Globals.h"
Anthony Barbier6ff3b192017-09-04 18:44:23 +010025#include "NEON/NEAccessor.h"
26#include "TensorLibrary.h"
27#include "TypePrinter.h"
28#include "Utils.h"
29#include "validation/Datasets.h"
30#include "validation/ReferenceCPP.h"
31#include "validation/Validation.h"
32
33#include "arm_compute/core/Helpers.h"
34#include "arm_compute/core/NEON/NEFixedPoint.h"
35#include "arm_compute/core/Types.h"
36#include "arm_compute/runtime/Tensor.h"
37#include "arm_compute/runtime/TensorAllocator.h"
38
39#include "boost_wrapper.h"
40
41#include <random>
42#include <string>
43
44using namespace arm_compute;
45using namespace arm_compute::test;
46using namespace arm_compute::test::neon;
47using namespace arm_compute::test::validation;
48
49namespace
50{
51const float tolerance = 3; /**< Tolerance value for comparing reference's output against implementation's output */
52
53/** Compute Neon reciprocal function for signed 8bit fixed point.
54 *
55 * @param[in] shape Shape of the input and output tensors.
56 *
57 * @return Computed output tensor.
58 */
59Tensor compute_reciprocal_qs8(const TensorShape &shape, int fixed_point_position)
60{
61 // Create tensors
Moritz Pflanzer94450f12017-06-30 12:48:43 +010062 Tensor src = create_tensor<Tensor>(shape, DataType::QS8, 1, fixed_point_position);
63 Tensor dst = create_tensor<Tensor>(shape, DataType::QS8, 1, fixed_point_position);
Anthony Barbier6ff3b192017-09-04 18:44:23 +010064
65 constexpr unsigned int num_elems_processed_per_iteration = 16;
66 Window window = calculate_max_window(*src.info(), Steps(num_elems_processed_per_iteration));
67 AccessWindowHorizontal input_access(src.info(), 0, num_elems_processed_per_iteration);
68 AccessWindowHorizontal output_access(dst.info(), 0, num_elems_processed_per_iteration);
69
70 update_window_and_padding(window, input_access, output_access);
71 output_access.set_valid_region(window, src.info()->valid_region());
72
73 // Allocate tensors
74 src.allocator()->allocate();
75 dst.allocator()->allocate();
76
77 BOOST_TEST(!src.info()->is_resizable());
78 BOOST_TEST(!dst.info()->is_resizable());
79
Michalis Spyrou0a8334c2017-06-14 18:00:05 +010080 // Fill tensors. Keep the range between [15, 100) so the result won't
Anthony Barbier6ff3b192017-09-04 18:44:23 +010081 // overflow. E.g. for Q2.5 reciprocal(0.001) = 1000, which cannot be represented.
Michalis Spyrou0a8334c2017-06-14 18:00:05 +010082 std::uniform_int_distribution<> distribution(15, 0x7F);
Anthony Barbier6ff3b192017-09-04 18:44:23 +010083 library->fill(NEAccessor(src), distribution, 0);
84
85 Iterator input(&src, window);
86 Iterator output(&dst, window);
87
88 execute_window_loop(window, [&](const Coordinates & id)
89 {
90 qint8x16_t in = vld1q_s8(reinterpret_cast<const qint8_t *>(input.ptr()));
91 vst1q_s8(reinterpret_cast<qint8_t *>(output.ptr()), vrecipq_qs8(in, fixed_point_position));
92 },
93 input, output);
94
95 return dst;
96}
97} // namespace
98
99#ifndef DOXYGEN_SKIP_THIS
100BOOST_AUTO_TEST_SUITE(NEON)
101BOOST_AUTO_TEST_SUITE(FixedPoint)
102BOOST_AUTO_TEST_SUITE(QS8)
103BOOST_AUTO_TEST_SUITE(Reciprocal)
104
105BOOST_TEST_DECORATOR(*boost::unit_test::label("precommit") * boost::unit_test::label("nightly"))
106BOOST_DATA_TEST_CASE(RunSmall, Small1DShape() * boost::unit_test::data::xrange(1, 6), shape, fixed_point_position)
107{
108 // Compute function
109 Tensor dst = compute_reciprocal_qs8(shape, fixed_point_position);
110
111 // Compute reference
112 RawTensor ref_dst = Reference::compute_reference_fixed_point_operation(shape, DataType::QS8, DataType::QS8, FixedPointOp::RECIPROCAL, fixed_point_position);
113
114 // Validate output
115 validate(NEAccessor(dst), ref_dst, tolerance, 0);
116}
117
118BOOST_AUTO_TEST_SUITE_END()
119BOOST_AUTO_TEST_SUITE_END()
120BOOST_AUTO_TEST_SUITE_END()
121BOOST_AUTO_TEST_SUITE_END()
Anthony Barbierac69aa12017-07-03 17:39:37 +0100122#endif /* DOXYGEN_SKIP_THIS */