| /* |
| * Copyright (c) 2017-2018 ARM Limited. |
| * |
| * SPDX-License-Identifier: MIT |
| * |
| * Permission is hereby granted, free of charge, to any person obtaining a copy |
| * of this software and associated documentation files (the "Software"), to |
| * deal in the Software without restriction, including without limitation the |
| * rights to use, copy, modify, merge, publish, distribute, sublicense, and/or |
| * sell copies of the Software, and to permit persons to whom the Software is |
| * furnished to do so, subject to the following conditions: |
| * |
| * The above copyright notice and this permission notice shall be included in all |
| * copies or substantial portions of the Software. |
| * |
| * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR |
| * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, |
| * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE |
| * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER |
| * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, |
| * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE |
| * SOFTWARE. |
| */ |
| #include "PixelWiseMultiplication.h" |
| |
| namespace arm_compute |
| { |
| namespace test |
| { |
| namespace validation |
| { |
| namespace reference |
| { |
| template <class T> |
| struct is_floating_point |
| : std::integral_constant < bool, |
| std::is_same<float, typename std::remove_cv<T>::type>::value || std::is_same<half_float::half, typename std::remove_cv<T>::type>::value |
| || std::is_same<double, typename std::remove_cv<T>::type>::value || std::is_same<long double, typename std::remove_cv<T>::type>::value > |
| { |
| }; |
| |
| namespace |
| { |
| /** Compute the result of `src1 * src2 * scale`. The result type always matches the type of @p src2. |
| * |
| * @param[in] src1 An input value. Data types supported: U8/S16/F16/F32. |
| * @param[in] src2 An input value. Data types supported: same as @p src1. |
| * @param[in] scale Scale to apply after multiplication. |
| * Scale must be positive and its value must be either 1/255 or 1/2^n where n is between 0 and 15. |
| * @param[in] convert_policy Overflow policy. Supported overflow policies: Wrap, Saturate |
| * @param[in] rounding_policy Rounding policy. Supported rounding modes: to zero, to nearest even. |
| */ |
| template <typename T1, typename T2> |
| T2 mul(const T1 src1, const T2 src2, float scale, ConvertPolicy convert_policy, RoundingPolicy rounding_policy) |
| { |
| using intermediate_type = typename common_promoted_signed_type<T1, T2, T2>::intermediate_type; |
| |
| const double val = static_cast<intermediate_type>(src1) * static_cast<intermediate_type>(src2) * static_cast<double>(scale); |
| |
| if(is_floating_point<T2>::value) |
| { |
| const auto result = static_cast<T2>(val); |
| |
| return result; |
| } |
| else |
| { |
| double rounded_val = 0; |
| switch(rounding_policy) |
| { |
| case(RoundingPolicy::TO_ZERO): |
| rounded_val = support::cpp11::trunc(val); |
| break; |
| case(RoundingPolicy::TO_NEAREST_UP): |
| rounded_val = round_half_up(val); |
| break; |
| case(RoundingPolicy::TO_NEAREST_EVEN): |
| rounded_val = round_half_even(val); |
| break; |
| default: |
| ARM_COMPUTE_ERROR("Unsupported rounding policy"); |
| } |
| |
| const auto result = static_cast<T2>((convert_policy == ConvertPolicy::SATURATE) ? saturate_cast<T2>(rounded_val) : rounded_val); |
| |
| return result; |
| } |
| } |
| |
| template <size_t dim> |
| struct BroadcastUnroll |
| { |
| template <typename T1, typename T2> |
| static void unroll(const SimpleTensor<T1> &src1, const SimpleTensor<T2> &src2, SimpleTensor<T2> &dst, |
| float scale, ConvertPolicy convert_policy, RoundingPolicy rounding_policy, |
| Coordinates &id_src1, Coordinates &id_src2, Coordinates &id_dst) |
| { |
| const bool src1_is_broadcast = (src1.shape()[dim - 1] != dst.shape()[dim - 1]); |
| const bool src2_is_broadcast = (src2.shape()[dim - 1] != dst.shape()[dim - 1]); |
| |
| id_src1.set(dim - 1, 0); |
| id_src2.set(dim - 1, 0); |
| id_dst.set(dim - 1, 0); |
| |
| for(size_t i = 0; i < dst.shape()[dim - 1]; ++i, ++id_dst[dim - 1]) |
| { |
| BroadcastUnroll < dim - 1 >::unroll(src1, src2, dst, scale, convert_policy, rounding_policy, id_src1, id_src2, id_dst); |
| |
| id_src1[dim - 1] += !src1_is_broadcast; |
| id_src2[dim - 1] += !src2_is_broadcast; |
| } |
| } |
| }; |
| |
| template <> |
| struct BroadcastUnroll<0> |
| { |
| template <typename T1, typename T2> |
| static void unroll(const SimpleTensor<T1> &src1, const SimpleTensor<T2> &src2, SimpleTensor<T2> &dst, |
| float scale, ConvertPolicy convert_policy, RoundingPolicy rounding_policy, |
| Coordinates &id_src1, Coordinates &id_src2, Coordinates &id_dst) |
| { |
| dst[coord2index(dst.shape(), id_dst)] = mul(src1[coord2index(src1.shape(), id_src1)], src2[coord2index(src2.shape(), id_src2)], scale, convert_policy, rounding_policy); |
| } |
| }; |
| } // namespace |
| |
| template <typename T1, typename T2> |
| SimpleTensor<T2> pixel_wise_multiplication(const SimpleTensor<T1> &src1, const SimpleTensor<T2> &src2, float scale, ConvertPolicy convert_policy, RoundingPolicy rounding_policy) |
| { |
| SimpleTensor<T2> dst(TensorShape::broadcast_shape(src1.shape(), src2.shape()), src2.data_type()); |
| |
| if(scale < 0) |
| { |
| ARM_COMPUTE_ERROR("Scale of pixel-wise multiplication must be non-negative"); |
| } |
| |
| Coordinates id_src1, id_src2, id_dst; |
| |
| BroadcastUnroll<Coordinates::num_max_dimensions>::unroll(src1, src2, dst, scale, convert_policy, rounding_policy, id_src1, id_src2, id_dst); |
| |
| return dst; |
| } |
| |
| // *INDENT-OFF* |
| // clang-format off |
| template SimpleTensor<uint8_t> pixel_wise_multiplication(const SimpleTensor<uint8_t> &src1, const SimpleTensor<uint8_t> &src2, float scale, ConvertPolicy convert_policy, RoundingPolicy rounding_policy); |
| template SimpleTensor<int16_t> pixel_wise_multiplication(const SimpleTensor<uint8_t> &src1, const SimpleTensor<int16_t> &src2, float scale, ConvertPolicy convert_policy, RoundingPolicy rounding_policy); |
| template SimpleTensor<int16_t> pixel_wise_multiplication(const SimpleTensor<int16_t> &src1, const SimpleTensor<int16_t> &src2, float scale, ConvertPolicy convert_policy, RoundingPolicy rounding_policy); |
| template SimpleTensor<float> pixel_wise_multiplication(const SimpleTensor<float> &src1, const SimpleTensor<float> &src2, float scale, ConvertPolicy convert_policy, RoundingPolicy rounding_policy); |
| template SimpleTensor<half_float::half> pixel_wise_multiplication(const SimpleTensor<half_float::half> &src1, const SimpleTensor<half_float::half> &src2, float scale, ConvertPolicy convert_policy, RoundingPolicy rounding_policy); |
| // clang-format on |
| // *INDENT-ON* |
| } // namespace reference |
| } // namespace validation |
| } // namespace test |
| } // namespace arm_compute |