| /* |
| * Copyright (c) 2016-2019 ARM Limited. |
| * |
| * SPDX-License-Identifier: MIT |
| * |
| * Permission is hereby granted, free of charge, to any person obtaining a copy |
| * of this software and associated documentation files (the "Software"), to |
| * deal in the Software without restriction, including without limitation the |
| * rights to use, copy, modify, merge, publish, distribute, sublicense, and/or |
| * sell copies of the Software, and to permit persons to whom the Software is |
| * furnished to do so, subject to the following conditions: |
| * |
| * The above copyright notice and this permission notice shall be included in all |
| * copies or substantial portions of the Software. |
| * |
| * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR |
| * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, |
| * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE |
| * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER |
| * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, |
| * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE |
| * SOFTWARE. |
| */ |
| #include "arm_compute/core/CL/kernels/CLAccumulateKernel.h" |
| |
| #include "arm_compute/core/CL/CLKernelLibrary.h" |
| #include "arm_compute/core/CL/ICLTensor.h" |
| #include "arm_compute/core/CL/OpenCL.h" |
| #include "arm_compute/core/Error.h" |
| #include "arm_compute/core/IAccessWindow.h" |
| #include "arm_compute/core/Types.h" |
| #include "arm_compute/core/Validate.h" |
| |
| namespace arm_compute |
| { |
namespace
{
/** Number of elements processed per iteration.
 *
 * File-local constant that the configure() methods in this file pass to
 * ICLSimple2DKernel::configure().
 */
constexpr unsigned int num_elems_processed_per_iteration = 16U;
} // namespace
| |
| void CLAccumulateKernel::configure(const ICLTensor *input, ICLTensor *accum) |
| { |
| ARM_COMPUTE_ERROR_ON_DATA_TYPE_CHANNEL_NOT_IN(input, 1, DataType::U8); |
| ARM_COMPUTE_ERROR_ON_DATA_TYPE_CHANNEL_NOT_IN(accum, 1, DataType::S16); |
| |
| // Create kernel |
| _kernel = static_cast<cl::Kernel>(CLKernelLibrary::get().create_kernel("accumulate")); |
| |
| // Make sure _kernel is initialized before calling the parent's configure |
| ICLSimple2DKernel::configure(input, accum, num_elems_processed_per_iteration); |
| } |
| |
| void CLAccumulateWeightedKernel::configure(const ICLTensor *input, float alpha, ICLTensor *accum) |
| { |
| ARM_COMPUTE_ERROR_ON_DATA_TYPE_CHANNEL_NOT_IN(input, 1, DataType::U8); |
| ARM_COMPUTE_ERROR_ON_DATA_TYPE_CHANNEL_NOT_IN(accum, 1, DataType::U8); |
| ARM_COMPUTE_ERROR_ON(alpha < 0.0 || alpha > 1.0); |
| |
| // Create kernel |
| _kernel = static_cast<cl::Kernel>(CLKernelLibrary::get().create_kernel("accumulate_weighted")); |
| |
| // Set static kernel arguments |
| unsigned int idx = 2 * num_arguments_per_2D_tensor(); //Skip the input and output parameters |
| _kernel.setArg(idx++, alpha); |
| |
| // Configure kernel window |
| ICLSimple2DKernel::configure(input, accum, num_elems_processed_per_iteration); |
| } |
| |
| void CLAccumulateSquaredKernel::configure(const ICLTensor *input, uint32_t shift, ICLTensor *accum) |
| { |
| ARM_COMPUTE_ERROR_ON_DATA_TYPE_CHANNEL_NOT_IN(input, 1, DataType::U8); |
| ARM_COMPUTE_ERROR_ON_DATA_TYPE_CHANNEL_NOT_IN(accum, 1, DataType::S16); |
| ARM_COMPUTE_ERROR_ON(shift > 15); |
| |
| // Create kernel |
| _kernel = static_cast<cl::Kernel>(CLKernelLibrary::get().create_kernel("accumulate_squared")); |
| |
| // Set static kernel arguments |
| unsigned int idx = 2 * num_arguments_per_2D_tensor(); //Skip the input and output parameters |
| _kernel.setArg(idx++, shift); |
| |
| // Configure kernel window |
| ICLSimple2DKernel::configure(input, accum, num_elems_processed_per_iteration); |
| } |
| } // namespace arm_compute |