blob: f4bd4e6cadc59aa5934792f71e31ded7532ff69c [file] [log] [blame]
Anthony Barbier6ff3b192017-09-04 18:44:23 +01001/*
SiCong Lic0463a22023-05-17 13:46:13 +01002 * Copyright (c) 2017-2023 Arm Limited.
Anthony Barbier6ff3b192017-09-04 18:44:23 +01003 *
4 * SPDX-License-Identifier: MIT
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a copy
7 * of this software and associated documentation files (the "Software"), to
8 * deal in the Software without restriction, including without limitation the
9 * rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
10 * sell copies of the Software, and to permit persons to whom the Software is
11 * furnished to do so, subject to the following conditions:
12 *
13 * The above copyright notice and this permission notice shall be included in all
14 * copies or substantial portions of the Software.
15 *
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
19 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
21 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
22 * SOFTWARE.
23 */
Georgios Pinitas7891a732021-08-20 21:39:25 +010024#include "src/cpu/kernels/CpuActivationKernel.h"
Anthony Barbier6ff3b192017-09-04 18:44:23 +010025
Anthony Barbier6ff3b192017-09-04 18:44:23 +010026#include "arm_compute/core/ITensor.h"
Anthony Barbier6ff3b192017-09-04 18:44:23 +010027#include "arm_compute/core/TensorInfo.h"
28#include "arm_compute/core/Utils.h"
Sang-Hoon Park68dd25f2020-10-19 16:00:11 +010029#include "src/core/CPP/Validate.h"
Sang-Hoon Park68dd25f2020-10-19 16:00:11 +010030#include "src/core/helpers/AutoConfiguration.h"
31#include "src/core/helpers/WindowHelpers.h"
Anthony Barbier6ff3b192017-09-04 18:44:23 +010032
Michalis Spyrouc4d45552020-10-19 12:41:30 +010033#include "src/core/common/Registrars.h"
Georgios Pinitas7891a732021-08-20 21:39:25 +010034#include "src/cpu/kernels/activation/list.h"
Michalis Spyrouc4d45552020-10-19 12:41:30 +010035
Georgios Pinitasf8f04422021-01-08 17:25:55 +000036#include <array>
Anthony Barbier6ff3b192017-09-04 18:44:23 +010037
Michele Di Giorgiof9b595a2020-07-03 13:34:52 +010038namespace arm_compute
39{
Georgios Pinitasf8f04422021-01-08 17:25:55 +000040namespace cpu
41{
42namespace kernels
43{
Michalis Spyrouafa5d812017-11-30 14:25:57 +000044namespace
45{
Giorgio Arena5ae8d802021-11-18 18:02:13 +000046static const std::vector<CpuActivationKernel::ActivationKernel> available_kernels =
Michalis Spyrouc4d45552020-10-19 12:41:30 +010047{
Pablo Marquez Tellod1586092022-06-10 14:37:10 +010048#ifdef ARM_COMPUTE_ENABLE_SVE
49 {
SiCong Lic0463a22023-05-17 13:46:13 +010050 "sve2_q8_activation_lut",
Pablo Marquez Tello48cfd5f2023-06-09 11:22:29 +010051 [](const ActivationDataTypeISASelectorData & data) { return (data.dt == DataType::QASYMM8 || data.dt == DataType::QASYMM8_SIGNED) && data.cpumodel == CPUModel::A510 && data.isa.sve2; },
SiCong Lic0463a22023-05-17 13:46:13 +010052 REGISTER_QASYMM8_SVE2(arm_compute::cpu::sve2_q8_activation_lut)
Pablo Marquez Tellod1586092022-06-10 14:37:10 +010053 },
54#endif // ARM_COMPUTE_ENABLE_SVE
Viet-Hoa Dob042e392022-06-21 15:56:15 +010055#ifdef __aarch64__
Murray Kornelsen926f5022022-07-13 21:22:39 -040056 {
57 // Neon LUT implementantion takes precedence
Viet-Hoa Do29db3d22022-08-10 11:56:49 +010058 "neon_q8_activation_lut",
Pablo Marquez Tello48cfd5f2023-06-09 11:22:29 +010059 [](const ActivationDataTypeISASelectorData & data) { return data.dt == DataType::QASYMM8 || data.dt == DataType::QASYMM8_SIGNED; },
Viet-Hoa Do29db3d22022-08-10 11:56:49 +010060 REGISTER_Q8_NEON(arm_compute::cpu::neon_q8_activation_lut)
Pablo Marquez Tello700b9132022-06-22 11:23:53 +010061 },
Viet-Hoa Dob042e392022-06-21 15:56:15 +010062#endif // __aarch64__
Michalis Spyrouaa51a5b2020-11-22 00:49:42 +000063 {
Dana Zlotnika538ae52022-02-21 13:12:41 +020064 "sve2_qu8_activation",
Murray Kornelsen926f5022022-07-13 21:22:39 -040065 [](const ActivationDataTypeISASelectorData & data) { return data.dt == DataType::QASYMM8 && data.isa.sve2 && data.f != ActivationLayerInfo::ActivationFunction::GELU; },
Dana Zlotnika538ae52022-02-21 13:12:41 +020066 REGISTER_QASYMM8_SVE2(arm_compute::cpu::sve2_qasymm8_activation)
67 },
68 {
69 "sve2_qs8_activation",
Murray Kornelsen926f5022022-07-13 21:22:39 -040070 [](const ActivationDataTypeISASelectorData & data) { return data.dt == DataType::QASYMM8_SIGNED && data.isa.sve2 && data.f != ActivationLayerInfo::ActivationFunction::GELU; },
Dana Zlotnika538ae52022-02-21 13:12:41 +020071 REGISTER_QASYMM8_SIGNED_SVE2(arm_compute::cpu::sve2_qasymm8_signed_activation)
72 },
73 {
74 "sve2_qs16_activation",
Murray Kornelsen926f5022022-07-13 21:22:39 -040075 [](const ActivationDataTypeISASelectorData & data) { return data.dt == DataType::QSYMM16 && data.isa.sve2 && data.f != ActivationLayerInfo::ActivationFunction::GELU; },
Dana Zlotnika538ae52022-02-21 13:12:41 +020076 REGISTER_QSYMM16_SVE2(arm_compute::cpu::sve2_qsymm16_activation)
77 },
78 {
Georgios Pinitas5fdde992021-06-25 05:42:57 +010079 "sve_fp16_activation",
Murray Kornelsen926f5022022-07-13 21:22:39 -040080 [](const ActivationDataTypeISASelectorData & data) { return data.dt == DataType::F16 && data.isa.sve && data.isa.fp16 && data.f != ActivationLayerInfo::ActivationFunction::GELU; },
Dana Zlotnik32291712021-11-25 09:58:27 +020081 REGISTER_FP16_SVE(arm_compute::cpu::sve_fp16_activation)
Michalis Spyrouaa51a5b2020-11-22 00:49:42 +000082 },
83 {
Georgios Pinitas5fdde992021-06-25 05:42:57 +010084 "sve_fp32_activation",
Murray Kornelsen926f5022022-07-13 21:22:39 -040085 [](const ActivationDataTypeISASelectorData & data) { return data.dt == DataType::F32 && data.isa.sve && data.f != ActivationLayerInfo::ActivationFunction::GELU; },
Dana Zlotnik32291712021-11-25 09:58:27 +020086 REGISTER_FP32_SVE(arm_compute::cpu::sve_fp32_activation)
Michalis Spyrouaa51a5b2020-11-22 00:49:42 +000087 },
Michalis Spyrouc4d45552020-10-19 12:41:30 +010088 {
Georgios Pinitas5fdde992021-06-25 05:42:57 +010089 "neon_fp16_activation",
Pablo Marquez Tellod75cd8a2022-05-26 14:19:39 +010090 [](const ActivationDataTypeISASelectorData & data) { return data.dt == DataType::F16 && data.isa.fp16; },
Dana Zlotnik32291712021-11-25 09:58:27 +020091 REGISTER_FP16_NEON(arm_compute::cpu::neon_fp16_activation)
Michalis Spyrouc4d45552020-10-19 12:41:30 +010092 },
93 {
Georgios Pinitas5fdde992021-06-25 05:42:57 +010094 "neon_fp32_activation",
Pablo Marquez Tellod75cd8a2022-05-26 14:19:39 +010095 [](const ActivationDataTypeISASelectorData & data) { return data.dt == DataType::F32; },
Dana Zlotnik32291712021-11-25 09:58:27 +020096 REGISTER_FP32_NEON(arm_compute::cpu::neon_fp32_activation)
Michalis Spyrouc4d45552020-10-19 12:41:30 +010097 },
Michalis Spyrouaa51a5b2020-11-22 00:49:42 +000098 {
Georgios Pinitas5fdde992021-06-25 05:42:57 +010099 "neon_qu8_activation",
Viet-Hoa Dob042e392022-06-21 15:56:15 +0100100 [](const ActivationDataTypeISASelectorData & data) { return data.dt == DataType::QASYMM8; },
Dana Zlotnik32291712021-11-25 09:58:27 +0200101 REGISTER_QASYMM8_NEON(arm_compute::cpu::neon_qasymm8_activation)
Michalis Spyrouc4d45552020-10-19 12:41:30 +0100102 },
103 {
Georgios Pinitas5fdde992021-06-25 05:42:57 +0100104 "neon_qs8_activation",
Pablo Marquez Tellod75cd8a2022-05-26 14:19:39 +0100105 [](const ActivationDataTypeISASelectorData & data) { return data.dt == DataType::QASYMM8_SIGNED; },
Dana Zlotnik32291712021-11-25 09:58:27 +0200106 REGISTER_QASYMM8_SIGNED_NEON(arm_compute::cpu::neon_qasymm8_signed_activation)
Michalis Spyrouc4d45552020-10-19 12:41:30 +0100107 },
108 {
Georgios Pinitas5fdde992021-06-25 05:42:57 +0100109 "neon_qs16_activation",
Pablo Marquez Tellod75cd8a2022-05-26 14:19:39 +0100110 [](const ActivationDataTypeISASelectorData & data) { return data.dt == DataType::QSYMM16; },
Dana Zlotnik32291712021-11-25 09:58:27 +0200111 REGISTER_QSYMM16_NEON(arm_compute::cpu::neon_qsymm16_activation)
Michalis Spyrouc4d45552020-10-19 12:41:30 +0100112 },
113};
114
Georgios Pinitasf8f04422021-01-08 17:25:55 +0000115/* Supported activation in the 8-bit integer domain */
Murray Kornelsen926f5022022-07-13 21:22:39 -0400116static const std::array<ActivationLayerInfo::ActivationFunction, 8> qasymm8_activations =
Georgios Pinitasf8f04422021-01-08 17:25:55 +0000117{
118 ActivationLayerInfo::ActivationFunction::RELU,
119 ActivationLayerInfo::ActivationFunction::LU_BOUNDED_RELU,
120 ActivationLayerInfo::ActivationFunction::BOUNDED_RELU,
121 ActivationLayerInfo::ActivationFunction::LOGISTIC,
122 ActivationLayerInfo::ActivationFunction::TANH,
123 ActivationLayerInfo::ActivationFunction::HARD_SWISH,
124 ActivationLayerInfo::ActivationFunction::LEAKY_RELU,
Murray Kornelsen926f5022022-07-13 21:22:39 -0400125 ActivationLayerInfo::ActivationFunction::GELU,
Georgios Pinitasf8f04422021-01-08 17:25:55 +0000126};
127/* Supported activation in the 16-bit integer domain */
Pablo Marquez Tellof55cca52022-04-06 14:31:25 +0100128static const std::array<ActivationLayerInfo::ActivationFunction, 4> qsymm16_activations =
Georgios Pinitasf8f04422021-01-08 17:25:55 +0000129{
130 ActivationLayerInfo::ActivationFunction::LOGISTIC,
131 ActivationLayerInfo::ActivationFunction::TANH,
Pablo Marquez Tellof55cca52022-04-06 14:31:25 +0100132 ActivationLayerInfo::ActivationFunction::HARD_SWISH,
133 ActivationLayerInfo::ActivationFunction::LU_BOUNDED_RELU
Georgios Pinitasf8f04422021-01-08 17:25:55 +0000134};
135
Michele Di Giorgiobd2c8e12021-01-19 15:29:02 +0000136Status validate_arguments(const ITensorInfo *src, const ITensorInfo *dst, const ActivationLayerInfo &activation_info)
Michalis Spyrouafa5d812017-11-30 14:25:57 +0000137{
Michele Di Giorgiobd2c8e12021-01-19 15:29:02 +0000138 ARM_COMPUTE_RETURN_ERROR_ON_CPU_F16_UNSUPPORTED(src);
139 ARM_COMPUTE_RETURN_ERROR_ON_DATA_TYPE_CHANNEL_NOT_IN(src, 1, DataType::QASYMM8_SIGNED, DataType::QASYMM8, DataType::QSYMM16, DataType::F16, DataType::F32);
Michalis Spyrouafa5d812017-11-30 14:25:57 +0000140
Pablo Marquez Tellod1586092022-06-10 14:37:10 +0100141 const auto *uk = CpuActivationKernel::get_implementation(ActivationDataTypeISASelectorData{ src->data_type(), CPUInfo::get().get_cpu_model(), CPUInfo::get().get_isa(), activation_info.activation() });
Michalis Spyrouc4d45552020-10-19 12:41:30 +0100142 ARM_COMPUTE_RETURN_ERROR_ON(uk == nullptr || uk->ukernel == nullptr);
143
Michele Di Giorgiobd2c8e12021-01-19 15:29:02 +0000144 const DataType data_type = src->data_type();
145 const QuantizationInfo &oq_info = (dst != nullptr) ? dst->quantization_info() : src->quantization_info();
Georgios Pinitas4b3fba12019-06-04 17:31:46 +0100146 const ActivationLayerInfo::ActivationFunction f_act = activation_info.activation();
147
Georgios Pinitasf8f04422021-01-08 17:25:55 +0000148 ARM_COMPUTE_RETURN_ERROR_ON_MSG(is_data_type_quantized_asymmetric(data_type) && (std::find(std::begin(qasymm8_activations), std::end(qasymm8_activations), f_act) == std::end(qasymm8_activations)),
Sang-Hoon Parkadd8e812020-11-25 11:46:03 +0000149 "For QASYMM8 only hard swish, leaky relu, tanh, logistic, relu and lower/upper bounded relu are supported");
giuros01c9573f32019-06-20 10:30:17 +0100150
Georgios Pinitasf8f04422021-01-08 17:25:55 +0000151 ARM_COMPUTE_RETURN_ERROR_ON_MSG(is_data_type_quantized_symmetric(data_type) && (std::find(std::begin(qsymm16_activations), std::end(qsymm16_activations), f_act) == std::end(qsymm16_activations)),
giuros01c9573f32019-06-20 10:30:17 +0100152 "For QSYMM16 only tanh and logistic are supported");
Michalis Spyrou8d4d1b82019-11-28 11:31:23 +0000153 ARM_COMPUTE_RETURN_ERROR_ON((data_type == DataType::QASYMM8 || data_type == DataType::QASYMM16) && (f_act == ActivationLayerInfo::ActivationFunction::TANH)
154 && (oq_info != QuantizationInfo(1.f / 128.f, 128)));
155 ARM_COMPUTE_RETURN_ERROR_ON((data_type == DataType::QASYMM8 || data_type == DataType::QASYMM16) && (f_act == ActivationLayerInfo::ActivationFunction::LOGISTIC)
156 && (oq_info != QuantizationInfo(1.f / 256.f, 0)));
157
158 ARM_COMPUTE_RETURN_ERROR_ON(data_type == DataType::QASYMM8_SIGNED && (f_act == ActivationLayerInfo::ActivationFunction::TANH) && (oq_info != QuantizationInfo(1.f / 128.f, 0)));
159 ARM_COMPUTE_RETURN_ERROR_ON(data_type == DataType::QASYMM8_SIGNED && (f_act == ActivationLayerInfo::ActivationFunction::LOGISTIC) && (oq_info != QuantizationInfo(1.f / 256.f, -128)));
Georgios Pinitas4b3fba12019-06-04 17:31:46 +0100160
giuros01c9573f32019-06-20 10:30:17 +0100161 ARM_COMPUTE_RETURN_ERROR_ON(is_data_type_quantized_symmetric(data_type) && (f_act == ActivationLayerInfo::ActivationFunction::TANH) && (oq_info != QuantizationInfo(1.f / 32768.f, 0)));
162 ARM_COMPUTE_RETURN_ERROR_ON(is_data_type_quantized_symmetric(data_type) && (f_act == ActivationLayerInfo::ActivationFunction::LOGISTIC) && (oq_info != QuantizationInfo(1.f / 32768.f, 0)));
163
Michele Di Giorgiobd2c8e12021-01-19 15:29:02 +0000164 // Checks performed when dst is configured
165 if((dst != nullptr) && (dst->total_size() != 0))
Michalis Spyrouafa5d812017-11-30 14:25:57 +0000166 {
Michele Di Giorgiobd2c8e12021-01-19 15:29:02 +0000167 ARM_COMPUTE_RETURN_ERROR_ON_MISMATCHING_SHAPES(src, dst);
168 ARM_COMPUTE_RETURN_ERROR_ON_MISMATCHING_DATA_TYPES(src, dst);
Michalis Spyrouafa5d812017-11-30 14:25:57 +0000169 }
170
171 return Status{};
172}
173
Michele Di Giorgiobd2c8e12021-01-19 15:29:02 +0000174std::pair<Status, Window> validate_and_configure_window(const ITensorInfo *src, ITensorInfo *dst)
Michalis Spyrouafa5d812017-11-30 14:25:57 +0000175{
Georgios Pinitas5a594532018-12-03 14:30:05 +0000176 // Configure kernel window
Michele Di Giorgiobd2c8e12021-01-19 15:29:02 +0000177 Window win = calculate_max_window(*src, Steps());
Michalis Spyrouafa5d812017-11-30 14:25:57 +0000178
Michele Di Giorgiobd2c8e12021-01-19 15:29:02 +0000179 if(dst != nullptr)
Michalis Spyrouafa5d812017-11-30 14:25:57 +0000180 {
Michele Di Giorgiobd2c8e12021-01-19 15:29:02 +0000181 // dst auto inizialitation if not yet initialized
182 auto_init_if_empty(*dst, *src->clone());
Michalis Spyrouafa5d812017-11-30 14:25:57 +0000183 }
184
Georgios Pinitas5a594532018-12-03 14:30:05 +0000185 return std::make_pair(Status{}, win);
Michalis Spyrouafa5d812017-11-30 14:25:57 +0000186}
#ifdef __aarch64__
/** Evaluate one activation function on a single real value.
 *
 * @param[in] act_func Activation function to evaluate.
 * @param[in] x        Input value.
 * @param[in] a        First activation parameter (its meaning depends on @p act_func).
 * @param[in] b        Second activation parameter (its meaning depends on @p act_func).
 *
 * @return The activated value. An unknown function raises ARM_COMPUTE_ERROR and yields 0.
 */
float lut_activation_value(ActivationLayerInfo::ActivationFunction act_func, float x, float a, float b)
{
    using ActFn = ActivationLayerInfo::ActivationFunction;

    switch(act_func)
    {
        case ActFn::HARD_SWISH:
            return x * ((std::min(std::max((x + 3), 0.0f), 6.0f)) * 0.166666667f);
        case ActFn::LEAKY_RELU:
            return x > 0 ? x : x * a;
        case ActFn::LOGISTIC:
            return 1.f / (1.f + std::exp(-x));
        case ActFn::ABS:
            return std::abs(x);
        case ActFn::LINEAR:
            return a * x + b;
        case ActFn::RELU:
            return std::max<>(0.f, x);
        case ActFn::BOUNDED_RELU:
            return std::min<>(a, std::max(0.f, x));
        case ActFn::LU_BOUNDED_RELU:
            return std::min<>(a, std::max<>(b, x));
        case ActFn::SOFT_RELU:
            // Above 12 the input is returned unchanged instead of evaluating log(1 + exp(x))
            return (x > 12.f) ? x : std::log(1.f + std::exp(x));
        case ActFn::ELU:
            return (x >= 0) ? x : a * (std::exp(x) - 1);
        case ActFn::SQRT:
            return std::sqrt(x);
        case ActFn::SQUARE:
            return x * x;
        case ActFn::TANH:
            return a * std::tanh(b * x);
        case ActFn::IDENTITY:
            return x;
        case ActFn::SWISH:
            return x / (1.f + std::exp(-a * x));
        case ActFn::GELU:
            // 1.41421356237f is sqrt(2)
            return x * (0.5f * (1.0f + erff(x / 1.41421356237f)));
        default:
            ARM_COMPUTE_ERROR("Not supported");
            return 0;
    }
}

/** Fill a lookup table with the quantized activation result of every table index.
 *
 * For each index the value is dequantized with @p qi_in, passed through the
 * activation function and re-quantized with @p qi_out. QASYMM8 uses the unsigned
 * (de)quantization helpers; any other @p data_type uses the signed 8-bit ones.
 *
 * @param[in]  act_func  Activation function to tabulate.
 * @param[in]  data_type Data type of the tensor the table is built for.
 * @param[in]  qi_in     Input quantization info.
 * @param[in]  qi_out    Output quantization info.
 * @param[out] lut       Table to fill; every entry is overwritten.
 * @param[in]  a         First activation parameter.
 * @param[in]  b         Second activation parameter.
 */
void init_lut(ActivationLayerInfo::ActivationFunction act_func, DataType data_type,
              const UniformQuantizationInfo &qi_in, const UniformQuantizationInfo &qi_out,
              ActivationLayerInfo::LookupTable256 &lut, float a, float b)
{
    const bool is_unsigned = (data_type == DataType::QASYMM8);

    for(size_t idx = 0; idx < lut.size(); ++idx)
    {
        const float real_in  = is_unsigned ? dequantize_qasymm8(idx, qi_in) : dequantize_qasymm8_signed(idx, qi_in);
        const float real_out = lut_activation_value(act_func, real_in, a, b);

        lut[idx] = is_unsigned ? quantize_qasymm8(real_out, qi_out) : quantize_qasymm8_signed(real_out, qi_out);
    }
}
#endif // __aarch64__
Michalis Spyrouafa5d812017-11-30 14:25:57 +0000253} // namespace
Anthony Barbier6ff3b192017-09-04 18:44:23 +0100254
Michele Di Giorgiobd2c8e12021-01-19 15:29:02 +0000255void CpuActivationKernel::configure(const ITensorInfo *src, ITensorInfo *dst, ActivationLayerInfo activation_info)
Anthony Barbier6ff3b192017-09-04 18:44:23 +0100256{
Mohammed Suhail Munshifa79fda2022-09-20 11:49:23 +0100257 ARM_COMPUTE_UNUSED(dst);
Michalis Spyrou60c3b0e2021-04-08 12:02:58 +0100258 ARM_COMPUTE_ERROR_ON_NULLPTR(src);
Michele Di Giorgiobd2c8e12021-01-19 15:29:02 +0000259 ARM_COMPUTE_ERROR_THROW_ON(validate_arguments(src, dst, activation_info));
Michel Iwaniec5dfeae62017-11-29 10:48:23 +0000260
Pablo Marquez Tellod1586092022-06-10 14:37:10 +0100261 const auto uk = CpuActivationKernel::get_implementation(ActivationDataTypeISASelectorData{ src->data_type(), CPUInfo::get().get_cpu_model(), CPUInfo::get().get_isa(), activation_info.activation() });
Mohammed Suhail Munshifa79fda2022-09-20 11:49:23 +0100262 if(dst != nullptr)
263 {
264 // dst auto inizialitation if not yet initialized
265 auto_init_if_empty(*dst, *src->clone());
266 }
Giorgio Arena5ae8d802021-11-18 18:02:13 +0000267
Georgios Pinitas5fdde992021-06-25 05:42:57 +0100268 ARM_COMPUTE_ERROR_ON_NULLPTR(uk);
269
Georgios Pinitas5fdde992021-06-25 05:42:57 +0100270 _run_method = uk->ukernel;
271 _name = std::string("CpuActivationKernel").append("/").append(uk->name);
272
Viet-Hoa Dob042e392022-06-21 15:56:15 +0100273#ifdef __aarch64__
Pablo Marquez Tello48cfd5f2023-06-09 11:22:29 +0100274 if(src->data_type() == DataType::QASYMM8 || src->data_type() == DataType::QASYMM8_SIGNED)
Pablo Marquez Tellod75cd8a2022-05-26 14:19:39 +0100275 {
Pablo Marquez Tello48cfd5f2023-06-09 11:22:29 +0100276 ActivationLayerInfo::LookupTable256 tmp_lut;
277 init_lut(activation_info.activation(), src->data_type(), src->quantization_info().uniform(), (dst) ? dst->quantization_info().uniform() : src->quantization_info().uniform(),
278 tmp_lut, activation_info.a(), activation_info.b());
279 activation_info.setLookupTable256(tmp_lut);
Pablo Marquez Tellod75cd8a2022-05-26 14:19:39 +0100280 }
Viet-Hoa Dob042e392022-06-21 15:56:15 +0100281#endif // __aarch64__
Pablo Marquez Tellod75cd8a2022-05-26 14:19:39 +0100282 _act_info = activation_info;
283
Mohammed Suhail Munshifa79fda2022-09-20 11:49:23 +0100284 Window win;
285
Viet-Hoa Do0a36f582022-10-18 15:23:46 +0100286 // Use squashed window
287 std::tie(win, _split_dimension) = calculate_squashed_or_max_window(*src);
288 ICPPKernel::configure(win);
Anthony Barbier6ff3b192017-09-04 18:44:23 +0100289}
290
Michele Di Giorgiobd2c8e12021-01-19 15:29:02 +0000291Status CpuActivationKernel::validate(const ITensorInfo *src, const ITensorInfo *dst, const ActivationLayerInfo &act_info)
Michalis Spyrouafa5d812017-11-30 14:25:57 +0000292{
293 ARM_COMPUTE_UNUSED(act_info);
Michele Di Giorgiobd2c8e12021-01-19 15:29:02 +0000294 ARM_COMPUTE_RETURN_ON_ERROR(validate_arguments(src, dst, act_info));
295 ARM_COMPUTE_RETURN_ON_ERROR(validate_and_configure_window(src->clone().get(), (dst != nullptr) ? dst->clone().get() : nullptr).first);
Michalis Spyrouafa5d812017-11-30 14:25:57 +0000296
297 return Status{};
298}
299
Dana Zlotnik4cdd6b82021-10-07 15:31:54 +0300300size_t CpuActivationKernel::get_mws(const CPUInfo &platform, size_t thread_count) const
301{
Dana Zlotnikd7154db2021-11-10 11:50:58 +0200302 ARM_COMPUTE_UNUSED(thread_count);
Mohammed Suhail Munshi066607f2022-01-19 12:22:50 +0000303 ARM_COMPUTE_UNUSED(platform);
304
Mohammed Suhail Munshi8307ecf2022-11-09 15:38:54 +0000305 if(_split_dimension == Window::DimX)
306 {
307 // Don't split the work load too small if the tensor has been reinterpreted as 1D.
308 // This number is loosely chosen as threading overhead in each platform varies wildly.
309 return 1536;
310 }
311 return default_mws;
Dana Zlotnik4cdd6b82021-10-07 15:31:54 +0300312}
313
Georgios Pinitasf8f04422021-01-08 17:25:55 +0000314void CpuActivationKernel::run_op(ITensorPack &tensors, const Window &window, const ThreadInfo &info)
Anthony Barbier6ff3b192017-09-04 18:44:23 +0100315{
Georgios Pinitas48b3ef82019-10-14 19:03:09 +0100316 // Early exit on disabled activation
317 if(!_act_info.enabled())
318 {
319 return;
320 }
321
Moritz Pflanzerc186b572017-09-07 09:48:04 +0100322 ARM_COMPUTE_UNUSED(info);
Anthony Barbier6ff3b192017-09-04 18:44:23 +0100323 ARM_COMPUTE_ERROR_ON_UNCONFIGURED_KERNEL(this);
Gian Marco Iodiceb30dcc52017-06-20 09:07:21 +0100324 ARM_COMPUTE_ERROR_ON_INVALID_SUBWINDOW(IKernel::window(), window);
Anthony Barbier6ff3b192017-09-04 18:44:23 +0100325
Georgios Pinitas0499dff2020-07-31 22:21:38 +0100326 ARM_COMPUTE_ERROR_ON(tensors.empty());
Georgios Pinitas5fdde992021-06-25 05:42:57 +0100327 ARM_COMPUTE_ERROR_ON(_run_method == nullptr);
Georgios Pinitas1fd2c802020-06-16 17:44:46 +0100328
Michalis Spyrouc4d45552020-10-19 12:41:30 +0100329 const ITensor *src = tensors.get_const_tensor(TensorType::ACL_SRC);
330 ITensor *dst = tensors.get_tensor(TensorType::ACL_DST);
331
Georgios Pinitas5fdde992021-06-25 05:42:57 +0100332 _run_method(src, dst, _act_info, window);
Anthony Barbier6ff3b192017-09-04 18:44:23 +0100333}
Georgios Pinitasf8f04422021-01-08 17:25:55 +0000334
335const char *CpuActivationKernel::name() const
336{
Georgios Pinitas5fdde992021-06-25 05:42:57 +0100337 return _name.c_str();
Georgios Pinitasf8f04422021-01-08 17:25:55 +0000338}
Giorgio Arena5ae8d802021-11-18 18:02:13 +0000339
340const std::vector<CpuActivationKernel::ActivationKernel> &CpuActivationKernel::get_available_kernels()
341{
342 return available_kernels;
343}
Georgios Pinitasf8f04422021-01-08 17:25:55 +0000344} // namespace kernels
345} // namespace cpu
Michele Di Giorgiof9b595a2020-07-03 13:34:52 +0100346} // namespace arm_compute