blob: fd71f3ed4d0a7eff57610c54708f670007053249 [file] [log] [blame]
/*
 * Copyright (c) 2017-2020 Arm Limited.
 *
 * SPDX-License-Identifier: MIT
 *
 * Permission is hereby granted, free of charge, to any person obtaining a copy
 * of this software and associated documentation files (the "Software"), to
 * deal in the Software without restriction, including without limitation the
 * rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
 * sell copies of the Software, and to permit persons to whom the Software is
 * furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in all
 * copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
 * SOFTWARE.
 */
Michalis Spyrouf4643372019-11-29 16:17:13 +000024#ifndef ARM_COMPUTE_CLSOFTMAXLAYER_H
25#define ARM_COMPUTE_CLSOFTMAXLAYER_H
Anthony Barbier6ff3b192017-09-04 18:44:23 +010026
#include "arm_compute/core/CL/kernels/CLSoftmaxLayerKernel.h"
#include "arm_compute/runtime/CL/CLTensor.h"
#include "arm_compute/runtime/CL/functions/CLPermute.h"
#include "arm_compute/runtime/IFunction.h"
#include "arm_compute/runtime/IMemoryManager.h"
#include "arm_compute/runtime/MemoryGroup.h"

#include <cstdint>
#include <memory>
Anthony Barbier6ff3b192017-09-04 18:44:23 +010035
36namespace arm_compute
37{
38class ICLTensor;
39
40/** Basic function to compute a SoftmaxLayer.
41 *
42 * Softmax is calculated by :
Georgios Pinitas388d3ec2017-11-02 12:17:56 +000043 * @f[ out = exp((x - max(x)) * beta) / sum(exp((x - max(x)) * beta)) @f]
Anthony Barbier6ff3b192017-09-04 18:44:23 +010044 *
Sang-Hoon Park62eeb532019-10-29 13:13:19 +000045 * Log Softmax is calculated by :
Sang-Hoon Parka0205b92020-07-07 09:36:09 +010046 * @f[ out = (x - max(x) * beta) - log(\sum{e^{x - max(x) * beta}}) @f]
Sang-Hoon Park62eeb532019-10-29 13:13:19 +000047 *
Anthony Barbier6ff3b192017-09-04 18:44:23 +010048 * This function runs the following kernels:
SiCong Li96209c72020-08-21 12:28:30 +010049 * -# If axis is not 0:
50 * -# @ref CLPermute
Anthony Barbier6ff3b192017-09-04 18:44:23 +010051 * -# @ref CLLogits1DNormKernel
SiCong Li96209c72020-08-21 12:28:30 +010052 * -# @ref CLLogits1DMaxShiftExpSumKernel
Anthony Barbier6ff3b192017-09-04 18:44:23 +010053 */
Sang-Hoon Park62eeb532019-10-29 13:13:19 +000054template <bool IS_LOG = false>
55class CLSoftmaxLayerGeneric : public IFunction
Anthony Barbier6ff3b192017-09-04 18:44:23 +010056{
57public:
58 /** Constructor */
Sang-Hoon Park62eeb532019-10-29 13:13:19 +000059 CLSoftmaxLayerGeneric(std::shared_ptr<IMemoryManager> memory_manager = nullptr);
Anthony Barbier6ff3b192017-09-04 18:44:23 +010060 /** Set the input and output tensors.
61 *
morgolock9c7fed82020-08-05 12:30:56 +010062 * @param[in] input Source tensor. Data types supported: QASYMM8/QASYMM8_SIGNED/F16/F32 for Softmax and F16/F32 for Log Softmax
63 * @param[out] output Destination tensor. Data types supported: same as @p input
64 * @param[in] beta (Optional) A scaling factor for the exponent. Defaults to 1.f
SiCong Li96209c72020-08-21 12:28:30 +010065 * @param[in] axis (Optional) The dimension in which to apply the function. E.g. for input of shape 4x5x6 and
66 * axis=1, softmax will be applied to 4x6=24 vectors of size 5. Defaults to 0
Anthony Barbier6ff3b192017-09-04 18:44:23 +010067 */
SiCong Li96209c72020-08-21 12:28:30 +010068 void configure(const ICLTensor *input, ICLTensor *output, float beta = 1.0f, int32_t axis = 0);
Manuel Bottini2b84be52020-04-08 10:15:51 +010069 /** Set the input and output tensors.
70 *
71 * @param[in] compile_context The compile context to be used.
Michele Di Giorgiof6f78762020-07-06 11:27:21 +010072 * @param[in] input Source tensor. Data types supported: QASYMM8/QASYMM8_SIGNED/F16/F32 for Softmax and F16/F32 for Log Softmax
Manuel Bottini2b84be52020-04-08 10:15:51 +010073 * @param[out] output Destination tensor. Data types supported: same as @p input
74 * @param[in] beta (Optional) A scaling factor for the exponent. Defaults to 1.f
SiCong Li96209c72020-08-21 12:28:30 +010075 * @param[in] axis (Optional) The dimension in which to apply the function. E.g. for input of shape 4x5x6 and
76 * axis=1, softmax will be applied to 4x6=24 vectors of size 5. Defaults to 0
Manuel Bottini2b84be52020-04-08 10:15:51 +010077 */
SiCong Li96209c72020-08-21 12:28:30 +010078 void configure(const CLCompileContext &compile_context, const ICLTensor *input, ICLTensor *output, float beta = 1.0f, int32_t axis = 0);
Georgios Pinitas30902ed2017-11-14 15:32:57 +000079 /** Static function to check if given info will lead to a valid configuration of @ref CLSoftmaxLayer
80 *
morgolock9c7fed82020-08-05 12:30:56 +010081 * @param[in] input Source tensor. Data types supported: QASYMM8/QASYMM8_SIGNED/F16/F32 for Softmax and F16/F32 for Log Softmax
82 * @param[in] output Destination tensor. Data types supported: same as @p input
83 * @param[in] beta (Optional) A scaling factor for the exponent. Defaults to 1.f
SiCong Li96209c72020-08-21 12:28:30 +010084 * @param[in] axis (Optional) The dimension in which to apply the function. E.g. for input of shape 4x5x6 and
85 * axis=1, softmax will be applied to 4x6=24 vectors of size 5. Defaults to 0
morgolock9c7fed82020-08-05 12:30:56 +010086 *
Georgios Pinitas631c41a2017-12-06 11:53:03 +000087 * @return a status
Georgios Pinitas30902ed2017-11-14 15:32:57 +000088 */
SiCong Li96209c72020-08-21 12:28:30 +010089 static Status validate(const ITensorInfo *input, const ITensorInfo *output, float beta = 1.0f, int32_t axis = 0);
Anthony Barbier6ff3b192017-09-04 18:44:23 +010090
91 // Inherited methods overridden:
92 void run() override;
93
94private:
Georgios Pinitas26014cf2019-09-09 19:00:57 +010095 MemoryGroup _memory_group;
SiCong Li96209c72020-08-21 12:28:30 +010096 CLPermute _permute_input;
97 CLPermute _permute_output;
Chunosovd6afedc2017-11-06 22:09:45 +070098 CLLogits1DMaxShiftExpSumKernel _max_shift_exp_sum_kernel;
99 CLLogits1DNormKernel _norm_kernel;
100 CLTensor _max;
101 CLTensor _sum;
102 CLTensor _tmp;
SiCong Li96209c72020-08-21 12:28:30 +0100103 CLTensor _input_permuted;
104 CLTensor _output_permuted;
105 bool _needs_permute;
Anthony Barbier6ff3b192017-09-04 18:44:23 +0100106};
Sang-Hoon Park62eeb532019-10-29 13:13:19 +0000107
108using CLSoftmaxLayer = CLSoftmaxLayerGeneric<false>;
109using CLLogSoftmaxLayer = CLSoftmaxLayerGeneric<true>;
110} // namespace arm_compute
Michalis Spyrouf4643372019-11-29 16:17:13 +0000111#endif /* ARM_COMPUTE_CLSOFTMAXLAYER_H */