Eric Kunze | e5e2676 | 2020-10-13 16:11:07 -0700 | [diff] [blame] | 1 | |
Jerry Ge | 51bd4f5 | 2024-02-20 11:21:19 -0800 | [diff] [blame] | 2 | // Copyright (c) 2020-2024, ARM Limited. |
Eric Kunze | e5e2676 | 2020-10-13 16:11:07 -0700 | [diff] [blame] | 3 | // |
| 4 | // Licensed under the Apache License, Version 2.0 (the "License"); |
| 5 | // you may not use this file except in compliance with the License. |
| 6 | // You may obtain a copy of the License at |
| 7 | // |
| 8 | // http://www.apache.org/licenses/LICENSE-2.0 |
| 9 | // |
| 10 | // Unless required by applicable law or agreed to in writing, software |
| 11 | // distributed under the License is distributed on an "AS IS" BASIS, |
| 12 | // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| 13 | // See the License for the specific language governing permissions and |
| 14 | // limitations under the License. |
| 15 | |
| 16 | #include "ewise_unary.h" |
| 17 | #include "quant_util.h" |
| 18 | #include "template_types.h" |
| 19 | #include <cmath> |
| 20 | |
| 21 | using namespace TosaReference; |
| 22 | using namespace Eigen; |
| 23 | using namespace tosa; |
| 24 | |
Tai Ly | a4d748b | 2023-03-28 22:06:56 +0000 | [diff] [blame] | 25 | template <int Rank, TOSA_REF_TYPE Dtype> |
Kevin Cheng | acb550f | 2021-06-29 15:32:19 -0700 | [diff] [blame] | 26 | UnaryNode<Rank, Dtype>::UnaryNode(SubgraphTraverser* sgt_, const Op& op_, uint64_t id_) |
| 27 | : GraphNode(sgt_, op_, id_) |
Eric Kunze | e5e2676 | 2020-10-13 16:11:07 -0700 | [diff] [blame] | 28 | { |
| 29 | setRequiredOperands(1, 1); |
Eric Kunze | e5e2676 | 2020-10-13 16:11:07 -0700 | [diff] [blame] | 30 | |
Eric Kunze | b5fabec | 2022-06-07 05:20:44 +0000 | [diff] [blame] | 31 | fcn = [](InEigenType a) -> OutEigenType { |
| 32 | ASSERT_MSG(0, "In default UnaryNode function, missing function registration"); |
| 33 | return OutEigenType(); |
| 34 | }; |
Eric Kunze | e5e2676 | 2020-10-13 16:11:07 -0700 | [diff] [blame] | 35 | } |
| 36 | |
Tai Ly | a4d748b | 2023-03-28 22:06:56 +0000 | [diff] [blame] | 37 | template <int Rank, TOSA_REF_TYPE Dtype> |
Eric Kunze | e5e2676 | 2020-10-13 16:11:07 -0700 | [diff] [blame] | 38 | UnaryNode<Rank, Dtype>::~UnaryNode() |
| 39 | {} |
| 40 | |
Tai Ly | a4d748b | 2023-03-28 22:06:56 +0000 | [diff] [blame] | 41 | template <int Rank, TOSA_REF_TYPE Dtype> |
Eric Kunze | e5e2676 | 2020-10-13 16:11:07 -0700 | [diff] [blame] | 42 | int UnaryNode<Rank, Dtype>::checkTensorAttributes() |
| 43 | { |
Jerry Ge | a793f46 | 2023-04-11 00:05:02 +0000 | [diff] [blame] | 44 | // Check Tosa Level |
| 45 | auto tosa_level = g_func_config.tosa_level; |
| 46 | LEVEL_CHECK(Rank <= tosa_level.MAX_RANK, "Rank should be smaller than or equal to MAX_RANK"); |
| 47 | |
Eric Kunze | e5e2676 | 2020-10-13 16:11:07 -0700 | [diff] [blame] | 48 | if (validateRequiredOperands()) |
| 49 | return 1; |
| 50 | |
Eric Kunze | e5e2676 | 2020-10-13 16:11:07 -0700 | [diff] [blame] | 51 | // output and input must be the same types |
Kevin Cheng | c72b59c | 2021-09-29 16:57:55 -0700 | [diff] [blame] | 52 | if (inputs[0]->matchRankTypeShape(*outputs[0])) |
Eric Kunze | e5e2676 | 2020-10-13 16:11:07 -0700 | [diff] [blame] | 53 | { |
Kevin Cheng | c72b59c | 2021-09-29 16:57:55 -0700 | [diff] [blame] | 54 | printNodeValidationError("UnaryNode: input and output rank/type/shape must match"); |
Eric Kunze | e5e2676 | 2020-10-13 16:11:07 -0700 | [diff] [blame] | 55 | return 1; |
| 56 | } |
| 57 | |
| 58 | a = dynamic_cast<TosaReference::TensorTemplate<TIn>*>(inputs[0]); |
| 59 | result = dynamic_cast<TosaReference::TensorTemplate<TOut>*>(outputs[0]); |
| 60 | |
| 61 | ASSERT_MEM(a && result); |
| 62 | |
| 63 | return 0; |
| 64 | } |
| 65 | |
Tai Ly | a4d748b | 2023-03-28 22:06:56 +0000 | [diff] [blame] | 66 | template <int Rank, TOSA_REF_TYPE Dtype> |
Eric Kunze | e5e2676 | 2020-10-13 16:11:07 -0700 | [diff] [blame] | 67 | int UnaryNode<Rank, Dtype>::eval() |
| 68 | { |
Tai Ly | 5d0e9c7 | 2024-04-05 01:19:31 +0000 | [diff] [blame] | 69 | // call register_fcn() here to ensure inputs/outputs have been connected |
| 70 | // to the node by the time register_fcn() is called for Clamp Operator |
| 71 | if (register_fcn()) |
| 72 | { |
| 73 | return 1; |
| 74 | } |
| 75 | |
Eric Kunze | e5e2676 | 2020-10-13 16:11:07 -0700 | [diff] [blame] | 76 | this->result->getTensor() = this->a->getTensor().unaryExpr(this->fcn); |
| 77 | |
| 78 | return GraphNode::eval(); |
| 79 | } |
| 80 | |
Tai Ly | a4d748b | 2023-03-28 22:06:56 +0000 | [diff] [blame] | 81 | template <int Rank, TOSA_REF_TYPE Dtype> |
Eric Kunze | e5e2676 | 2020-10-13 16:11:07 -0700 | [diff] [blame] | 82 | int OpAbs<Rank, Dtype>::register_fcn() |
| 83 | { |
| 84 | switch (Dtype) |
| 85 | { |
Tai Ly | a4d748b | 2023-03-28 22:06:56 +0000 | [diff] [blame] | 86 | case TOSA_REF_TYPE_FP32: // No fpTrunc for FP32 as it is a no-op |
| 87 | case TOSA_REF_TYPE_FP64: |
| 88 | case TOSA_REF_TYPE_INT32: |
Eric Kunze | e5e2676 | 2020-10-13 16:11:07 -0700 | [diff] [blame] | 89 | this->fcn = [](InEigenType a) -> OutEigenType { return a > (InEigenType)0 ? a : (-a); }; |
| 90 | break; |
Tai Ly | a4d748b | 2023-03-28 22:06:56 +0000 | [diff] [blame] | 91 | case TOSA_REF_TYPE_FP16: |
| 92 | case TOSA_REF_TYPE_BF16: |
James Ward | 24dbc42 | 2022-10-19 12:20:31 +0100 | [diff] [blame] | 93 | this->fcn = [](InEigenType a) -> OutEigenType { return fpTrunc<Dtype>(a > (InEigenType)0 ? a : (-a)); }; |
| 94 | break; |
Eric Kunze | e5e2676 | 2020-10-13 16:11:07 -0700 | [diff] [blame] | 95 | default: |
Tai Ly | a4d748b | 2023-03-28 22:06:56 +0000 | [diff] [blame] | 96 | ERROR_IF(true, "unsupported TOSA_REF_TYPE %s", EnumNameTOSAREFTYPE(Dtype)); |
Eric Kunze | e5e2676 | 2020-10-13 16:11:07 -0700 | [diff] [blame] | 97 | } |
| 98 | |
| 99 | return 0; |
| 100 | } |
| 101 | |
Tai Ly | a4d748b | 2023-03-28 22:06:56 +0000 | [diff] [blame] | 102 | template <int Rank, TOSA_REF_TYPE Dtype> |
Eric Kunze | e5e2676 | 2020-10-13 16:11:07 -0700 | [diff] [blame] | 103 | int OpBitwiseNot<Rank, Dtype>::register_fcn() |
| 104 | { |
| 105 | switch (Dtype) |
| 106 | { |
Tai Ly | a4d748b | 2023-03-28 22:06:56 +0000 | [diff] [blame] | 107 | case TOSA_REF_TYPE_INT8: |
| 108 | case TOSA_REF_TYPE_INT16: |
| 109 | case TOSA_REF_TYPE_INT32: |
Eric Kunze | e5e2676 | 2020-10-13 16:11:07 -0700 | [diff] [blame] | 110 | this->fcn = [](InEigenType a) -> OutEigenType { return ~a; }; |
| 111 | break; |
| 112 | default: |
Tai Ly | a4d748b | 2023-03-28 22:06:56 +0000 | [diff] [blame] | 113 | ERROR_IF(true, "unsupported TOSA_REF_TYPE %s", EnumNameTOSAREFTYPE(Dtype)); |
Eric Kunze | e5e2676 | 2020-10-13 16:11:07 -0700 | [diff] [blame] | 114 | } |
| 115 | |
| 116 | return 0; |
| 117 | } |
| 118 | |
Tai Ly | a4d748b | 2023-03-28 22:06:56 +0000 | [diff] [blame] | 119 | template <int Rank, TOSA_REF_TYPE Dtype> |
Eric Kunze | e5e2676 | 2020-10-13 16:11:07 -0700 | [diff] [blame] | 120 | int OpCeil<Rank, Dtype>::register_fcn() |
| 121 | { |
| 122 | switch (Dtype) |
| 123 | { |
Tai Ly | a4d748b | 2023-03-28 22:06:56 +0000 | [diff] [blame] | 124 | case TOSA_REF_TYPE_FP16: |
| 125 | case TOSA_REF_TYPE_BF16: |
| 126 | case TOSA_REF_TYPE_FP32: |
James Ward | 24dbc42 | 2022-10-19 12:20:31 +0100 | [diff] [blame] | 127 | this->fcn = [](InEigenType a) -> OutEigenType { return fpTrunc<Dtype>(ceilf(a)); }; |
Eric Kunze | e5e2676 | 2020-10-13 16:11:07 -0700 | [diff] [blame] | 128 | break; |
Tai Ly | a4d748b | 2023-03-28 22:06:56 +0000 | [diff] [blame] | 129 | case TOSA_REF_TYPE_FP64: |
| 130 | this->fcn = [](InEigenType a) -> OutEigenType { return ceil(a); }; |
| 131 | break; |
Eric Kunze | e5e2676 | 2020-10-13 16:11:07 -0700 | [diff] [blame] | 132 | default: |
Tai Ly | a4d748b | 2023-03-28 22:06:56 +0000 | [diff] [blame] | 133 | ERROR_IF(true, "unsupported TOSA_REF_TYPE %s", EnumNameTOSAREFTYPE(Dtype)); |
Eric Kunze | e5e2676 | 2020-10-13 16:11:07 -0700 | [diff] [blame] | 134 | } |
| 135 | |
| 136 | return 0; |
| 137 | } |
| 138 | |
Tai Ly | a4d748b | 2023-03-28 22:06:56 +0000 | [diff] [blame] | 139 | template <int Rank, TOSA_REF_TYPE Dtype> |
Eric Kunze | e5e2676 | 2020-10-13 16:11:07 -0700 | [diff] [blame] | 140 | int OpClz<Rank, Dtype>::register_fcn() |
| 141 | { |
| 142 | int32_t num_bits; |
| 143 | switch (Dtype) |
| 144 | { |
Tai Ly | a4d748b | 2023-03-28 22:06:56 +0000 | [diff] [blame] | 145 | case TOSA_REF_TYPE_INT32: |
Eric Kunze | e5e2676 | 2020-10-13 16:11:07 -0700 | [diff] [blame] | 146 | num_bits = 32; |
| 147 | break; |
| 148 | default: |
Tai Ly | a4d748b | 2023-03-28 22:06:56 +0000 | [diff] [blame] | 149 | ERROR_IF(true, "unsupported TOSA_REF_TYPE %s", EnumNameTOSAREFTYPE(Dtype)); |
Eric Kunze | e5e2676 | 2020-10-13 16:11:07 -0700 | [diff] [blame] | 150 | } |
| 151 | |
| 152 | this->fcn = [num_bits](int32_t a) -> int32_t { |
| 153 | int32_t leading_zeros = 0; |
| 154 | for (int bit = num_bits - 1; bit >= 0; bit--) |
| 155 | { |
| 156 | if (((a >> bit) & 0x1) == 0) |
| 157 | { |
| 158 | leading_zeros++; |
| 159 | } |
| 160 | else |
| 161 | { |
| 162 | break; |
| 163 | } |
| 164 | } |
| 165 | return leading_zeros; |
| 166 | }; |
| 167 | |
| 168 | return 0; |
| 169 | } |
| 170 | |
Tai Ly | a4d748b | 2023-03-28 22:06:56 +0000 | [diff] [blame] | 171 | template <int Rank, TOSA_REF_TYPE Dtype> |
Jerry Ge | 51bd4f5 | 2024-02-20 11:21:19 -0800 | [diff] [blame] | 172 | int OpCos<Rank, Dtype>::register_fcn() |
| 173 | { |
| 174 | switch (Dtype) |
| 175 | { |
| 176 | case TOSA_REF_TYPE_FP16: |
| 177 | case TOSA_REF_TYPE_BF16: |
| 178 | case TOSA_REF_TYPE_FP32: |
| 179 | this->fcn = [](InEigenType a) -> OutEigenType { return fpTrunc<Dtype>(cos(a)); }; |
| 180 | break; |
| 181 | case TOSA_REF_TYPE_FP64: |
| 182 | if (g_func_config.abs_mode) |
| 183 | { |
Jeremy Johnson | 1eb1455 | 2024-04-11 16:21:54 +0100 | [diff] [blame^] | 184 | // ABS_ERROR bounds return |
| 185 | this->fcn = [](InEigenType a) -> OutEigenType { return a; }; |
Jerry Ge | 51bd4f5 | 2024-02-20 11:21:19 -0800 | [diff] [blame] | 186 | } |
| 187 | else |
| 188 | { |
| 189 | this->fcn = [](InEigenType a) -> OutEigenType { return cos(a); }; |
| 190 | }; |
| 191 | break; |
| 192 | default: |
| 193 | ERROR_IF(true, "unsupported TOSA_REF_TYPE %s", EnumNameTOSAREFTYPE(Dtype)); |
| 194 | } |
| 195 | |
| 196 | return 0; |
| 197 | } |
| 198 | |
| 199 | template <int Rank, TOSA_REF_TYPE Dtype> |
Eric Kunze | e5e2676 | 2020-10-13 16:11:07 -0700 | [diff] [blame] | 200 | int OpExp<Rank, Dtype>::register_fcn() |
| 201 | { |
| 202 | switch (Dtype) |
| 203 | { |
Tai Ly | a4d748b | 2023-03-28 22:06:56 +0000 | [diff] [blame] | 204 | case TOSA_REF_TYPE_FP16: |
| 205 | case TOSA_REF_TYPE_BF16: |
| 206 | case TOSA_REF_TYPE_FP32: |
James Ward | 24dbc42 | 2022-10-19 12:20:31 +0100 | [diff] [blame] | 207 | this->fcn = [](InEigenType a) -> OutEigenType { return fpTrunc<Dtype>(expf(a)); }; |
Eric Kunze | e5e2676 | 2020-10-13 16:11:07 -0700 | [diff] [blame] | 208 | break; |
Tai Ly | a4d748b | 2023-03-28 22:06:56 +0000 | [diff] [blame] | 209 | case TOSA_REF_TYPE_FP64: |
Jeremy Johnson | 9a75838 | 2023-11-07 16:27:35 +0000 | [diff] [blame] | 210 | if (g_func_config.abs_mode) |
| 211 | { |
| 212 | // ABS_ERROR bounds return (1+abs(a)) |
| 213 | this->fcn = [](InEigenType a) -> OutEigenType { return 1.0 + (a > (InEigenType)0 ? a : (-a)); }; |
| 214 | } |
| 215 | else |
| 216 | { |
| 217 | this->fcn = [](InEigenType a) -> OutEigenType { return exp(a); }; |
| 218 | } |
Tai Ly | a4d748b | 2023-03-28 22:06:56 +0000 | [diff] [blame] | 219 | break; |
Eric Kunze | e5e2676 | 2020-10-13 16:11:07 -0700 | [diff] [blame] | 220 | default: |
Tai Ly | a4d748b | 2023-03-28 22:06:56 +0000 | [diff] [blame] | 221 | ERROR_IF(true, "unsupported TOSA_REF_TYPE %s", EnumNameTOSAREFTYPE(Dtype)); |
Eric Kunze | e5e2676 | 2020-10-13 16:11:07 -0700 | [diff] [blame] | 222 | } |
| 223 | |
| 224 | return 0; |
| 225 | } |
| 226 | |
Tai Ly | a4d748b | 2023-03-28 22:06:56 +0000 | [diff] [blame] | 227 | template <int Rank, TOSA_REF_TYPE Dtype> |
Eric Kunze | e5e2676 | 2020-10-13 16:11:07 -0700 | [diff] [blame] | 228 | int OpFloor<Rank, Dtype>::register_fcn() |
| 229 | { |
| 230 | switch (Dtype) |
| 231 | { |
Tai Ly | a4d748b | 2023-03-28 22:06:56 +0000 | [diff] [blame] | 232 | case TOSA_REF_TYPE_FP16: |
| 233 | case TOSA_REF_TYPE_BF16: |
| 234 | case TOSA_REF_TYPE_FP32: |
James Ward | 24dbc42 | 2022-10-19 12:20:31 +0100 | [diff] [blame] | 235 | this->fcn = [](InEigenType a) -> OutEigenType { return fpTrunc<Dtype>(floorf(a)); }; |
Eric Kunze | e5e2676 | 2020-10-13 16:11:07 -0700 | [diff] [blame] | 236 | break; |
Tai Ly | a4d748b | 2023-03-28 22:06:56 +0000 | [diff] [blame] | 237 | case TOSA_REF_TYPE_FP64: |
| 238 | this->fcn = [](InEigenType a) -> OutEigenType { return floor(a); }; |
| 239 | break; |
Eric Kunze | e5e2676 | 2020-10-13 16:11:07 -0700 | [diff] [blame] | 240 | default: |
Tai Ly | a4d748b | 2023-03-28 22:06:56 +0000 | [diff] [blame] | 241 | ERROR_IF(true, "unsupported TOSA_REF_TYPE %s", EnumNameTOSAREFTYPE(Dtype)); |
Eric Kunze | e5e2676 | 2020-10-13 16:11:07 -0700 | [diff] [blame] | 242 | } |
| 243 | |
| 244 | return 0; |
| 245 | } |
| 246 | |
Tai Ly | a4d748b | 2023-03-28 22:06:56 +0000 | [diff] [blame] | 247 | template <int Rank, TOSA_REF_TYPE Dtype> |
Eric Kunze | e5e2676 | 2020-10-13 16:11:07 -0700 | [diff] [blame] | 248 | int OpLog<Rank, Dtype>::register_fcn() |
| 249 | { |
| 250 | switch (Dtype) |
| 251 | { |
Tai Ly | a4d748b | 2023-03-28 22:06:56 +0000 | [diff] [blame] | 252 | case TOSA_REF_TYPE_FP16: |
| 253 | case TOSA_REF_TYPE_BF16: |
| 254 | case TOSA_REF_TYPE_FP32: |
James Ward | 24dbc42 | 2022-10-19 12:20:31 +0100 | [diff] [blame] | 255 | this->fcn = [](InEigenType a) -> OutEigenType { return fpTrunc<Dtype>(logf(a)); }; |
Eric Kunze | e5e2676 | 2020-10-13 16:11:07 -0700 | [diff] [blame] | 256 | break; |
Tai Ly | a4d748b | 2023-03-28 22:06:56 +0000 | [diff] [blame] | 257 | case TOSA_REF_TYPE_FP64: |
| 258 | this->fcn = [](InEigenType a) -> OutEigenType { return log(a); }; |
| 259 | break; |
Eric Kunze | e5e2676 | 2020-10-13 16:11:07 -0700 | [diff] [blame] | 260 | default: |
Tai Ly | a4d748b | 2023-03-28 22:06:56 +0000 | [diff] [blame] | 261 | ERROR_IF(true, "unsupported TOSA_REF_TYPE %s", EnumNameTOSAREFTYPE(Dtype)); |
Eric Kunze | e5e2676 | 2020-10-13 16:11:07 -0700 | [diff] [blame] | 262 | } |
| 263 | |
| 264 | return 0; |
| 265 | } |
| 266 | |
Tai Ly | a4d748b | 2023-03-28 22:06:56 +0000 | [diff] [blame] | 267 | template <int Rank, TOSA_REF_TYPE Dtype> |
Eric Kunze | e5e2676 | 2020-10-13 16:11:07 -0700 | [diff] [blame] | 268 | int OpLogicalNot<Rank, Dtype>::register_fcn() |
| 269 | { |
| 270 | switch (Dtype) |
| 271 | { |
Tai Ly | a4d748b | 2023-03-28 22:06:56 +0000 | [diff] [blame] | 272 | case TOSA_REF_TYPE_BOOL: |
Eric Kunze | e5e2676 | 2020-10-13 16:11:07 -0700 | [diff] [blame] | 273 | this->fcn = [](InEigenType a) -> OutEigenType { return !a; }; |
| 274 | break; |
| 275 | default: |
Tai Ly | a4d748b | 2023-03-28 22:06:56 +0000 | [diff] [blame] | 276 | ERROR_IF(true, "unsupported TOSA_REF_TYPE %s", EnumNameTOSAREFTYPE(Dtype)); |
Eric Kunze | e5e2676 | 2020-10-13 16:11:07 -0700 | [diff] [blame] | 277 | } |
| 278 | |
| 279 | return 0; |
| 280 | } |
| 281 | |
Tai Ly | a4d748b | 2023-03-28 22:06:56 +0000 | [diff] [blame] | 282 | template <int Rank, TOSA_REF_TYPE Dtype> |
Jerry Ge | 9c9c8da | 2023-07-19 23:08:16 +0000 | [diff] [blame] | 283 | OpNegate<Rank, Dtype>::OpNegate(SubgraphTraverser* sgt_, TosaAttributeBase* attribute_, uint64_t id_) |
Eric Kunze | b5fabec | 2022-06-07 05:20:44 +0000 | [diff] [blame] | 284 | : UnaryNode<Rank, Dtype>(sgt_, Op_NEGATE, id_) |
| 285 | { |
| 286 | INIT_ATTRIBUTE(Negate); |
| 287 | |
| 288 | register_fcn(); |
| 289 | } |
| 290 | |
Tai Ly | a4d748b | 2023-03-28 22:06:56 +0000 | [diff] [blame] | 291 | template <int Rank, TOSA_REF_TYPE Dtype> |
Eric Kunze | b5fabec | 2022-06-07 05:20:44 +0000 | [diff] [blame] | 292 | OpNegate<Rank, Dtype>::~OpNegate() |
| 293 | { |
| 294 | if (attribute) |
| 295 | delete attribute; |
| 296 | } |
| 297 | |
Tai Ly | a4d748b | 2023-03-28 22:06:56 +0000 | [diff] [blame] | 298 | template <int Rank, TOSA_REF_TYPE Dtype> |
Eric Kunze | e5e2676 | 2020-10-13 16:11:07 -0700 | [diff] [blame] | 299 | int OpNegate<Rank, Dtype>::register_fcn() |
| 300 | { |
Tai Ly | a4d748b | 2023-03-28 22:06:56 +0000 | [diff] [blame] | 301 | ERROR_IF(Dtype != TOSA_REF_TYPE_INT8 && attribute->input1_zp() != 0, "OpNegate: zeropoint only for int8_t"); |
| 302 | ERROR_IF(Dtype != TOSA_REF_TYPE_INT8 && attribute->output_zp() != 0, "OpNegate: zeropoint only for int8_t"); |
Kevin Cheng | acb550f | 2021-06-29 15:32:19 -0700 | [diff] [blame] | 303 | |
Eric Kunze | e5e2676 | 2020-10-13 16:11:07 -0700 | [diff] [blame] | 304 | switch (Dtype) |
| 305 | { |
Tai Ly | a4d748b | 2023-03-28 22:06:56 +0000 | [diff] [blame] | 306 | case TOSA_REF_TYPE_FP16: |
| 307 | case TOSA_REF_TYPE_BF16: |
| 308 | case TOSA_REF_TYPE_FP32: |
Eric Kunze | e5e2676 | 2020-10-13 16:11:07 -0700 | [diff] [blame] | 309 | this->fcn = [](InEigenType a) -> OutEigenType { |
| 310 | InEigenType result = -(a); |
James Ward | 24dbc42 | 2022-10-19 12:20:31 +0100 | [diff] [blame] | 311 | return fpTrunc<Dtype>(result); |
Eric Kunze | e5e2676 | 2020-10-13 16:11:07 -0700 | [diff] [blame] | 312 | }; |
| 313 | break; |
Tai Ly | a4d748b | 2023-03-28 22:06:56 +0000 | [diff] [blame] | 314 | case TOSA_REF_TYPE_FP64: |
| 315 | this->fcn = [](InEigenType a) -> OutEigenType { |
| 316 | OutEigenType result = -(a); |
| 317 | return result; |
| 318 | }; |
| 319 | break; |
| 320 | case TOSA_REF_TYPE_INT16: |
| 321 | case TOSA_REF_TYPE_INT32: |
Jeremy Johnson | 81ee53d | 2022-03-23 15:32:34 +0000 | [diff] [blame] | 322 | this->fcn = [this](InEigenType a) -> OutEigenType { |
Jerry Ge | 9c9c8da | 2023-07-19 23:08:16 +0000 | [diff] [blame] | 323 | int64_t res_in_64 = 0L - a; |
Jeremy Johnson | 0e46364 | 2022-05-03 12:10:23 +0100 | [diff] [blame] | 324 | int64_t i32_max_in_64 = static_cast<int64_t>(std::numeric_limits<int32_t>::max()); |
| 325 | int64_t i32_min_in_64 = static_cast<int64_t>(std::numeric_limits<int32_t>::min()); |
Jerry Ge | 9c9c8da | 2023-07-19 23:08:16 +0000 | [diff] [blame] | 326 | REQUIRE(res_in_64 <= i32_max_in_64 && res_in_64 >= i32_min_in_64, |
| 327 | "OpNegate: result not in acc type range (int32)"); |
Jeremy Johnson | 0e46364 | 2022-05-03 12:10:23 +0100 | [diff] [blame] | 328 | |
| 329 | int64_t max_clip_in_64, min_clip_in_64; |
Tai Ly | a4d748b | 2023-03-28 22:06:56 +0000 | [diff] [blame] | 330 | if (Dtype == TOSA_REF_TYPE_INT16) |
Jeremy Johnson | 0e46364 | 2022-05-03 12:10:23 +0100 | [diff] [blame] | 331 | { |
| 332 | max_clip_in_64 = static_cast<int64_t>(std::numeric_limits<int16_t>::max()); |
| 333 | min_clip_in_64 = static_cast<int64_t>(std::numeric_limits<int16_t>::min()); |
Jeremy Johnson | 81ee53d | 2022-03-23 15:32:34 +0000 | [diff] [blame] | 334 | } |
| 335 | else |
| 336 | { |
Jeremy Johnson | 0e46364 | 2022-05-03 12:10:23 +0100 | [diff] [blame] | 337 | max_clip_in_64 = i32_max_in_64; |
| 338 | min_clip_in_64 = i32_min_in_64; |
Jeremy Johnson | 81ee53d | 2022-03-23 15:32:34 +0000 | [diff] [blame] | 339 | } |
Jerry Ge | 9c9c8da | 2023-07-19 23:08:16 +0000 | [diff] [blame] | 340 | return static_cast<InEigenType>( |
| 341 | std::min<int64_t>(max_clip_in_64, std::max<int64_t>(min_clip_in_64, res_in_64))); |
Eric Kunze | e5e2676 | 2020-10-13 16:11:07 -0700 | [diff] [blame] | 342 | }; |
| 343 | break; |
Tai Ly | a4d748b | 2023-03-28 22:06:56 +0000 | [diff] [blame] | 344 | case TOSA_REF_TYPE_INT8: |
Eric Kunze | e5e2676 | 2020-10-13 16:11:07 -0700 | [diff] [blame] | 345 | this->fcn = [this](InEigenType a) -> OutEigenType { |
Jerry Ge | 9c9c8da | 2023-07-19 23:08:16 +0000 | [diff] [blame] | 346 | int64_t res_in_64 = 0 - (a - attribute->input1_zp()); |
Jeremy Johnson | 0e46364 | 2022-05-03 12:10:23 +0100 | [diff] [blame] | 347 | int64_t i32_max_in_64 = static_cast<int64_t>(std::numeric_limits<int32_t>::max()); |
| 348 | int64_t i32_min_in_64 = static_cast<int64_t>(std::numeric_limits<int32_t>::min()); |
Jerry Ge | 9c9c8da | 2023-07-19 23:08:16 +0000 | [diff] [blame] | 349 | REQUIRE(res_in_64 <= i32_max_in_64 && res_in_64 >= i32_min_in_64, |
| 350 | "OpNegate: result not in acc type range (int32)"); |
Eric Kunze | b5fabec | 2022-06-07 05:20:44 +0000 | [diff] [blame] | 351 | res_in_64 += attribute->output_zp(); |
Jerry Ge | 9c9c8da | 2023-07-19 23:08:16 +0000 | [diff] [blame] | 352 | InEigenType result = static_cast<InEigenType>( |
| 353 | std::min(std::max(res_in_64, static_cast<int64_t>(QMin)), static_cast<int64_t>(QMax))); |
Eric Kunze | e5e2676 | 2020-10-13 16:11:07 -0700 | [diff] [blame] | 354 | return result; |
| 355 | }; |
| 356 | break; |
| 357 | default: |
Tai Ly | a4d748b | 2023-03-28 22:06:56 +0000 | [diff] [blame] | 358 | ERROR_IF(true, "unsupported TOSA_REF_TYPE %s", EnumNameTOSAREFTYPE(Dtype)); |
Eric Kunze | e5e2676 | 2020-10-13 16:11:07 -0700 | [diff] [blame] | 359 | } |
| 360 | |
| 361 | return 0; |
| 362 | } |
| 363 | |
Tai Ly | a4d748b | 2023-03-28 22:06:56 +0000 | [diff] [blame] | 364 | template <int Rank, TOSA_REF_TYPE Dtype> |
Eric Kunze | e5e2676 | 2020-10-13 16:11:07 -0700 | [diff] [blame] | 365 | int OpReciprocal<Rank, Dtype>::register_fcn() |
| 366 | { |
| 367 | switch (Dtype) |
| 368 | { |
Tai Ly | a4d748b | 2023-03-28 22:06:56 +0000 | [diff] [blame] | 369 | case TOSA_REF_TYPE_FP16: |
| 370 | case TOSA_REF_TYPE_BF16: |
| 371 | case TOSA_REF_TYPE_FP32: |
James Ward | 24dbc42 | 2022-10-19 12:20:31 +0100 | [diff] [blame] | 372 | this->fcn = [](InEigenType a) -> OutEigenType { return fpTrunc<Dtype>(1.0 / a); }; |
Eric Kunze | e5e2676 | 2020-10-13 16:11:07 -0700 | [diff] [blame] | 373 | break; |
Tai Ly | a4d748b | 2023-03-28 22:06:56 +0000 | [diff] [blame] | 374 | case TOSA_REF_TYPE_FP64: |
| 375 | this->fcn = [](InEigenType a) -> OutEigenType { return (1.0L / a); }; |
| 376 | break; |
Eric Kunze | e5e2676 | 2020-10-13 16:11:07 -0700 | [diff] [blame] | 377 | default: |
Tai Ly | a4d748b | 2023-03-28 22:06:56 +0000 | [diff] [blame] | 378 | ERROR_IF(true, "unsupported TOSA_REF_TYPE %s", EnumNameTOSAREFTYPE(Dtype)); |
Eric Kunze | e5e2676 | 2020-10-13 16:11:07 -0700 | [diff] [blame] | 379 | } |
| 380 | |
| 381 | return 0; |
| 382 | } |
| 383 | |
Tai Ly | a4d748b | 2023-03-28 22:06:56 +0000 | [diff] [blame] | 384 | template <int Rank, TOSA_REF_TYPE Dtype> |
Eric Kunze | e5e2676 | 2020-10-13 16:11:07 -0700 | [diff] [blame] | 385 | int OpRsqrt<Rank, Dtype>::register_fcn() |
| 386 | { |
| 387 | switch (Dtype) |
| 388 | { |
Tai Ly | a4d748b | 2023-03-28 22:06:56 +0000 | [diff] [blame] | 389 | case TOSA_REF_TYPE_FP16: |
| 390 | case TOSA_REF_TYPE_BF16: |
| 391 | case TOSA_REF_TYPE_FP32: |
James Ward | 24dbc42 | 2022-10-19 12:20:31 +0100 | [diff] [blame] | 392 | this->fcn = [](InEigenType a) -> OutEigenType { return fpTrunc<Dtype>(1.0 / sqrtf(a)); }; |
Eric Kunze | e5e2676 | 2020-10-13 16:11:07 -0700 | [diff] [blame] | 393 | break; |
Tai Ly | a4d748b | 2023-03-28 22:06:56 +0000 | [diff] [blame] | 394 | case TOSA_REF_TYPE_FP64: |
| 395 | this->fcn = [](InEigenType a) -> OutEigenType { return (1.0L / sqrt(a)); }; |
| 396 | break; |
Eric Kunze | e5e2676 | 2020-10-13 16:11:07 -0700 | [diff] [blame] | 397 | default: |
Tai Ly | a4d748b | 2023-03-28 22:06:56 +0000 | [diff] [blame] | 398 | ERROR_IF(true, "unsupported TOSA_REF_TYPE %s", EnumNameTOSAREFTYPE(Dtype)); |
Eric Kunze | e5e2676 | 2020-10-13 16:11:07 -0700 | [diff] [blame] | 399 | } |
| 400 | |
| 401 | return 0; |
| 402 | } |
| 403 | |
Jerry Ge | 51bd4f5 | 2024-02-20 11:21:19 -0800 | [diff] [blame] | 404 | template <int Rank, TOSA_REF_TYPE Dtype> |
| 405 | int OpSin<Rank, Dtype>::register_fcn() |
| 406 | { |
| 407 | switch (Dtype) |
| 408 | { |
| 409 | case TOSA_REF_TYPE_FP16: |
| 410 | case TOSA_REF_TYPE_BF16: |
| 411 | case TOSA_REF_TYPE_FP32: |
| 412 | this->fcn = [](InEigenType a) -> OutEigenType { return fpTrunc<Dtype>(sin(a)); }; |
| 413 | break; |
| 414 | case TOSA_REF_TYPE_FP64: |
| 415 | if (g_func_config.abs_mode) |
| 416 | { |
Jeremy Johnson | 1eb1455 | 2024-04-11 16:21:54 +0100 | [diff] [blame^] | 417 | // ABS_ERROR bounds return |
| 418 | this->fcn = [](InEigenType a) -> OutEigenType { return a; }; |
Jerry Ge | 51bd4f5 | 2024-02-20 11:21:19 -0800 | [diff] [blame] | 419 | } |
| 420 | else |
| 421 | { |
| 422 | this->fcn = [](InEigenType a) -> OutEigenType { return sin(a); }; |
| 423 | }; |
| 424 | break; |
| 425 | default: |
| 426 | ERROR_IF(true, "unsupported TOSA_REF_TYPE %s", EnumNameTOSAREFTYPE(Dtype)); |
| 427 | } |
| 428 | |
| 429 | return 0; |
| 430 | } |
| 431 | |
Eric Kunze | e5e2676 | 2020-10-13 16:11:07 -0700 | [diff] [blame] | 432 | // template explicit instantiation |
Jared Smolens | 98c281f | 2022-12-20 15:09:25 -0800 | [diff] [blame] | 433 | DEF_INSTANTIATE_RANK0_6_ONE_RANK_ONE_TYPE(UnaryNode, BOOL); |
| 434 | DEF_INSTANTIATE_RANK0_6_ONE_RANK_ONE_TYPE(UnaryNode, FP16); |
| 435 | DEF_INSTANTIATE_RANK0_6_ONE_RANK_ONE_TYPE(UnaryNode, BF16); |
| 436 | DEF_INSTANTIATE_RANK0_6_ONE_RANK_ONE_TYPE(UnaryNode, FP32); |
| 437 | DEF_INSTANTIATE_RANK0_6_ONE_RANK_ONE_TYPE(UnaryNode, INT8); |
| 438 | DEF_INSTANTIATE_RANK0_6_ONE_RANK_ONE_TYPE(UnaryNode, INT16); |
| 439 | DEF_INSTANTIATE_RANK0_6_ONE_RANK_ONE_TYPE(UnaryNode, INT32); |
Tai Ly | a4d748b | 2023-03-28 22:06:56 +0000 | [diff] [blame] | 440 | DEF_INSTANTIATE_RANK0_6_ONE_RANK_ONE_TYPE(UnaryNode, FP64); |
Jared Smolens | 98c281f | 2022-12-20 15:09:25 -0800 | [diff] [blame] | 441 | |
James Ward | 8b39043 | 2022-08-12 20:48:56 +0100 | [diff] [blame] | 442 | DEF_INSTANTIATE_RANK0_6_ONE_RANK_ONE_TYPE(OpAbs, FP16); |
James Ward | 24dbc42 | 2022-10-19 12:20:31 +0100 | [diff] [blame] | 443 | DEF_INSTANTIATE_RANK0_6_ONE_RANK_ONE_TYPE(OpAbs, BF16); |
Jeremy Johnson | bc2a3db | 2022-09-27 13:50:00 +0100 | [diff] [blame] | 444 | DEF_INSTANTIATE_RANK0_6_ONE_RANK_ONE_TYPE(OpAbs, FP32); |
Eric Kunze | e5e2676 | 2020-10-13 16:11:07 -0700 | [diff] [blame] | 445 | DEF_INSTANTIATE_RANK0_6_ONE_RANK_ONE_TYPE(OpAbs, INT32); |
Tai Ly | a4d748b | 2023-03-28 22:06:56 +0000 | [diff] [blame] | 446 | DEF_INSTANTIATE_RANK0_6_ONE_RANK_ONE_TYPE(OpAbs, FP64); |
Eric Kunze | e5e2676 | 2020-10-13 16:11:07 -0700 | [diff] [blame] | 447 | |
Kevin Cheng | 3a47857 | 2021-01-22 17:21:02 -0800 | [diff] [blame] | 448 | DEF_INSTANTIATE_RANK0_6_ONE_RANK_ONE_TYPE(OpBitwiseNot, INT8); |
Eric Kunze | e5e2676 | 2020-10-13 16:11:07 -0700 | [diff] [blame] | 449 | DEF_INSTANTIATE_RANK0_6_ONE_RANK_ONE_TYPE(OpBitwiseNot, INT16); |
| 450 | DEF_INSTANTIATE_RANK0_6_ONE_RANK_ONE_TYPE(OpBitwiseNot, INT32); |
| 451 | |
James Ward | 8b39043 | 2022-08-12 20:48:56 +0100 | [diff] [blame] | 452 | DEF_INSTANTIATE_RANK0_6_ONE_RANK_ONE_TYPE(OpCeil, FP16); |
James Ward | 24dbc42 | 2022-10-19 12:20:31 +0100 | [diff] [blame] | 453 | DEF_INSTANTIATE_RANK0_6_ONE_RANK_ONE_TYPE(OpCeil, BF16); |
Jeremy Johnson | bc2a3db | 2022-09-27 13:50:00 +0100 | [diff] [blame] | 454 | DEF_INSTANTIATE_RANK0_6_ONE_RANK_ONE_TYPE(OpCeil, FP32); |
Tai Ly | a4d748b | 2023-03-28 22:06:56 +0000 | [diff] [blame] | 455 | DEF_INSTANTIATE_RANK0_6_ONE_RANK_ONE_TYPE(OpCeil, FP64); |
Eric Kunze | e5e2676 | 2020-10-13 16:11:07 -0700 | [diff] [blame] | 456 | |
| 457 | DEF_INSTANTIATE_RANK0_6_ONE_RANK_ONE_TYPE(OpClz, INT32); |
| 458 | |
Jerry Ge | 51bd4f5 | 2024-02-20 11:21:19 -0800 | [diff] [blame] | 459 | DEF_INSTANTIATE_RANK0_6_ONE_RANK_ONE_TYPE(OpCos, FP16); |
| 460 | DEF_INSTANTIATE_RANK0_6_ONE_RANK_ONE_TYPE(OpCos, BF16); |
| 461 | DEF_INSTANTIATE_RANK0_6_ONE_RANK_ONE_TYPE(OpCos, FP32); |
| 462 | DEF_INSTANTIATE_RANK0_6_ONE_RANK_ONE_TYPE(OpCos, FP64); |
| 463 | |
James Ward | 8b39043 | 2022-08-12 20:48:56 +0100 | [diff] [blame] | 464 | DEF_INSTANTIATE_RANK0_6_ONE_RANK_ONE_TYPE(OpExp, FP16); |
James Ward | 24dbc42 | 2022-10-19 12:20:31 +0100 | [diff] [blame] | 465 | DEF_INSTANTIATE_RANK0_6_ONE_RANK_ONE_TYPE(OpExp, BF16); |
Jeremy Johnson | bc2a3db | 2022-09-27 13:50:00 +0100 | [diff] [blame] | 466 | DEF_INSTANTIATE_RANK0_6_ONE_RANK_ONE_TYPE(OpExp, FP32); |
Tai Ly | a4d748b | 2023-03-28 22:06:56 +0000 | [diff] [blame] | 467 | DEF_INSTANTIATE_RANK0_6_ONE_RANK_ONE_TYPE(OpExp, FP64); |
Eric Kunze | e5e2676 | 2020-10-13 16:11:07 -0700 | [diff] [blame] | 468 | |
James Ward | 8b39043 | 2022-08-12 20:48:56 +0100 | [diff] [blame] | 469 | DEF_INSTANTIATE_RANK0_6_ONE_RANK_ONE_TYPE(OpFloor, FP16); |
James Ward | 24dbc42 | 2022-10-19 12:20:31 +0100 | [diff] [blame] | 470 | DEF_INSTANTIATE_RANK0_6_ONE_RANK_ONE_TYPE(OpFloor, BF16); |
Jeremy Johnson | bc2a3db | 2022-09-27 13:50:00 +0100 | [diff] [blame] | 471 | DEF_INSTANTIATE_RANK0_6_ONE_RANK_ONE_TYPE(OpFloor, FP32); |
Tai Ly | a4d748b | 2023-03-28 22:06:56 +0000 | [diff] [blame] | 472 | DEF_INSTANTIATE_RANK0_6_ONE_RANK_ONE_TYPE(OpFloor, FP64); |
Eric Kunze | e5e2676 | 2020-10-13 16:11:07 -0700 | [diff] [blame] | 473 | |
James Ward | 8b39043 | 2022-08-12 20:48:56 +0100 | [diff] [blame] | 474 | DEF_INSTANTIATE_RANK0_6_ONE_RANK_ONE_TYPE(OpLog, FP16); |
James Ward | 24dbc42 | 2022-10-19 12:20:31 +0100 | [diff] [blame] | 475 | DEF_INSTANTIATE_RANK0_6_ONE_RANK_ONE_TYPE(OpLog, BF16); |
Jeremy Johnson | bc2a3db | 2022-09-27 13:50:00 +0100 | [diff] [blame] | 476 | DEF_INSTANTIATE_RANK0_6_ONE_RANK_ONE_TYPE(OpLog, FP32); |
Tai Ly | a4d748b | 2023-03-28 22:06:56 +0000 | [diff] [blame] | 477 | DEF_INSTANTIATE_RANK0_6_ONE_RANK_ONE_TYPE(OpLog, FP64); |
Eric Kunze | e5e2676 | 2020-10-13 16:11:07 -0700 | [diff] [blame] | 478 | |
| 479 | DEF_INSTANTIATE_RANK0_6_ONE_RANK_ONE_TYPE(OpLogicalNot, BOOL); |
| 480 | |
James Ward | 8b39043 | 2022-08-12 20:48:56 +0100 | [diff] [blame] | 481 | DEF_INSTANTIATE_RANK0_6_ONE_RANK_ONE_TYPE(OpNegate, FP16); |
James Ward | 24dbc42 | 2022-10-19 12:20:31 +0100 | [diff] [blame] | 482 | DEF_INSTANTIATE_RANK0_6_ONE_RANK_ONE_TYPE(OpNegate, BF16); |
Jeremy Johnson | bc2a3db | 2022-09-27 13:50:00 +0100 | [diff] [blame] | 483 | DEF_INSTANTIATE_RANK0_6_ONE_RANK_ONE_TYPE(OpNegate, FP32); |
Kevin Cheng | 3a47857 | 2021-01-22 17:21:02 -0800 | [diff] [blame] | 484 | DEF_INSTANTIATE_RANK0_6_ONE_RANK_ONE_TYPE(OpNegate, INT8); |
Eric Kunze | e5e2676 | 2020-10-13 16:11:07 -0700 | [diff] [blame] | 485 | DEF_INSTANTIATE_RANK0_6_ONE_RANK_ONE_TYPE(OpNegate, INT16); |
| 486 | DEF_INSTANTIATE_RANK0_6_ONE_RANK_ONE_TYPE(OpNegate, INT32); |
Tai Ly | a4d748b | 2023-03-28 22:06:56 +0000 | [diff] [blame] | 487 | DEF_INSTANTIATE_RANK0_6_ONE_RANK_ONE_TYPE(OpNegate, FP64); |
Eric Kunze | e5e2676 | 2020-10-13 16:11:07 -0700 | [diff] [blame] | 488 | |
James Ward | 8b39043 | 2022-08-12 20:48:56 +0100 | [diff] [blame] | 489 | DEF_INSTANTIATE_RANK0_6_ONE_RANK_ONE_TYPE(OpRsqrt, FP16); |
James Ward | 24dbc42 | 2022-10-19 12:20:31 +0100 | [diff] [blame] | 490 | DEF_INSTANTIATE_RANK0_6_ONE_RANK_ONE_TYPE(OpRsqrt, BF16); |
Jeremy Johnson | bc2a3db | 2022-09-27 13:50:00 +0100 | [diff] [blame] | 491 | DEF_INSTANTIATE_RANK0_6_ONE_RANK_ONE_TYPE(OpRsqrt, FP32); |
Tai Ly | a4d748b | 2023-03-28 22:06:56 +0000 | [diff] [blame] | 492 | DEF_INSTANTIATE_RANK0_6_ONE_RANK_ONE_TYPE(OpRsqrt, FP64); |
Eric Kunze | e5e2676 | 2020-10-13 16:11:07 -0700 | [diff] [blame] | 493 | |
Jerry Ge | 51bd4f5 | 2024-02-20 11:21:19 -0800 | [diff] [blame] | 494 | DEF_INSTANTIATE_RANK0_6_ONE_RANK_ONE_TYPE(OpSin, FP16); |
| 495 | DEF_INSTANTIATE_RANK0_6_ONE_RANK_ONE_TYPE(OpSin, BF16); |
| 496 | DEF_INSTANTIATE_RANK0_6_ONE_RANK_ONE_TYPE(OpSin, FP32); |
| 497 | DEF_INSTANTIATE_RANK0_6_ONE_RANK_ONE_TYPE(OpSin, FP64); |
| 498 | |
James Ward | 8b39043 | 2022-08-12 20:48:56 +0100 | [diff] [blame] | 499 | DEF_INSTANTIATE_RANK0_6_ONE_RANK_ONE_TYPE(OpReciprocal, FP16); |
James Ward | 24dbc42 | 2022-10-19 12:20:31 +0100 | [diff] [blame] | 500 | DEF_INSTANTIATE_RANK0_6_ONE_RANK_ONE_TYPE(OpReciprocal, BF16); |
Jeremy Johnson | bc2a3db | 2022-09-27 13:50:00 +0100 | [diff] [blame] | 501 | DEF_INSTANTIATE_RANK0_6_ONE_RANK_ONE_TYPE(OpReciprocal, FP32); |
Tai Ly | a4d748b | 2023-03-28 22:06:56 +0000 | [diff] [blame] | 502 | DEF_INSTANTIATE_RANK0_6_ONE_RANK_ONE_TYPE(OpReciprocal, FP64); |