blob: f01a66901eb30508b9002bf3e6c3a83dff6821a3 [file] [log] [blame]
Jonas Ohlsson45e653d2021-07-26 16:13:12 +02001# Copyright (C) 2020-2021 Arm Limited or its affiliates. All rights reserved.
2#
3# SPDX-License-Identifier: Apache-2.0
4#
5# Licensed under the Apache License, Version 2.0 (the License); you may
6# not use this file except in compliance with the License.
7# You may obtain a copy of the License at
8#
9# www.apache.org/licenses/LICENSE-2.0
10#
11# Unless required by applicable law or agreed to in writing, software
12# distributed under the License is distributed on an AS IS BASIS, WITHOUT
13# WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
14# See the License for the specific language governing permissions and
15# limitations under the License.
16# Description:
17# The TFLiteSupportedOperators class which is a collection of all TFLite supported operators and parameter checks.
18from collections import defaultdict
19
20import numpy as np
21
22from .data_type import DataType
23from .operation import Op
24from .operation import Padding
25from .supported_operators_util import docstring_format_args
26from .supported_operators_util import list_formatter
27from .tensor import check_quantized_tens_scaling_equal
28from .tflite_mapping import BUILTIN_OPERATOR_UNKNOWN
29from .tflite_mapping import optype_to_builtintype
30
31
32def _optype_formatter(op_list):
33 # Convert internal op types to external names
34 output = map(optype_to_builtintype, op_list)
35 # Remove UNKNOWNs
36 output = (x for x in output if x is not BUILTIN_OPERATOR_UNKNOWN)
37 return list_formatter(output)
38
39
40class TFLiteSupportedOperators:
41 # Categorised lists of supported operators
Fredrik Svedberg11563172022-07-06 14:54:12 +020042 npu_pre_ops = set(
43 (
44 Op.SplitSliceRead,
45 Op.Shape,
46 )
47 )
Jonas Ohlssond8575072022-03-30 10:30:25 +020048 convolution_ops = set(
49 (
50 Op.Conv2DBias,
51 Op.Conv2D,
52 Op.QuantizedConv2D,
53 )
54 )
Jonas Ohlsson45e653d2021-07-26 16:13:12 +020055 depthwise_convolution_ops = set((Op.DepthwiseConv2DBias,))
56 transpose_convolution_ops = set((Op.Conv2DBackpropInput,))
57 convolution_like_ops = convolution_ops | depthwise_convolution_ops | transpose_convolution_ops
58 max_pooling_ops = Op.op_set(Op.is_maxpool_op)
59 avg_pooling_ops = Op.op_set(Op.is_avgpool_op)
60 pooling_ops = set((Op.ReduceSum,)) | max_pooling_ops | avg_pooling_ops
Tim Hall885033b2022-07-21 11:46:03 +010061 resizing_ops = Op.op_set(Op.is_resize_op)
Jonas Ohlssond8575072022-03-30 10:30:25 +020062 fc_vector_products = set(
63 (
64 Op.QuantizedMatMul,
65 Op.MatMul,
66 Op.FullyConnected,
67 )
68 )
Jonas Ohlsson45e653d2021-07-26 16:13:12 +020069 mac_main_ops = (
70 # RNN/LSTM/GRU
71 set((Op.BlockLSTM,))
72 # conv/depthwiseconv/transposeconv
73 | convolution_like_ops
74 # pooling
75 | pooling_ops
76 # resizing/upscaling
77 | resizing_ops
78 # FC layers
79 | fc_vector_products
80 # Mean (converts to depthwise conv)
81 | set((Op.Mean,))
82 )
83 unary_elem_wise_main_ops = Op.op_set(Op.is_unary_elementwise_op)
Jonas Ohlssond8575072022-03-30 10:30:25 +020084 binary_elem_wise_min_max_ops = set(
85 (
86 Op.Minimum,
87 Op.Maximum,
88 )
89 )
90 binary_elem_wise_shift_ops = set(
91 (
92 Op.SHL,
93 Op.SHR,
94 )
95 )
96 binary_elem_wise_add_mul_sub = set(
97 (
98 Op.Add,
99 Op.Mul,
100 Op.Sub,
101 )
102 )
Jonas Ohlsson45e653d2021-07-26 16:13:12 +0200103 binary_elem_wise_main_ops = binary_elem_wise_min_max_ops | binary_elem_wise_add_mul_sub | binary_elem_wise_shift_ops
104 elem_wise_main_ops = binary_elem_wise_main_ops | unary_elem_wise_main_ops
105 pad_ops = set((Op.Pad,))
106 supported_int32_tensor_ops = (
Jonas Ohlssond8575072022-03-30 10:30:25 +0200107 set(
108 (
109 Op.ReduceSum,
110 Op.CLZ,
Fredrik Svedberg11563172022-07-06 14:54:12 +0200111 Op.Shape,
Jonas Ohlssond8575072022-03-30 10:30:25 +0200112 )
113 )
114 | binary_elem_wise_add_mul_sub
115 | binary_elem_wise_shift_ops
Jonas Ohlsson45e653d2021-07-26 16:13:12 +0200116 )
117
Jonas Ohlssond8575072022-03-30 10:30:25 +0200118 relu_ops = set(
119 (
120 Op.Relu,
121 Op.Relu6,
122 Op.ReluN1To1,
123 Op.Clip,
124 )
125 )
Fredrik Svedberg8ddd4892022-08-19 16:06:04 +0200126 activation_ops = relu_ops | set(
127 (
128 Op.Tanh,
129 Op.Sigmoid,
130 Op.Softmax,
131 Op.HardSwish,
132 Op.Prelu,
133 )
134 )
Jonas Ohlsson45e653d2021-07-26 16:13:12 +0200135 npu_post_ops = (
136 # activation functions
137 activation_ops
138 # concatenation write direction
139 | set((Op.ConcatSliceWrite,))
140 # Quantization
141 | set((Op.Quantize,))
142 )
Jonas Ohlssond8575072022-03-30 10:30:25 +0200143 split_ops = set(
144 (
145 Op.Split,
146 Op.SplitV,
147 Op.StridedSlice,
148 Op.Slice,
149 Op.UnpackReshaped,
150 Op.Unpack,
151 )
152 )
153 concat_ops = set(
154 (
155 Op.Concat,
156 Op.ConcatTFLite,
157 Op.PackReshaped,
158 Op.Pack,
159 )
160 )
161 memory_only_ops = (
162 set(
163 (
164 Op.Reshape,
165 Op.QuantizedReshape,
166 Op.Squeeze,
167 Op.ExpandDims,
168 )
169 )
170 | concat_ops
171 | split_ops
172 )
Jonas Ohlsson45e653d2021-07-26 16:13:12 +0200173 per_axis_quant_ops = convolution_like_ops # per-axis/channel quantization only currently supported for conv ops
Jonas Ohlssond8575072022-03-30 10:30:25 +0200174 supported_fused_activations = relu_ops | set(
175 (
176 Op.Tanh,
177 Op.Sigmoid,
178 Op.LUT,
179 )
180 )
Jonas Ohlsson45e653d2021-07-26 16:13:12 +0200181 supported_operators = npu_pre_ops | mac_main_ops | elem_wise_main_ops | pad_ops | npu_post_ops | memory_only_ops
182 # Supported data types
183 supported_op_dtypes = set((DataType.uint8, DataType.int8, DataType.int16, DataType.int32))
184 supported_faf_dtypes = set((DataType.uint8, DataType.int8, DataType.int16))
185 supported_bias_dtypes = set((DataType.int32, DataType.int64))
186 supported_pad_dtypes = set((DataType.int32, DataType.int64))
187 # Defined ranges for allowed values:
188 tens_dim_range = (1, 65535)
189 stride_range = (1, 3)
190 dilation_range = (1, 2)
191 dilated_height_range = (1, 64)
192 dilated_product_range = (1, 64 * 64)
193 weights_limit = 127 * 65536
194 filter_range = (1, 8)
195 filter_height_range = (1, 256)
196 filter_product_range = (1, 256 * 256)
197 mean_kernel_product = 64 * 64
198 mean_kernel_product_int8 = 16 * 16
199 mean_kernel_product_avgpool = 256 * 256
200
201 def __init__(self):
202 # Setup the generic constraints. Note: the order matters
203 self.generic_constraints = []
204 self.generic_constraints.append(TFLiteSupportedOperators.constraint_tens_dtype)
205 self.generic_constraints.append(TFLiteSupportedOperators.constraint_tens_int32_ops)
206 self.generic_constraints.append(TFLiteSupportedOperators.constraint_tens_dimension)
207 self.generic_constraints.append(TFLiteSupportedOperators.constraint_tens_quant_per_axis)
208 self.generic_constraints.append(TFLiteSupportedOperators.constraint_faf)
209 self.generic_constraints.append(TFLiteSupportedOperators.constraint_faf_type)
210
211 # Setup specific constraints. Note: the order matters
212 self.specific_constraints = defaultdict(list)
213
214 # Conv-like checks:
215 for op_type in TFLiteSupportedOperators.convolution_like_ops:
216 self.specific_constraints[op_type].append(TFLiteSupportedOperators.constraint_stride_range)
217 self.specific_constraints[op_type].append(TFLiteSupportedOperators.constraint_dilation_range)
218 self.specific_constraints[op_type].append(TFLiteSupportedOperators.constraint_dilated_height_range)
219 self.specific_constraints[op_type].append(TFLiteSupportedOperators.constraint_dilated_product_range)
220 self.specific_constraints[op_type].append(TFLiteSupportedOperators.constraint_weights_type)
221 self.specific_constraints[op_type].append(TFLiteSupportedOperators.constraint_weights_const)
222 self.specific_constraints[op_type].append(TFLiteSupportedOperators.constraint_weights_limit)
223 self.specific_constraints[op_type].append(TFLiteSupportedOperators.constraint_bias_type)
224 self.specific_constraints[op_type].append(TFLiteSupportedOperators.constraint_bias_40bit)
225 self.specific_constraints[op_type].append(TFLiteSupportedOperators.constraint_batch_size)
226 # Depthwise Conv specific checks:
227 for op_type in TFLiteSupportedOperators.depthwise_convolution_ops:
228 self.specific_constraints[op_type].append(TFLiteSupportedOperators.constraint_depth_multiplier)
229 # Transpose Conv specific checks:
230 for op_type in TFLiteSupportedOperators.transpose_convolution_ops:
231 self.specific_constraints[op_type].append(TFLiteSupportedOperators.constraint_tconv_stride)
232 self.specific_constraints[op_type].append(TFLiteSupportedOperators.constraint_tconv_same)
233 self.specific_constraints[op_type].append(TFLiteSupportedOperators.constraint_tconv_valid)
234
235 # Pooling checks:
236 for op_type in TFLiteSupportedOperators.pooling_ops:
237 self.specific_constraints[op_type].append(TFLiteSupportedOperators.constraint_batch_size)
238 self.specific_constraints[op_type].append(TFLiteSupportedOperators.constraint_stride_range)
239 # AVG pooling specific checks:
240 for op_type in TFLiteSupportedOperators.avg_pooling_ops:
241 self.specific_constraints[op_type].append(TFLiteSupportedOperators.constraint_filter_range)
242 self.specific_constraints[op_type].append(TFLiteSupportedOperators.constraint_filter_height_range_valid_pad)
243 self.specific_constraints[op_type].append(
244 TFLiteSupportedOperators.constraint_filter_product_range_valid_pad
245 )
246 # MAX pooling specific checks:
247 for op_type in TFLiteSupportedOperators.max_pooling_ops:
248 self.specific_constraints[op_type].append(TFLiteSupportedOperators.constraint_filter_height_range)
249 self.specific_constraints[op_type].append(TFLiteSupportedOperators.constraint_filter_product_range)
250
251 # Resizing specific checks:
252 for op_type in TFLiteSupportedOperators.resizing_ops:
Tim Hall885033b2022-07-21 11:46:03 +0100253 self.specific_constraints[op_type].append(TFLiteSupportedOperators.constraint_resize)
254 self.specific_constraints[op_type].append(TFLiteSupportedOperators.constraint_resize_size)
255 self.specific_constraints[op_type].append(TFLiteSupportedOperators.constraint_resize_attrs)
256 self.specific_constraints[op_type].append(TFLiteSupportedOperators.constraint_resize_half_pixel_centers)
Jonas Ohlsson45e653d2021-07-26 16:13:12 +0200257
258 # Vector Product specific checks:
259 for op_type in TFLiteSupportedOperators.fc_vector_products:
260 self.specific_constraints[op_type].append(TFLiteSupportedOperators.constraint_weights_type)
261 self.specific_constraints[op_type].append(TFLiteSupportedOperators.constraint_weights_const)
262 self.specific_constraints[op_type].append(TFLiteSupportedOperators.constraint_bias_type)
263 self.specific_constraints[op_type].append(TFLiteSupportedOperators.constraint_bias_40bit)
264
265 # Element-wise checks:
266 for op_type in TFLiteSupportedOperators.elem_wise_main_ops:
267 self.specific_constraints[op_type].append(TFLiteSupportedOperators.constraint_elemwise_batch_size)
268 # Binary Min/Max specific checks:
269 for op_type in TFLiteSupportedOperators.binary_elem_wise_min_max_ops:
270 self.specific_constraints[op_type].append(
271 TFLiteSupportedOperators.constraint_matching_quantization_parameters
272 )
273 self.specific_constraints[op_type].append(TFLiteSupportedOperators.constraint_broadcast_shapes)
274 # Binary Add/Mul/Sub specific checks:
275 for op_type in TFLiteSupportedOperators.binary_elem_wise_add_mul_sub:
276 self.specific_constraints[op_type].append(TFLiteSupportedOperators.constraint_broadcast_shapes)
277 # Binary Shift specific checks:
278 for op_type in TFLiteSupportedOperators.binary_elem_wise_shift_ops:
279 self.specific_constraints[op_type].append(TFLiteSupportedOperators.constraint_inputs_int32)
280 self.specific_constraints[op_type].append(TFLiteSupportedOperators.constraint_broadcast_shapes)
281
282 # SHL specific checks:
283 self.specific_constraints[Op.SHL].append(TFLiteSupportedOperators.constraint_output_int32)
284
285 # CLZ specific checks:
286 self.specific_constraints[Op.CLZ].append(TFLiteSupportedOperators.constraint_output_int32)
287
288 # StridedSlice specific checks:
289 self.specific_constraints[Op.StridedSlice].append(
290 TFLiteSupportedOperators.constraint_stridedslice_stride_values
291 )
292
293 # Pad specific checks:
294 self.specific_constraints[Op.Pad].append(TFLiteSupportedOperators.constraint_pad_shape)
295 self.specific_constraints[Op.Pad].append(TFLiteSupportedOperators.constraint_padding_dimensions)
296 self.specific_constraints[Op.Pad].append(TFLiteSupportedOperators.constraint_pad_type)
297
298 # Mean specific checks:
Dwight Lidmanf54c18d2021-09-29 17:23:03 +0200299 self.specific_constraints[Op.Mean].append(TFLiteSupportedOperators.constraint_batch_size)
Jonas Ohlsson45e653d2021-07-26 16:13:12 +0200300 self.specific_constraints[Op.Mean].append(TFLiteSupportedOperators.constraint_mean_height_width_product_avgpool)
301 self.specific_constraints[Op.Mean].append(TFLiteSupportedOperators.constraint_mean_height_width_product)
302 self.specific_constraints[Op.Mean].append(TFLiteSupportedOperators.constraint_mean_height_width_product_int8)
James Peet0bb7ad12022-02-15 15:07:54 +0000303 self.specific_constraints[Op.Mean].append(TFLiteSupportedOperators.constraint_mean_height_single_axis)
Jonas Ohlsson45e653d2021-07-26 16:13:12 +0200304
Tim Hall3584a9c2021-11-18 22:05:17 +0000305 # Reshape specific checks:
306 self.specific_constraints[Op.Reshape].append(TFLiteSupportedOperators.constraint_reshape_shape_constant)
Johan Alfvén17009392022-08-30 09:14:56 +0200307 self.specific_constraints[Op.Reshape].append(TFLiteSupportedOperators.constraint_reshape_before_mean)
Tim Hall3584a9c2021-11-18 22:05:17 +0000308
Johan Alfvén8e1352a2022-08-16 13:04:17 +0200309 # Concat specific checks:
310 for op_type in (Op.Concat, Op.ConcatTFLite):
311 self.specific_constraints[op_type].append(
312 TFLiteSupportedOperators.constraint_concat_valid_dimensions_non_axis
313 )
314 self.specific_constraints[op_type].append(TFLiteSupportedOperators.constraint_concat_valid_dimensions_axis)
315
Jonas Ohlsson45e653d2021-07-26 16:13:12 +0200316 def is_operator_supported(self, op):
317 ext_type = optype_to_builtintype(op.type)
318 if op.type not in TFLiteSupportedOperators.supported_operators:
319 if op.type not in (Op.Placeholder, Op.SubgraphInput, Op.Const):
320 print(f"Info: {ext_type} '{op.name}' is a CPU only op")
321 return False
322
323 for constraint in self.generic_constraints + self.specific_constraints[op.type]:
324 valid, extra = constraint(op)
325 if not valid:
326 print(f"Warning: {ext_type} '{op.name}' is not supported on the NPU. Placing on CPU instead")
327 print(f" - {constraint.__doc__}")
328 if extra:
329 print(f" {extra}")
330 return False
331
332 return True
333
334 @classmethod
335 @docstring_format_args([list_formatter(supported_op_dtypes)])
336 def constraint_tens_dtype(cls, op):
337 "Tensors must be of type: {}"
338 valid = True
339 extra = []
340 tensors = [tens for tens in op.get_ifm_ifm2_weights_ofm() if tens]
341 if not tensors:
342 tensors = [tens for tens in op.inputs if tens]
343 for tens in tensors:
344 if tens.dtype not in cls.supported_op_dtypes:
345 valid = False
346 extra.append(f"Tensor '{tens.name}' has data type: {tens.dtype}")
347 return valid, ", ".join(extra)
348
349 @classmethod
350 @docstring_format_args([_optype_formatter(supported_int32_tensor_ops)])
351 def constraint_tens_int32_ops(cls, op):
352 "Tensors which are int32 are only valid when op type is: {}"
353 valid = True
354 extra = []
355 tensors = [tens for tens in op.get_ifm_ifm2_weights_ofm() if tens]
356 if not tensors:
357 tensors = [tens for tens in op.inputs if tens]
358 for tens in tensors:
359 if (tens.dtype == DataType.int32) and (op.type not in cls.supported_int32_tensor_ops):
360 valid = False
361 extra.append(tens.name)
362 extra = ", ".join(extra)
363 return valid, f"Op has int32 tensor(s): {extra}"
364
365 @classmethod
366 @docstring_format_args(tens_dim_range)
367 def constraint_tens_dimension(cls, op):
368 "Tensor dimensions must be in the range [{}, {}]"
369 tens_min, tens_max = cls.tens_dim_range
370 valid = True
371 extra = []
372 tensors = [tens for tens in op.get_ifm_ifm2_weights_ofm() if tens]
373 if not tensors:
374 tensors = [tens for tens in op.inputs if tens]
375 for tens in tensors:
376 if not all(tens_min <= dim <= tens_max for dim in tens.shape):
377 valid = False
378 extra.append(f"Tensor '{tens.name}' has shape: {tens.shape}")
379 return valid, ", ".join(extra)
380
381 @classmethod
382 @docstring_format_args([_optype_formatter(per_axis_quant_ops)])
383 def constraint_tens_quant_per_axis(cls, op):
384 "Per-axis quantization is only supported for the following op types: {}"
385 valid = True
386 extra = []
387 if op.type not in cls.per_axis_quant_ops:
388 tensors = [tens for tens in op.get_ifm_ifm2_weights_ofm() if tens]
389 for tens in tensors:
Fredrik Svedberg11563172022-07-06 14:54:12 +0200390 if tens.quantization and tens.quantization.is_per_axis():
Jonas Ohlsson45e653d2021-07-26 16:13:12 +0200391 valid = False
392 extra.append(tens.name)
393 return valid, "The following tensor(s) have per-axis quantization parameters: " + ", ".join(extra)
394
395 @classmethod
396 @docstring_format_args([_optype_formatter(supported_fused_activations)])
397 def constraint_faf(cls, op):
398 "The fused activation function (if present) must be one of type: {}"
399 if op.activation is None:
400 res = True, "Op has no fused activation function"
401 else:
402 faf = op.activation.op_type
403 valid = faf in cls.supported_fused_activations
404 res = valid, f"Op has its fused activation function as: {faf}"
405 return res
406
407 @classmethod
408 @docstring_format_args([list_formatter(supported_faf_dtypes)])
409 def constraint_faf_type(cls, op):
410 "If a fused activation function is present, the Output tensor must be one of type: {}"
411 if op.activation is None:
412 res = True, "Op has no fused activation function"
413 else:
414 valid = op.ofm.dtype in cls.supported_faf_dtypes
415 ext_type = optype_to_builtintype(op.activation.op_type)
416 res = valid, f"Op has fused activation function {ext_type}, and Output tensor data type: {op.ofm.dtype}"
417 return res
418
419 @classmethod
420 @docstring_format_args(stride_range)
421 def constraint_stride_range(cls, op):
422 "Stride values for both width and height must be in the range [{}, {}]"
423 w, h = op.get_kernel_stride()
424 stride_min, stride_max = cls.stride_range
425 valid = (stride_min <= w <= stride_max) and (stride_min <= h <= stride_max)
426 return valid, f"Op has stride WxH as: {w}x{h}"
427
428 @classmethod
429 @docstring_format_args(dilation_range)
430 def constraint_dilation_range(cls, op):
431 "Dilation factor values for both width and height must be in the range [{}, {}]"
432 w, h = op.get_kernel_dilation()
433 dilation_min, dilation_max = cls.dilation_range
434 valid = (dilation_min <= w <= dilation_max) and (dilation_min <= h <= dilation_max)
435 return valid, f"Op has dilation factor WxH as: {w}x{h}"
436
437 @classmethod
438 @docstring_format_args(dilated_height_range)
439 def constraint_dilated_height_range(cls, op):
440 "Dilated kernel height must be in the range [{}, {}]"
441 h = op.kernel.area_height()
442 dilated_height_min, dilated_height_max = cls.dilated_height_range
443 valid = dilated_height_min <= h <= dilated_height_max
444 return valid, f"Op has dilated kernel height as: {h}"
445
446 @classmethod
447 @docstring_format_args(dilated_product_range)
448 def constraint_dilated_product_range(cls, op):
449 "Product of dilated kernel width and height must be in the range [{}, {}]"
450 product = op.kernel.area_width() * op.kernel.area_height()
451 dilated_product_min, dilated_product_max = cls.dilated_product_range
452 valid = dilated_product_min <= product <= dilated_product_max
453 return valid, f"Op has product of dilated kernel width and height as: {product}"
454
455 @staticmethod
456 def constraint_weights_type(op):
457 "Weight tensor must be 8-bit"
458 weights = op.weights
459 valid = weights.element_size() == 1
460 return valid, f"Tensor '{weights.name}' is {int(weights.element_size() * 8)}-bit"
461
462 @staticmethod
463 def constraint_weights_const(op):
464 "Weight tensor must be constant"
465 weights = op.weights
466 valid = weights.values is not None
467 return valid, f"Tensor '{weights.name}' has non-constant values"
468
469 @classmethod
470 @docstring_format_args([weights_limit])
471 def constraint_weights_limit(cls, op):
472 "The sum of the weights cannot exceed {}"
473 weights = op.weights
474 values = weights.values.astype(np.int64) - weights.quantization.zero_point
475 limit = np.amax(np.sum(np.absolute(values), axis=(0, 1, 2)))
476 valid = limit <= cls.weights_limit
477 return valid, f"Tensor '{weights.name}' has the sum of weights: {limit}"
478
479 @classmethod
480 @docstring_format_args([list_formatter(supported_bias_dtypes)])
481 def constraint_bias_type(cls, op):
482 "Optional Bias tensor must be of type: {}"
483 bias = op.bias
484 if bias:
485 valid = bias.dtype in cls.supported_bias_dtypes
486 return valid, f"Tensor '{bias.name}' has data type: {bias.dtype}"
487 return True, "Op has no bias tensor"
488
489 @staticmethod
490 def constraint_bias_40bit(op):
491 "Optional Bias tensor values must fit within 40-bits"
492 bias = op.bias
493 if bias and bias.dtype == DataType.int64 and bias.values is not None:
Tim Hall8ae29292021-07-28 16:52:03 +0100494 valid = all(len(bin(value)[2:]) <= 40 for value in bias.values)
Jonas Ohlsson45e653d2021-07-26 16:13:12 +0200495 return valid, f"Tensor '{bias.name}' has values larger than 40-bits"
496 return True, "Op has no bias tensor, or it fits in 40-bit"
497
498 @staticmethod
499 def constraint_batch_size(op):
500 "IFM Tensor batch size must be 1"
501 ifm = op.ifm
502 valid = ifm.shape[0] == 1
503 return valid, f"Tensor '{ifm.name}' has batch size: {ifm.shape[0]}"
504
505 @staticmethod
506 def constraint_depth_multiplier(op):
507 "For depth multipliers > 1, IFM channels must be 1 and OFM channels must be equal to the depth multiplier"
508 depth_multiplier = op.attrs.get("depth_multiplier", 1)
509 if depth_multiplier > 1:
510 ifm_channels = op.ifm.shape[3]
511 ofm_channels = op.ofm.shape[3]
512 valid = (ifm_channels == 1) and (ofm_channels == depth_multiplier)
513 extra = (
514 f"Op has ifm_channels={ifm_channels}, ofm_channels={ofm_channels}"
515 f" and depth_multiplier={depth_multiplier}"
516 )
517 return valid, extra
518 return True, "Op has depth_multiplier=1"
519
520 @staticmethod
521 def constraint_tconv_stride(op):
522 "Stride values for both width and height must be 2"
523 w = op.kernel.stride.x
524 h = op.kernel.stride.y
525 valid = (w == 2) and (h == 2)
526 return valid, f"Op has stride WxH as: {w}x{h}"
527
528 @staticmethod
529 def constraint_tconv_same(op):
530 "SAME padding: OFM dimensions must equal IFM dimensions multiplied by stride"
531 if op.attrs["padding"] == Padding.SAME:
532 w = op.kernel.stride.x
533 h = op.kernel.stride.y
534 ifm_shape = op.ifm.shape
535 ofm_shape = op.ofm.shape
536 valid = (ofm_shape[1] == (ifm_shape[1] * h)) and (ofm_shape[2] == (ifm_shape[2] * w))
537 return valid, f"Op has ifm_shape={ifm_shape}, ofm_shape={ofm_shape} and stride WxH as {w}x{h}"
538 return True, "Op has padding=VALID"
539
540 @staticmethod
541 def constraint_tconv_valid(op):
542 """VALID padding: OFM dimensions must equal IFM dimensions multiplied by stride,
Jonas Ohlssond8575072022-03-30 10:30:25 +0200543 minus difference between kernel size and stride"""
Jonas Ohlsson45e653d2021-07-26 16:13:12 +0200544 if op.attrs["padding"] == Padding.VALID:
545 s_w = op.kernel.stride.x
546 s_h = op.kernel.stride.y
547 k_w = op.kernel.width
548 k_h = op.kernel.height
549 ifm_shape = op.ifm.shape
550 ofm_shape = op.ofm.shape
551 height_check = ofm_shape[1] == (ifm_shape[1] * s_h + max(k_h - s_h, 0))
552 width_check = ofm_shape[2] == (ifm_shape[2] * s_w + max(k_w - s_w, 0))
553 valid = height_check and width_check
554 extra = (
555 f"Op has ifm_shape={ifm_shape}, ofm_shape={ofm_shape},"
556 f" stride WxH as {s_w}x{s_h} and kernel WxH as {k_w}x{k_h}"
557 )
558 return valid, extra
559 return True, "Op has padding=SAME"
560
561 @classmethod
562 @docstring_format_args(filter_range)
563 def constraint_filter_range(cls, op):
564 "Kernel filter values for both width and height must be in the range [{}, {}]"
565 if op.attrs["padding"] == Padding.SAME:
566 w = op.kernel.width
567 h = op.kernel.height
568 filter_min, filter_max = cls.filter_range
569 valid = (filter_min <= w <= filter_max) and (filter_min <= h <= filter_max)
570 return valid, f"Op has kernel filter WxH as: {w}x{h}"
571 return True, "Op has padding=VALID"
572
573 @classmethod
574 @docstring_format_args(filter_height_range)
575 def constraint_filter_height_range(cls, op):
576 "Kernel filter height must be in the range [{}, {}]"
577 h = op.kernel.height
578 filter_height_min, filter_height_max = cls.filter_height_range
579 valid = filter_height_min <= h <= filter_height_max
580 return valid, f"Op has kernel filter height as: {h}"
581
582 @classmethod
583 @docstring_format_args(filter_product_range)
584 def constraint_filter_product_range(cls, op):
585 "Product of kernel filter width and height must be in the range [{}, {}]"
586 product = op.kernel.elements_wh()
587 filter_product_min, filter_product_max = cls.filter_product_range
588 valid = filter_product_min <= product <= filter_product_max
589 return valid, f"Op has product of kernel filter width and height as: {product}"
590
591 @staticmethod
592 @docstring_format_args(filter_height_range)
593 def constraint_filter_height_range_valid_pad(op):
594 "VALID padding: Kernel filter height must be in the range [{}, {}]"
595 if op.attrs["padding"] == Padding.VALID:
596 return TFLiteSupportedOperators.constraint_filter_height_range(op)
597 return True, "Op has padding=SAME"
598
599 @staticmethod
600 @docstring_format_args(filter_product_range)
601 def constraint_filter_product_range_valid_pad(op):
602 "VALID padding: Product of kernel filter width and height must be in the range [{}, {}]"
603 if op.attrs["padding"] == Padding.VALID:
604 return TFLiteSupportedOperators.constraint_filter_product_range(op)
605 return True, "Op has padding=SAME"
606
607 @staticmethod
Tim Hall885033b2022-07-21 11:46:03 +0100608 def constraint_resize(op):
Jonas Ohlsson45e653d2021-07-26 16:13:12 +0200609 """The width and height of the IFM and OFM must match one of the following criteria:
610 IFM W and H must both be 1
611 IFM must match OFM
Tim Hall47c76362022-07-18 21:26:47 +0100612 OFM W and H must be equal and OFM W-1 and H-1 must be 2x/4x/8x IFM W-1 and H-1, if align_corners is True
613 OFM W and H must be equal and OFM W and H must be 2x/4x/8x IFM W and H, if align_corners is False"""
Jonas Ohlsson45e653d2021-07-26 16:13:12 +0200614 # Easier to start with False condition as very few cases result in a supported resize
615 valid = False
616 ifm_shape = op.ifm.shape
Tim Hall47c76362022-07-18 21:26:47 +0100617 ifm_shape_h = ifm_shape[1]
618 ifm_shape_w = ifm_shape[2]
Jonas Ohlsson45e653d2021-07-26 16:13:12 +0200619 ofm_shape = op.ofm.shape
Tim Hall47c76362022-07-18 21:26:47 +0100620 ofm_shape_h = ofm_shape[1]
621 ofm_shape_w = ofm_shape[2]
622
Jonas Ohlsson45e653d2021-07-26 16:13:12 +0200623 align_corners = op.attrs.get("align_corners", False)
624 if len(ifm_shape) == 4:
625 # Valid if IFM W and H are both 1, or IFM and OFM shape are the same
Tim Hall47c76362022-07-18 21:26:47 +0100626 if ((ifm_shape_h == 1) and (ifm_shape_w == 1)) or (ifm_shape == ofm_shape):
Jonas Ohlsson45e653d2021-07-26 16:13:12 +0200627 valid = True
628 else:
Rickard Boline546def2022-01-25 15:45:00 +0000629 # Valid if OFM is 2/4/8x IFM (-1 for align corners)
Tim Hall47c76362022-07-18 21:26:47 +0100630 if align_corners:
631 h_upscale_factor = (ofm_shape_h - 1) / (ifm_shape_h - 1)
632 w_upscale_factor = (ofm_shape_w - 1) / (ifm_shape_w - 1)
633 else:
634 h_upscale_factor = ofm_shape_h / ifm_shape_h
635 w_upscale_factor = ofm_shape_w / ifm_shape_w
Rickard Boline546def2022-01-25 15:45:00 +0000636
Tim Hall47c76362022-07-18 21:26:47 +0100637 # could use either height or width. save as int because it is more usable later in graph optimiser
638 op.attrs["upscale_factor"] = int(h_upscale_factor)
639 valid = h_upscale_factor == w_upscale_factor and h_upscale_factor in (2.0, 4.0, 8.0)
Rickard Boline546def2022-01-25 15:45:00 +0000640
Jonas Ohlsson45e653d2021-07-26 16:13:12 +0200641 return valid, f"Op has ifm_shape={ifm_shape}, ofm_shape={ofm_shape} and align_corners={align_corners}"
642
643 @staticmethod
Tim Hall885033b2022-07-21 11:46:03 +0100644 def constraint_resize_size(op):
Tim Hall47c76362022-07-18 21:26:47 +0100645 "The size tensor must match the output tensor shape"
646 valid = False
647 ofm_shape = op.ofm.shape
648 size_h, size_w = None, None
649 # check that the size tensor (the second input) exists, is not none, and has the correct values
650 if len(op.inputs) == 2 and op.inputs[1] is not None and len(op.inputs[1].values) == 2:
651 size_h, size_w = op.inputs[1].values
652 # check size and output size match
653 if size_h == ofm_shape[1] and size_w == ofm_shape[2]:
654 valid = True
655
656 return valid, f"Op has size={size_h}x{size_w} and ofm_shape={ofm_shape}."
657
658 @staticmethod
Tim Hall885033b2022-07-21 11:46:03 +0100659 def constraint_resize_attrs(op):
Tim Hall47c76362022-07-18 21:26:47 +0100660 "Both align_corners and half_pixel_centers can't be True"
661 valid = True
662 align_corners = op.attrs.get("align_corners", False)
663 half_pixel_centers = op.attrs.get("half_pixel_centers", False)
664
665 if align_corners and half_pixel_centers:
666 valid = False
667 return valid, "Op has both align_corners and half_pixel_centers set to True."
668
669 @staticmethod
Tim Hall885033b2022-07-21 11:46:03 +0100670 def constraint_resize_half_pixel_centers(op):
erik.andersson@arm.comba2555e2021-10-28 14:08:52 +0200671 "half_pixel_centers are not supported"
672 valid = True
Tim Hall47c76362022-07-18 21:26:47 +0100673 if op.attrs.get("half_pixel_centers", False):
erik.andersson@arm.comba2555e2021-10-28 14:08:52 +0200674 valid = False
675 return valid, f"Op has half_pixel_centers set to {not valid}."
676
677 @staticmethod
Jonas Ohlsson45e653d2021-07-26 16:13:12 +0200678 def constraint_pad_shape(op):
679 "The padding tensor must have the shape [3,2] or [4,2]"
680 valid = op.inputs[1].shape in ([3, 2], [4, 2])
681 return valid, f"The pad tensor has the shape: {op.inputs[1].shape}"
682
683 @classmethod
684 @docstring_format_args([list_formatter(supported_pad_dtypes)])
685 def constraint_pad_type(cls, op):
686 "Pad tensor must be of type: {}"
687 pad_tensor = op.inputs[1]
688 valid = pad_tensor.dtype in cls.supported_pad_dtypes
689 return valid, f"Tensor '{pad_tensor.name}' has data type: {pad_tensor.dtype}"
690
691 @staticmethod
692 def constraint_padding_dimensions(op):
693 "The pad tensor can only pad width and height"
694 pad_tensor = op.inputs[1].values
695
696 valid = sum(pad_tensor[-1, :]) == 0
697 if valid and len(pad_tensor) > 3:
698 valid = sum(pad_tensor[0, :]) == 0
699 return valid, f"First dimension padding: {pad_tensor[0,:]}, last dimension padding: {pad_tensor[-1,:]}"
700
701 @staticmethod
702 def constraint_stridedslice_stride_values(op):
703 "All Strides values must be 1"
704 strides = op.inputs[3]
705 valid = all(stride == 1 for stride in strides.values)
706 return valid, f"Op has strides values {strides.values}"
707
708 @staticmethod
709 def constraint_inputs_int32(op):
710 "Both Input data types must be int32"
711 ifm_dtype = op.ifm.dtype
712 ifm2_dtype = op.ifm2.dtype
713 valid = (ifm_dtype == DataType.int32) and (ifm2_dtype == DataType.int32)
714 return valid, f"Op has ifm_dtype={ifm_dtype} and ifm2_dtype={ifm2_dtype}"
715
716 @staticmethod
717 def constraint_output_int32(op):
718 "OFM must be int32"
719 ofm_dtype = op.ofm.dtype
720 valid = ofm_dtype == DataType.int32
721 return valid, f"Op has ofm_dtype={ofm_dtype}"
722
723 @staticmethod
724 def constraint_matching_quantization_parameters(op):
725 "Both Input quantization parameters must match OFM quantization parameters"
726 valid = True
727 extra = []
728 if not check_quantized_tens_scaling_equal(op.ofm, op.ifm):
729 valid = False
730 extra.append(op.ifm.name)
731 if op.ifm2 is not None and not check_quantized_tens_scaling_equal(op.ofm, op.ifm2):
732 valid = False
733 extra.append(op.ifm2.name)
734 extra = ", ".join(extra)
735 return valid, f"Op has tensors with different quantization parameters to the OFM '{op.ofm.name}': {extra}"
736
737 @staticmethod
738 def constraint_elemwise_batch_size(op):
739 "Batch size must be 1 for Input tensors with more than 2 dimensions"
740 valid = True
741 extra = []
742 for tens in (op.ifm, op.ifm2):
743 # Unary ops have ifm2 as None
744 if tens is not None:
745 if (len(tens.shape) > 2) and (tens.shape[0] != 1):
746 valid = False
747 extra.append(tens.name)
748 extra = ", ".join(extra)
749 return valid, f"Op has invalid input tensors: {extra}"
750
751 @staticmethod
752 def constraint_broadcast_shapes(op):
753 "Broadcasting is only allowed for rank indices with dimension 1, from either IFM1 or IFM2"
754 ifm_shape = op.ifm.shape
755 ifm2_shape = op.ifm2.shape if op.ifm2 else None
756 ofm_shape = op.ofm.shape
757 valid = True
758 if ifm_shape is not None and ifm2_shape is not None:
759 # align trailing dimensions
760 size = min(len(ifm_shape), len(ifm2_shape))
761 for i, i2, o in zip(ifm_shape[-size:], ifm2_shape[-size:], ofm_shape[-size:]):
762 mi = max(i, i2)
763 # Input dimensions should match or one should be of dimension 1
764 # Output dimension should match the largest input dimension, together
765 # with constraint_match_either_shapes ensures broadcast from only one input
766 if not (i == i2 or i == 1 or i2 == 1) or o != mi:
767 valid = False
768 break
769
770 return valid, f"Op has ifm_shape={ifm_shape} and ifm2_shape={ifm2_shape}"
771
772 @classmethod
773 @docstring_format_args([mean_kernel_product_avgpool])
774 def constraint_mean_height_width_product_avgpool(cls, op):
James Peet0bb7ad12022-02-15 15:07:54 +0000775 """Product of height and width must be no greater than {}"""
Jonas Ohlsson45e653d2021-07-26 16:13:12 +0200776 shape = op.inputs[0].shape
777 hi = 0 if len(shape) < 4 else 1
778 h, w = shape[hi : hi + 2]
779 max_prod = cls.mean_kernel_product_avgpool
780 return h * w <= max_prod, f"Product of height and width is {h * w}"
781
782 @classmethod
783 @docstring_format_args([mean_kernel_product])
784 def constraint_mean_height_width_product(cls, op):
James Peet0bb7ad12022-02-15 15:07:54 +0000785 """Product of height and width must be no greater than {} when:
786 IFM and OFM have different scale or zero point; or
787 'keep_dims' is True"""
Jonas Ohlsson45e653d2021-07-26 16:13:12 +0200788 ifmq, ofmq = op.ifm.quantization, op.ofm.quantization
789 keep_dims = op.attrs.get("keep_dims")
790 # doesn't apply, size is checked by constraint_mean_height_width_product_avgpool
791 if not keep_dims and ifmq.scale_f32 == ofmq.scale_f32 and ifmq.zero_point == ofmq.zero_point:
792 return True, ""
793 shape = op.inputs[0].shape
794 hi = 0 if len(shape) < 4 else 1
795 h, w = shape[hi : hi + 2]
796 max_prod = cls.mean_kernel_product
797 return h * w <= max_prod, f"Product of height and width is {h * w}"
798
Johan Alfvén17009392022-08-30 09:14:56 +0200799 @staticmethod
800 def constraint_mean_height_width_product_int8(op):
801 """Number of IFM height and width elements might cause accumulator saturation when;
James Peet0bb7ad12022-02-15 15:07:54 +0000802 The IFM shape has 4 dimensions; and
803 The axis indices specify reduction across 2 dimensions; and
804 The axis indices correspond to the width and height dimensions of the IFM; and
805 'keep_dims' is True; and
Jonas Ohlsson45e653d2021-07-26 16:13:12 +0200806 IFM datatype is int8"""
807 shape = op.ifm.shape
808 axis = int(op.inputs[1].values) if op.inputs[1].shape == [] else list(op.inputs[1].values)
809 # doesn't apply, size is checked by constraint_mean_height_width_product_avgpool
810 # and constraint_mean_height_width_product
811 if (
812 len(shape) != 4
813 or op.ifm.dtype != DataType.int8
814 or not op.attrs.get("keep_dims")
815 or axis not in ([1, 2], [2, 1])
816 ):
817 return True, ""
James Peet0bb7ad12022-02-15 15:07:54 +0000818 h = shape[-3]
819 w = shape[-2]
Johan Alfvén17009392022-08-30 09:14:56 +0200820
821 ifmq, ofmq = op.ifm.quantization, op.ofm.quantization
822
823 # Scale factor
824 real_scale = ifmq.scale_f32 / ofmq.scale_f32
825
826 # Min and max value
827 ifm_min_val = np.iinfo(np.int8).min - ifmq.zero_point
828 ifm_max_val = np.iinfo(np.int8).max - ifmq.zero_point
829
830 # Accumulator limits
831 min_acc_limit = np.iinfo(np.int16).min
832 max_acc_limit = np.iinfo(np.int16).max
833
834 # Theoretical max/min value that accumulator need to store
835 min_acc_sum = h * w * ifm_min_val * real_scale + ofmq.zero_point
836 max_acc_sum = h * w * ifm_max_val * real_scale + ofmq.zero_point
837
838 # Max product of heigth and width that will not saturate the accumulator
839 ifm_min_val = 1 if ifm_min_val == 0 else ifm_min_val
840 ifm_max_val = 1 if ifm_max_val == 0 else ifm_max_val
841 if max_acc_sum > abs(min_acc_sum):
842 max_hw = int((max_acc_limit - ofmq.zero_point) / real_scale / ifm_max_val)
843 else:
844 max_hw = int((min_acc_limit - ofmq.zero_point) / real_scale / ifm_min_val)
845
846 extra = []
847
848 extra.append(f" Possible accumulator range is ({min_acc_sum} - {max_acc_sum})\n")
849 extra.append(f" Maximum accumulator range is ({min_acc_limit} - {max_acc_limit})\n")
850 extra.append(
851 f" Based on the IFM and OFM quantization the IFM height and width must be no greater than {max_hw}"
852 )
853
854 extra = "".join(extra)
855
856 return (min_acc_sum >= min_acc_limit and max_acc_sum <= max_acc_limit, f"\n{extra}")
Tim Hall3584a9c2021-11-18 22:05:17 +0000857
Rickard Bolin7d7cb672021-12-07 09:09:14 +0000858 @classmethod
James Peet0bb7ad12022-02-15 15:07:54 +0000859 @docstring_format_args([filter_height_range[1], dilated_height_range[1]])
860 def constraint_mean_height_single_axis(cls, op):
861 """For single axis averages across the height dimension:
862 IFM height must be no greater than {} if the IFM and OFM scale and zero point match; otherwise
863 IFM height must be no greater than {} if the IFM and OFM scale or zero point do not match"""
Rickard Bolin7d7cb672021-12-07 09:09:14 +0000864 inp, axis = op.inputs
865 if axis.shape == [] or axis.shape[0] == 1: # single axis
866 axis = int(axis.values) if len(axis.shape) == 0 else int(axis.values[0])
867 else:
James Peet0bb7ad12022-02-15 15:07:54 +0000868 # Multiple axes
Rickard Bolin7d7cb672021-12-07 09:09:14 +0000869 return True, ""
870
Rickard Bolin7d7cb672021-12-07 09:09:14 +0000871 shape = inp.shape
James Peet0bb7ad12022-02-15 15:07:54 +0000872 if len(shape) < 3:
873 # No height dimension present in IFM
874 return True, ""
875 if axis != len(shape) - 3:
876 # Not averaging across the height dimension
877 return True, ""
Rickard Bolin7d7cb672021-12-07 09:09:14 +0000878
James Peet0bb7ad12022-02-15 15:07:54 +0000879 h = shape[axis]
Rickard Bolin7d7cb672021-12-07 09:09:14 +0000880 ifm, ofm = op.get_ifm_ofm()
James Peet0bb7ad12022-02-15 15:07:54 +0000881
Rickard Bolin7d7cb672021-12-07 09:09:14 +0000882 if check_quantized_tens_scaling_equal(ifm, ofm):
James Peet0bb7ad12022-02-15 15:07:54 +0000883 return h <= cls.filter_height_range[1], f"Height is {h}, IFM and OFM quantizations match"
Rickard Bolin7d7cb672021-12-07 09:09:14 +0000884 else:
James Peet0bb7ad12022-02-15 15:07:54 +0000885 return h <= cls.dilated_height_range[1], f"Height is {h}, IFM and OFM quantizations do not match"
Rickard Bolin7d7cb672021-12-07 09:09:14 +0000886
Tim Hall3584a9c2021-11-18 22:05:17 +0000887 @staticmethod
888 def constraint_reshape_shape_constant(op):
889 "Shape must be constant"
890 valid = True
891 extra = []
892
893 reshape_tens = op.inputs[1]
894 if reshape_tens is not None:
895 # constant inputs have either no driving operator or a const one
896 # create a list of non-constant inputs
897 if not (len(reshape_tens.ops) == 0 or reshape_tens.ops[0].type == Op.Const):
898 valid = False
899 extra.append(reshape_tens.name)
900 extra = ", ".join(extra)
901
902 return valid, f"Op has non-const input(s): {extra}"
Johan Alfvén8e1352a2022-08-16 13:04:17 +0200903
904 @staticmethod
Johan Alfvén17009392022-08-30 09:14:56 +0200905 def constraint_reshape_before_mean(op):
906 "Reshape on NPU not supported before MEAN operator"
907 for next_op in op.outputs[0].consumers():
908 if next_op is not None and next_op.type == Op.Mean:
909 return False, ""
910 return True, ""
911
912 @staticmethod
Johan Alfvén8e1352a2022-08-16 13:04:17 +0200913 def constraint_concat_valid_dimensions_non_axis(op):
914 """All Input dimensions must match OFM dimension in all axes except the one defined by the axis attribute"""
915 valid = True
916 extra = []
917 ofm_shape = op.ofm.shape
918 ofm_dim = len(ofm_shape)
919 axis = op.attrs["axis"]
920 axis += ofm_dim if axis < 0 else 0
921
922 tensors = [tens for tens in op.inputs if tens]
923 for tens in tensors:
924 if any(tens.shape[dim] != ofm_shape[dim] for dim in range(ofm_dim) if dim != axis):
925 valid = False
926 extra.append(f"Tensor '{tens.name}' has shape: {tens.shape}")
927
928 extra = ", ".join(extra)
929 return valid, f"Op has axis={axis}, ofm_shape={ofm_shape} and the list of mismatching inputs are: {extra}"
930
931 @staticmethod
932 def constraint_concat_valid_dimensions_axis(op):
933 """The size of the OFM axis must match the sum of all IFM axis defined by the axis attribute"""
934 valid = True
935 extra = []
936 ofm_shape = op.ofm.shape
937 ofm_dim = len(ofm_shape)
938 axis = op.attrs["axis"]
939 axis += ofm_dim if axis < 0 else 0
940
941 sum_ifm_axis = 0
942 tensors = [tens for tens in op.inputs if tens]
943 for tens in tensors:
944 sum_ifm_axis += tens.shape[axis]
945 extra.append(f"Tensor '{tens.name}' has shape: {tens.shape}")
946
947 valid = sum_ifm_axis == ofm_shape[axis]
948 extra = ", ".join(extra)
949 return valid, f"Op has axis={axis}, ofm_shape={ofm_shape} and the list of mismatching inputs are: {extra}"