# Copyright (C) 2020 Arm Limited or its affiliates. All rights reserved.
#
# SPDX-License-Identifier: Apache-2.0
#
# Licensed under the Apache License, Version 2.0 (the License); you may
# not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an AS IS BASIS, WITHOUT
# WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.


# Description:
# The SupportedOperators class which is a collection of all supported operators and parameter checks.

from .data_type import BaseType


class SupportedOperators:
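    """Collection of the operator types the NPU supports and the per-category parameter restriction checks."""
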
    def __init__(self):
        # Categorised lists of supported operators
        self.npu_pre_ops = set(("QuantizedResizeBilinear", "SplitSliceRead"))
        self.convolution_ops = set(("Conv2DBiasAct", "Conv2D", "QuantizedConv2D", "Conv2DBackpropInputSwitched"))
        self.depthwise_convolution_ops = set(
            ("DepthwiseConv2dBiasAct", "DepthwiseConv2dNative", "QuantizedDepthwiseConv2D")
        )
        self.max_pooling_ops = set(("QuantizedMaxPool", "MaxPool", "MaxPoolAct"))
        self.avg_pooling_ops = set(("QuantizedAvgPool", "AvgPool", "AvgPoolAct"))
        self.pooling_ops = self.max_pooling_ops | self.avg_pooling_ops
        self.fc_vector_products = set(("QuantizedMatMul", "MatMul", "FullyConnectedAct"))
        self.mac_main_ops = (
            # convolutions
            self.convolution_ops
            # depth-wise convolutions
            | self.depthwise_convolution_ops
            # pooling
            | self.pooling_ops
            # FC layers
            | self.fc_vector_products
            # RNN/LSTM/GRU
            | set(("BlockLSTM",))
        )
        self.unary_elem_wise_main_ops = set(("LeakyRelu", "Abs"))
        self.binary_elem_wise_main_ops = set(
            (
                # binary element-wise
                "AddAct",
                "MulAct",
                "SubAct",
                "QuantizedAdd",
                "QuantizedSub",
                "QuantizedMul",
                "Mul",
                "Add",
                "Sub",
                "Minimum",
                "Maximum",
            )
        )
        self.elem_wise_main_ops = self.binary_elem_wise_main_ops | self.unary_elem_wise_main_ops
        self.activation_ops = set(
            ("QuantizedRelu", "QuantizedRelu1", "QuantizedRelu6", "Relu", "Relu6", "ReluN1To1", "Sigmoid", "Tanh")
        )
        self.npu_post_ops = (
            # activation functions
            self.activation_ops
            # concatenation write direction
            | set(("ConcatSliceWrite",))
            # bias add and batch norm
            | set(("QuantizedBiasAdd", "Requantize", "QuantizedBatchNorm", "BiasAdd", "FusedBatchNorm"))
        )
        self.split_ops = set(("Split", "StridedSlice", "Slice", "UnpackReshaped", "Unpack"))
        self.concat_ops = set(("Concat", "ConcatV2", "QuantizedConcat", "ConcatTFLite", "PackReshaped", "Pack"))
        self.memory_only_ops = (
            set(("Squeeze", "Reshape", "QuantizedReshape", "ExpandDims")) | self.concat_ops | self.split_ops
        )
        self.supported_fused_activations = set(("Relu", "Relu6", "ReluN1To1", "Tanh", "Sigmoid"))
        self.supported_operators = (
            self.npu_pre_ops | self.mac_main_ops | self.elem_wise_main_ops | self.npu_post_ops | self.memory_only_ops
        )
        # Set up supported operator restriction checkers
        self.supported_operator_restrictions = {}
        self.supported_operator_restrictions.update(
            {op: self.check_convolution_restrictions for op in self.convolution_ops}
        )
        self.supported_operator_restrictions.update(
            {op: self.check_depthwise_convolution_restrictions for op in self.depthwise_convolution_ops}
        )
        self.supported_operator_restrictions.update({op: self.check_pooling_restrictions for op in self.pooling_ops})
        self.supported_operator_restrictions.update(
            {op: self.check_vector_product_restrictions for op in self.fc_vector_products}
        )
        self.supported_operator_restrictions.update(
            {op: self.check_element_wise_restrictions for op in self.elem_wise_main_ops}
        )
        self.supported_operator_restrictions.update(
            {op: self.check_memory_only_restrictions for op in self.memory_only_ops}
        )

    def is_operator_supported(self, op):
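        """Return True if the operation can be placed on the NPU, False if it must stay on the CPU."""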
        if op.type not in self.supported_operators:
            return False
        if not self.check_generic_restrictions(op):
            return False
        if op.type in self.supported_operator_restrictions:
            return self.supported_operator_restrictions[op.type](op)
        return True

    def check_generic_restrictions(self, op):
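        """Generic checks: fully defined shapes, integer data types, dimension limits and fused activations."""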
        # check fully defined shapes
        for t in op.inputs + op.outputs:
            if not t.has_fully_defined_shape():
                print("Warning:", op, "has inputs/outputs of undefined shape, placing on CPU")
                return False

        # check data type
        tensors = [t for t in op.get_ifm_ifm2_weights_ofm() if t is not None]
        if not tensors:
            tensors = op.inputs
        for t in tensors:
            if not (t.dtype.type & BaseType.Int):
                return False
            if t.element_size() > 2 and op.type != "Requantize":
                return False
            # check size
            if any(dim > 65536 for dim in t.shape):
                return False

        # check fused activations
        if (
            "fused_activation_function" in op.attrs
            and op.attrs["fused_activation_function"] is not None
            and op.attrs["fused_activation_function"] not in self.supported_fused_activations
        ):
            return False
        return True

    def check_convolution_restrictions(self, op):
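        """Convolution limits: stride and dilation factors, 8-bit weights, dilated kernel size and batch size of 1."""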
        # check stride
        if op.attrs["stride_w"] > 3 or op.attrs["stride_h"] > 3:
            return False

        # check dilation
        dilation_w_factor = op.attrs.get("dilation_w_factor", 1)
        dilation_h_factor = op.attrs.get("dilation_h_factor", 1)
        if dilation_w_factor > 2 or dilation_h_factor > 2:
            return False

        # check data type
        ifm_tensor, _, weight_tensor, _ = op.get_ifm_ifm2_weights_ofm()
        if weight_tensor.element_size() > 1:
            return False

        # check kernel size
        dilated_weight_w = weight_tensor.shape[0] + (weight_tensor.shape[0] - 1) * (dilation_w_factor - 1)
        dilated_weight_h = weight_tensor.shape[1] + (weight_tensor.shape[1] - 1) * (dilation_h_factor - 1)
        if (
            dilated_weight_w > 64
            or dilated_weight_h > 64
            or dilated_weight_w * dilated_weight_h * weight_tensor.shape[2] > 127 * 65536
        ):
            return False

        # check batch size
        if ifm_tensor.shape[0] != 1:
            return False
        return True

    def check_depthwise_convolution_restrictions(self, op):
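        """Depthwise-specific check on depth_multiplier, then the common convolution restrictions."""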
        # check depth
        ifm_tensor, _, _, ofm_tensor = op.get_ifm_ifm2_weights_ofm()
        if op.attrs["depth_multiplier"] > 1 and not (
            (ifm_tensor.shape[3] == 1) and (ofm_tensor.shape[3] == op.attrs["depth_multiplier"])
        ):
            return False
        return self.check_convolution_restrictions(op)

    def check_pooling_restrictions(self, op):
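        """Pooling limits: stride, matching IFM/OFM data types, batch size of 1 and filter size per padding mode."""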
        # check stride
        if op.attrs["stride_w"] > 3 or op.attrs["stride_h"] > 3:
            return False

        # check data type
        ifm_tensor, _, _, ofm_tensor = op.get_ifm_ifm2_weights_ofm()
        if ifm_tensor.dtype != ofm_tensor.dtype:
            return False

        # check batch size
        if ifm_tensor.shape[0] != 1:
            return False

        if op.type in self.avg_pooling_ops:
            # check kernel size
            if op.attrs["padding"] == b"SAME" and (op.attrs["filter_width"] > 8 or op.attrs["filter_height"] > 8):
                return False
            if op.attrs["padding"] == b"VALID" and (op.attrs["filter_width"] > 256 or op.attrs["filter_height"] > 256):
                return False

        if op.type in self.max_pooling_ops:
            # check data type
            if ifm_tensor.dtype != ofm_tensor.dtype:
                return False
            # check kernel size
            if op.attrs["filter_width"] > 256 or op.attrs["filter_height"] > 256:  # any padding
                return False
        return True

    def check_vector_product_restrictions(self, op):
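        """Fully connected / matmul limit: weights must be 8-bit."""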
        # check data type
        ifm_tensor, _, weight_tensor, _ = op.get_ifm_ifm2_weights_ofm()
        if weight_tensor.element_size() > 1:
            return False

        return True

    def check_element_wise_restrictions(self, op):
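        """Element-wise limits: IFM/OFM types for Minimum/Maximum, batch size of 1, scalar-only constant inputs."""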
        # check data type
        ifm_tensor, ifm2_tensor, _, ofm_tensor = op.get_ifm_ifm2_weights_ofm()
        if op.type in ("Minimum", "Maximum") and ifm_tensor.dtype != ofm_tensor.dtype:
            return False

        # check batch size
        if len(ifm_tensor.shape) > 2 and ifm_tensor.shape[0] != 1:
            return False
        if op.type in self.binary_elem_wise_main_ops:  # if op type is unary, ifm2_tensor is None
            if len(ifm2_tensor.shape) > 2 and ifm2_tensor.shape[0] != 1:
                return False

        # check scalar size
        if hasattr(ifm_tensor.values, "__len__") and len(ifm_tensor.values) > 1:
            return False
        if op.type in self.binary_elem_wise_main_ops:  # same as above
            if hasattr(ifm2_tensor.values, "__len__") and len(ifm2_tensor.values) > 1:
                return False
        return True

    def check_memory_only_restrictions(self, op):
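        """StridedSlice limits: unit strides, no ellipsis_mask, not both new_axis_mask and shrink_axis_mask set."""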
        if op.type == "StridedSlice":
            # check stride size
            if len(op.inputs) > 3 and any(stride != 1 for stride in op.inputs[3].values):
                return False
            # check ellipsis_mask
            if op.attrs["ellipsis_mask"] != 0:
                return False
            # check if both new_axis_mask and shrink_axis_mask have bit set
            if op.attrs["new_axis_mask"] != 0 and op.attrs["shrink_axis_mask"] != 0:
                return False
        return True
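
# Illustrative usage sketch (not part of the original file; `graph.all_ops()` and the CPU fallback
# below are hypothetical placeholders for whatever the calling graph pass actually does):
#
#     supported_operators = SupportedOperators()
#     for op in graph.all_ops():
#         if not supported_operators.is_operator_supported(op):
#             ...  # leave this operation to run on the CPU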