# Copyright (C) 2020 Arm Limited or its affiliates. All rights reserved.
#
# SPDX-License-Identifier: Apache-2.0
#
# Licensed under the Apache License, Version 2.0 (the License); you may
# not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an AS IS BASIS, WITHOUT
# WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
# Description:
# The SupportedOperators class which is a collection of all supported operators and parameter checks.
from .data_type import BaseType
from .data_type import DataType


class SupportedOperators:
    def __init__(self, softmax_support):
        self.softmax_support = softmax_support
        # Categorised lists of supported operators
        self.npu_pre_ops = set(("QuantizedResizeBilinear", "SplitSliceRead",))
        self.convolution_ops = set(("Conv2DBiasAct", "Conv2D", "QuantizedConv2D",))
        self.depthwise_convolution_ops = set(
            ("DepthwiseConv2dBiasAct", "DepthwiseConv2dNative", "QuantizedDepthwiseConv2D",)
        )
        self.transpose_convolution_ops = set(("Conv2DBackpropInput",))
        self.max_pooling_ops = set(("QuantizedMaxPool", "MaxPool", "MaxPoolAct",))
        self.avg_pooling_ops = set(("QuantizedAvgPool", "AvgPool", "AvgPoolAct",))
        self.pooling_ops = set(("ReduceSum",)) | self.max_pooling_ops | self.avg_pooling_ops
        self.resizing_ops = set(("ResizeBilinear",))
        self.fc_vector_products = set(("QuantizedMatMul", "MatMul", "FullyConnectedAct",))
        self.mac_main_ops = (
            # convolutions
            self.convolution_ops
            # depth-wise convolutions
            | self.depthwise_convolution_ops
            # transpose convolutions
            | self.transpose_convolution_ops
            # pooling
            | self.pooling_ops
            # resizing/upscaling
            | self.resizing_ops
            # FC layers
            | self.fc_vector_products
            # RNN/LSTM/GRU
            | set(("BlockLSTM",))
        )
        self.unary_elem_wise_main_ops = set(("LeakyRelu", "Abs", "CLZ",))
        self.binary_elem_wise_min_max_ops = set(("Minimum", "Maximum",))
        self.binary_elem_wise_shift_ops = set(("SHL", "SHR",))
        self.binary_elem_wise_add_mul_sub = set(
            (
                "AddAct",
                "MulAct",
                "SubAct",
                "QuantizedAdd",
                "QuantizedSub",
                "QuantizedMul",
                "Mul",
                "Add",
                "Sub",
            )
        )
        self.binary_elem_wise_main_ops = (
            self.binary_elem_wise_min_max_ops | self.binary_elem_wise_add_mul_sub | self.binary_elem_wise_shift_ops
        )
        self.elem_wise_main_ops = self.binary_elem_wise_main_ops | self.unary_elem_wise_main_ops
        self.activation_ops = set(
            (
                "QuantizedRelu",
                "QuantizedRelu1",
                "QuantizedRelu6",
                "Relu",
                "Relu6",
                "ReluN1To1",
                "Sigmoid",
                "Tanh",
                "Softmax",
            )
        )
        self.npu_post_ops = (
            # activation functions
            self.activation_ops
            # concatenation write direction
            | set(("ConcatSliceWrite",))
            # bias add and batch norm
            | set(("QuantizedBiasAdd", "Requantize", "QuantizedBatchNorm", "BiasAdd", "FusedBatchNorm",))
            # quantization
            | set(("Quantize",))
        )
        self.split_ops = set(("Split", "SplitV", "StridedSlice", "Slice", "UnpackReshaped", "Unpack",))
        self.concat_ops = set(("Concat", "ConcatV2", "QuantizedConcat", "ConcatTFLite", "PackReshaped", "Pack",))
        self.memory_only_ops = (
            set(("Squeeze", "Reshape", "QuantizedReshape", "ExpandDims",)) | self.concat_ops | self.split_ops
        )
        self.supported_fused_activations = set(("Relu", "Relu6", "ReluN1To1", "Tanh", "Sigmoid", "LUT",))
        self.supported_operators = (
            self.npu_pre_ops | self.mac_main_ops | self.elem_wise_main_ops | self.npu_post_ops | self.memory_only_ops
        )
        # Setup supported operator restriction checkers
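        # operators without an entry in this dict only need to pass check_generic_restrictions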
        self.supported_operator_restrictions = {}
        self.supported_operator_restrictions.update(
            {op: self.check_convolution_restrictions for op in self.convolution_ops}
        )
        self.supported_operator_restrictions.update(
            {op: self.check_depthwise_convolution_restrictions for op in self.depthwise_convolution_ops}
        )
        self.supported_operator_restrictions.update(
            {op: self.check_transpose_convolution_restrictions for op in self.transpose_convolution_ops}
        )
        self.supported_operator_restrictions.update({op: self.check_pooling_restrictions for op in self.pooling_ops})
        self.supported_operator_restrictions.update({op: self.check_resize_restrictions for op in self.resizing_ops})
        self.supported_operator_restrictions.update(
            {op: self.check_vector_product_restrictions for op in self.fc_vector_products}
        )
        self.supported_operator_restrictions.update(
            {op: self.check_element_wise_restrictions for op in self.elem_wise_main_ops}
        )
        self.supported_operator_restrictions.update(
            {op: self.check_memory_only_restrictions for op in self.memory_only_ops}
        )
        self.supported_operator_restrictions.update(
            {op: self.check_quantization_restrictions for op in self.binary_elem_wise_min_max_ops}
        )
        self.supported_operator_restrictions.update({op: self.check_activation_ops for op in self.activation_ops})

    def is_operator_supported(self, op):
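        # an operator is mapped to the NPU only if its type is known, it passes the generic
        # restrictions and, where one is registered, its operator-specific restriction checker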
        if op.type not in self.supported_operators:
            return False
        if not self.check_generic_restrictions(op):
            return False
        if op.type in self.supported_operator_restrictions:
            return self.supported_operator_restrictions[op.type](op)
        return True

    def check_generic_restrictions(self, op):
        # check fully defined shapes
        for t in op.inputs + op.outputs:
            if not t.has_fully_defined_shape():
                print("Warning:", op, "has inputs/outputs of undefined shape, placing on CPU")
                return False

        # check data type
        tensors = [t for t in op.get_ifm_ifm2_weights_ofm() if t is not None]
        if not tensors:
            tensors = op.inputs
        for t in tensors:
            if not (t.dtype.type & BaseType.Int):
                return False
            if (
                t.element_size() > 2
                and op.type
                not in set(("Requantize", "ReduceSum", "CLZ",))
                | self.binary_elem_wise_add_mul_sub
                | self.binary_elem_wise_shift_ops
            ):
                return False
            # check size
            if any(dim > 65536 for dim in t.shape):
                return False

        # check fused activations
        if (
            "fused_activation_function" in op.attrs
            and op.attrs["fused_activation_function"] is not None
            and op.attrs["fused_activation_function"] not in self.supported_fused_activations
        ):
            return False
        return True

    def check_convolution_restrictions(self, op):
        # check stride
        if op.attrs["stride_w"] > 3 or op.attrs["stride_h"] > 3:
            return False

        # check dilation
        dilation_w_factor = op.attrs.get("dilation_w_factor", 1)
        dilation_h_factor = op.attrs.get("dilation_h_factor", 1)
        if dilation_w_factor > 2 or dilation_h_factor > 2:
            return False

        # check data type
        ifm_tensor, _, weight_tensor, _ = op.get_ifm_ifm2_weights_ofm()
        if weight_tensor.element_size() > 1:
            return False

        # check kernel size
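        # effective kernel size with dilation: k + (k - 1) * (dilation - 1) in each spatial dimension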
        dilated_weight_w = weight_tensor.shape[0] + (weight_tensor.shape[0] - 1) * (dilation_w_factor - 1)
        dilated_weight_h = weight_tensor.shape[1] + (weight_tensor.shape[1] - 1) * (dilation_h_factor - 1)
        if (
            dilated_weight_w > 64
            or dilated_weight_h > 64
            or dilated_weight_w * dilated_weight_h * weight_tensor.shape[2] > 127 * 65536
        ):
            return False

        # check batch size
        if ifm_tensor.shape[0] != 1:
            return False
        return True

    def check_depthwise_convolution_restrictions(self, op):
        # check depth
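        # a depth_multiplier larger than one is only supported when the IFM depth is 1 and the
        # OFM depth equals the depth multiplier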
        ifm_tensor, _, _, ofm_tensor = op.get_ifm_ifm2_weights_ofm()
        if op.attrs["depth_multiplier"] > 1 and not (
            (ifm_tensor.shape[3] == 1) and (ofm_tensor.shape[3] == op.attrs["depth_multiplier"])
        ):
            return False
        return self.check_convolution_restrictions(op)

    def check_transpose_convolution_restrictions(self, op):
        # check stride
        stride_h, stride_w = op.attrs["stride_h"], op.attrs["stride_w"]
        if stride_h != 2 or stride_w != 2:  # only a 2x2 stride is supported
            return False

        # check output dimensions
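        # with SAME padding the OFM must be exactly the IFM upscaled by the stride; with VALID
        # padding it additionally extends by max(kernel - stride, 0) in each dimension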
        ifm_tensor, weight_tensor, _, ofm_tensor = op.get_ifm_weights_biases_ofm()
        ifm_h, ifm_w = ifm_tensor.shape[1], ifm_tensor.shape[2]
        ofm_h, ofm_w = ofm_tensor.shape[1], ofm_tensor.shape[2]
        if op.attrs["padding"] == b"SAME":
            if (ofm_h != ifm_h * stride_h) or (ofm_w != ifm_w * stride_w):
                return False
        elif op.attrs["padding"] == b"VALID":
            kernel_h, kernel_w = weight_tensor.shape[0], weight_tensor.shape[1]
            if (ofm_h != ifm_h * stride_h + max(kernel_h - stride_h, 0)) or (
                ofm_w != ifm_w * stride_w + max(kernel_w - stride_w, 0)
            ):
                return False

        return self.check_convolution_restrictions(op)

    def check_pooling_restrictions(self, op):
        # check stride
        if op.attrs["stride_w"] > 3 or op.attrs["stride_h"] > 3:
            return False

        # check data type
        ifm_tensor, _, _, ofm_tensor = op.get_ifm_ifm2_weights_ofm()
        if ifm_tensor.dtype != ofm_tensor.dtype:
            if op.type != "ReduceSum":
                return False
            # TODO: else check ReduceSum restrictions.

        # check batch size
        if ifm_tensor.shape[0] != 1:
            return False

        if op.type in self.avg_pooling_ops:
            # check kernel size
            if op.attrs["padding"] == b"SAME" and (op.attrs["filter_width"] > 8 or op.attrs["filter_height"] > 8):
                return False
            if op.attrs["padding"] == b"VALID" and (
                op.attrs["filter_width"] * op.attrs["filter_height"] > 256 * 256 or op.attrs["filter_height"] > 256
            ):
                return False

        if op.type in self.max_pooling_ops:
            # check kernel size (any padding)
            if op.attrs["filter_width"] * op.attrs["filter_height"] > 256 * 256 or op.attrs["filter_height"] > 256:
                return False
        return True

    def check_resize_restrictions(self, op):
        # check unsupported upscaling factor
        if op.type == "ResizeBilinear":
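            # supported cases: a 1x1 IFM, an OFM identical to the IFM, or an exact 2x upscaling
            # (with align_corners the expected OFM is one smaller in each dimension)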
            if op.inputs[0].shape[1] == 1 and op.inputs[0].shape[2] == 1:
                return True
            if op.inputs[0].shape == op.outputs[0].shape:
                return True
            upscaled_shape = [op.inputs[0].shape[1] * 2, op.inputs[0].shape[2] * 2]
            out_shape = op.outputs[0].shape[1:3]
            if not op.attrs["align_corners"] and out_shape != upscaled_shape:
                return False
            elif op.attrs["align_corners"] and out_shape != [upscaled_shape[0] - 1, upscaled_shape[1] - 1]:
                return False
        return True

    def check_vector_product_restrictions(self, op):
        # check data type
        ifm_tensor, _, weight_tensor, _ = op.get_ifm_ifm2_weights_ofm()
        if weight_tensor.element_size() > 1:
            return False

        return True

    def check_element_wise_restrictions(self, op):
        # check data type
        ifm_tensor, ifm2_tensor, _, ofm_tensor = op.get_ifm_ifm2_weights_ofm()
        # input and output datatype must match for these operators
        if (
            op.type in self.binary_elem_wise_min_max_ops | self.unary_elem_wise_main_ops
            and ifm_tensor.dtype != ofm_tensor.dtype
        ):
            return False
        if op.type in self.binary_elem_wise_add_mul_sub:
            # both inputs must have same type
            if ifm_tensor.dtype != ifm2_tensor.dtype:
                return False
            # signed input check
            if ifm_tensor.dtype.type & BaseType.Signed:
                # output must be signed
                if ofm_tensor.dtype.type & BaseType.Unsigned:
                    return False
                # and 8, 16 or 32-bit
                if ofm_tensor.element_size() not in (1, 2, 4):
                    return False
            # unsigned input check, output must be same type or int32
            if ifm_tensor.dtype.type & BaseType.Unsigned and not (
                ifm_tensor.dtype == ofm_tensor.dtype or ofm_tensor.dtype == DataType.int32
            ):
                return False
        elif op.type in self.binary_elem_wise_shift_ops | set(("CLZ",)):
            # SHL, SHR and CLZ only operate on int32 tensors; ifm2_tensor is None for the unary CLZ
            if ifm_tensor.dtype != DataType.int32 or (
                ifm2_tensor is not None and ifm2_tensor.dtype != DataType.int32
            ):
                return False
            if op.type in ("CLZ", "SHL") and ofm_tensor.dtype != DataType.int32:
                return False

        # check batch size
        if len(ifm_tensor.shape) > 2 and ifm_tensor.shape[0] != 1:
            return False
        if op.type in self.binary_elem_wise_main_ops:  # if op type is unary, ifm2_tensor is None
            if len(ifm2_tensor.shape) > 2 and ifm2_tensor.shape[0] != 1:
                return False

        # negative alpha values are not supported
        if op.type == "LeakyRelu" and op.attrs["alpha"] < 0:
            return False

        return True

    def check_memory_only_restrictions(self, op):
        if op.type == "StridedSlice":
            # check stride size
            if len(op.inputs) > 3 and any(stride != 1 for stride in op.inputs[3].values):
                return False
            # check "end - begin" doesn't result in any zero or negative elements
            if any((end - begin) <= 0 for begin, end in zip(op.inputs[1].values, op.inputs[2].values)):
                return False
            # check ellipsis_mask
            if op.attrs["ellipsis_mask"] != 0:
                return False
            # check if both new_axis_mask and shrink_axis_mask have bit set
            if op.attrs["new_axis_mask"] != 0 and op.attrs["shrink_axis_mask"] != 0:
                return False
        return True

    def check_quantization_restrictions(self, op):
        # makes sure IFM1, IFM2 and OFM quantization are equal for binary ops
        if (
            len(op.inputs) == 2
            and not op.inputs[0].quantization == op.inputs[1].quantization == op.outputs[0].quantization
        ):
            print(
                "Warning: Input/output tensors with different quantization are unsupported for the", op.type, "operator"
            )
            return False
        return True

    def check_activation_ops(self, op):
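        # only Softmax needs extra checks here, and only when softmax support has been enabled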
        if op.type == "Softmax":
            if not self.softmax_support:
                return False

            ifm_tensor = op.inputs[0]
            ofm_tensor = op.outputs[0]

            # check data type
            if ifm_tensor.dtype != ofm_tensor.dtype:
                return False

            if ifm_tensor.dtype not in (DataType.uint8, DataType.int8, DataType.int16):
                return False

            # check batch size
            if len(ifm_tensor.shape) in (2, 4) and ifm_tensor.shape[0] != 1:
                return False

        return True
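

# Minimal usage sketch (illustrative only): `op` stands for an operation object from the rest of the
# compiler that provides the `type`, `attrs`, `inputs`/`outputs` and tensor helper methods assumed
# by the checks above.
#
#     supported_operators = SupportedOperators(softmax_support=True)
#     if not supported_operators.is_operator_supported(op):
#         ...  # leave the operator on the CPU instead of placing it on the NPU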