# Copyright (C) 2020 Arm Limited or its affiliates. All rights reserved.
#
# SPDX-License-Identifier: Apache-2.0
#
# Licensed under the Apache License, Version 2.0 (the License); you may
# not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an AS IS BASIS, WITHOUT
# WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
# Description:
# The SupportedOperators class which is a collection of all supported operators and parameter checks.
import numpy as np

from .data_type import BaseType
from .data_type import DataType
from .operation import get_slice_offsets


def warn_cpu(op, msg):
    print("Warning: {} {}, placing on CPU".format(op.type, msg))


class SupportedOperators:
    def __init__(self):
        # Categorised lists of supported operators
        self.npu_pre_ops = set(("QuantizedResizeBilinear", "SplitSliceRead",))
        self.convolution_ops = set(("Conv2DBiasAct", "Conv2D", "QuantizedConv2D",))
        self.depthwise_convolution_ops = set(
            ("DepthwiseConv2dBiasAct", "DepthwiseConv2dNative", "QuantizedDepthwiseConv2D",)
        )
        self.transpose_convolution_ops = set(("Conv2DBackpropInput",))
        self.max_pooling_ops = set(("QuantizedMaxPool", "MaxPool", "MaxPoolAct",))
        self.avg_pooling_ops = set(("QuantizedAvgPool", "AvgPool", "AvgPoolAct",))
        self.pooling_ops = set(("ReduceSum",)) | self.max_pooling_ops | self.avg_pooling_ops
        self.resizing_ops = set(("ResizeBilinear",))
        self.fc_vector_products = set(("QuantizedMatMul", "MatMul", "FullyConnectedAct",))
        self.mac_main_ops = (
            # convolutions
            self.convolution_ops
            # depth-wise convolutions
            | self.depthwise_convolution_ops
            # transpose convolutions
            | self.transpose_convolution_ops
            # pooling
            | self.pooling_ops
            # resizing/upscaling
            | self.resizing_ops
            # FC layers
            | self.fc_vector_products
            # RNN/LSTM/GRU
            | set(("BlockLSTM",))
        )
        self.unary_elem_wise_main_ops = set(("LeakyRelu", "Abs", "CLZ",))
        self.binary_elem_wise_min_max_ops = set(("Minimum", "Maximum",))
        self.binary_elem_wise_shift_ops = set(("SHL", "SHR",))
        self.binary_elem_wise_add_mul_sub = set(
            ("AddAct", "MulAct", "SubAct", "QuantizedAdd", "QuantizedSub", "QuantizedMul", "Mul", "Add", "Sub",)
        )
        self.binary_elem_wise_main_ops = (
            self.binary_elem_wise_min_max_ops | self.binary_elem_wise_add_mul_sub | self.binary_elem_wise_shift_ops
        )
        self.elem_wise_main_ops = self.binary_elem_wise_main_ops | self.unary_elem_wise_main_ops
        self.activation_ops = set(
            (
                "QuantizedRelu",
                "QuantizedRelu1",
                "QuantizedRelu6",
                "Relu",
                "Relu6",
                "ReluN1To1",
                "Sigmoid",
                "Tanh",
                "Softmax",
            )
        )
        self.npu_post_ops = (
            # activation functions
            self.activation_ops
            # concatenation write direction
            | set(("ConcatSliceWrite",))
            # bias add and batch norm
            | set(("QuantizedBiasAdd", "Requantize", "QuantizedBatchNorm", "BiasAdd", "FusedBatchNorm",))
            # Quantization
            | set(("Quantize",))
        )
        self.split_ops = set(("Split", "SplitV", "StridedSlice", "Slice", "UnpackReshaped", "Unpack",))
        self.concat_ops = set(("Concat", "ConcatV2", "QuantizedConcat", "ConcatTFLite", "PackReshaped", "Pack",))
        self.memory_only_ops = (
            set(("Squeeze", "Reshape", "QuantizedReshape", "ExpandDims",)) | self.concat_ops | self.split_ops
        )
        self.shapeless_input_ops = self.binary_elem_wise_main_ops | set(("Split", "SplitV",))
        self.supported_fused_activations = set(("Relu", "Relu6", "ReluN1To1", "Tanh", "Sigmoid", "LUT",))
        self.supported_operators = (
            self.npu_pre_ops | self.mac_main_ops | self.elem_wise_main_ops | self.npu_post_ops | self.memory_only_ops
        )
        # Setup supported operator restriction checkers
        self.supported_operator_restrictions = {}
        self.supported_operator_restrictions.update(
            {op: self.check_convolution_restrictions for op in self.convolution_ops}
        )
        self.supported_operator_restrictions.update(
            {op: self.check_depthwise_convolution_restrictions for op in self.depthwise_convolution_ops}
        )
        self.supported_operator_restrictions.update(
            {op: self.check_transpose_convolution_restrictions for op in self.transpose_convolution_ops}
        )
        self.supported_operator_restrictions.update({op: self.check_pooling_restrictions for op in self.pooling_ops})
        self.supported_operator_restrictions.update({op: self.check_resize_restrictions for op in self.resizing_ops})
        self.supported_operator_restrictions.update(
            {op: self.check_vector_product_restrictions for op in self.fc_vector_products}
        )
        self.supported_operator_restrictions.update(
            {op: self.check_element_wise_restrictions for op in self.elem_wise_main_ops}
        )
        self.supported_operator_restrictions.update(
            {op: self.check_memory_only_restrictions for op in self.memory_only_ops}
        )
        self.supported_operator_restrictions.update({op: self.check_activation_ops for op in self.activation_ops})

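    # A minimal usage sketch (hypothetical call site; the real caller lives in the
    # graph preparation passes and may differ):
    #
    #     supported = SupportedOperators()
    #     for op in all_ops:  # any iterable of Operation objects
    #         op.run_on_npu = supported.is_operator_supported(op)
    #
    # Operators that fail any check are left on the CPU.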
    def is_operator_supported(self, op):
        if op.type not in self.supported_operators:
            return False
        if not self.check_generic_restrictions(op):
            return False
        if op.type in self.supported_operator_restrictions:
            return self.supported_operator_restrictions[op.type](op)
        return True

    def check_generic_restrictions(self, op):
        # check fully defined shapes
        for t in op.inputs:
            if not t:
                continue
            if not t.has_fully_defined_shape():
                print("Warning:", op.type, "has input(s) of undefined shape, placing on CPU")
                return False
            if t.shape == [] and op.type not in self.shapeless_input_ops:
                print(
                    "Warning:",
                    op.type,
                    "has input(s) of shape [].",
                    "Scalar input or broadcasting is not supported for this operator,",
                    "placing on CPU",
                )
                return False
            if len(t.shape) > 4:
                print("Warning:", op.type, "has input(s) of unsupported shape", t.shape, "placing on CPU")
                return False
        for t in op.outputs:
            if not t.has_fully_defined_shape():
                print("Warning:", op.type, "has output(s) of undefined shape, placing on CPU")
                return False
            if t.shape == []:
                print(
                    "Warning:",
                    op.type,
                    "has output(s) of shape [].",
                    "Scalar input or broadcasting is not supported for this operator,",
                    "placing on CPU",
                )
                return False
            if len(t.shape) > 4:
                print("Warning:", op.type, "has output(s) of unsupported shape", t.shape, "placing on CPU")
                return False

        # check data type
        tensors = [t for t in op.get_ifm_ifm2_weights_ofm() if t is not None]
        if not tensors:
            tensors = op.inputs
        for t in tensors:
            if not (t.dtype.type & BaseType.Int):
                return False
            if (
                t.element_size() > 2
                and op.type
                not in set(("Requantize", "ReduceSum", "CLZ",))
                | self.binary_elem_wise_add_mul_sub
                | self.binary_elem_wise_shift_ops
            ):
                return False
            # check size
            if any(dim > 65536 for dim in t.shape):
                return False
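            # element_size() > 2 means a tensor wider than 16 bits; only the op
            # types listed above may use such tensors, and no single dimension
            # of any tensor may exceed 65536.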

        # check fused activations
        if (
            "fused_activation_function" in op.attrs
            and op.attrs["fused_activation_function"] is not None
            and op.attrs["fused_activation_function"] not in self.supported_fused_activations
        ):
            return False

        # check inf values
        for tens in op.get_ifm_ifm2_weights_ofm():
            if (
                (tens is not None)
                and (tens.quantization is not None)
                and (tens.quantization.scale_f32 is not None)
                and (np.isinf(tens.quantization.scale_f32).any())
            ):
                print("Warning:", op.type, "has inf valued tensor(s), placing on CPU")
                return False

        return True

    def check_convolution_restrictions(self, op):
        # check stride
        if op.attrs["stride_w"] > 3 or op.attrs["stride_h"] > 3:
            return False

        # check dilation
        dilation_w_factor = op.attrs.get("dilation_w_factor", 1)
        dilation_h_factor = op.attrs.get("dilation_h_factor", 1)
        if dilation_w_factor > 2 or dilation_h_factor > 2:
            return False

        # check data type
        ifm_tensor, _, weight_tensor, bias_tensor, _ = op.get_ifm_ifm2_weights_biases_ofm()
        if weight_tensor.element_size() > 1:
            return False

        if not self.check_bias_restrictions(bias_tensor):
            return False

        # check kernel size [HWIO]
        dilated_weight_w = weight_tensor.shape[1] + (weight_tensor.shape[1] - 1) * (dilation_w_factor - 1)
        dilated_weight_h = weight_tensor.shape[0] + (weight_tensor.shape[0] - 1) * (dilation_h_factor - 1)

        if dilated_weight_w > 64 or dilated_weight_h > 64:
            return False

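        # Worked example: a 3x3 kernel with dilation factor 2 has a dilated size
        # of 3 + (3 - 1) * (2 - 1) = 5 in each dimension, well inside the 64x64
        # limit checked above.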
        # check non const weights
        if weight_tensor.values is None:
            print("Warning:", op.type, "has non-const weights, placing on CPU")
            return False

        # check weight sums over [HWI]
        zero_point = weight_tensor.quantization.zero_point
        quant_weights = weight_tensor.quant_values.astype(np.int64)
        weights = quant_weights - zero_point
        totals = np.sum(np.absolute(weights), axis=(0, 1, 2))

        if np.amax(totals) > 127 * 65536:
            return False

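        # 127 * 65536 = 8 323 072: the largest allowed sum of absolute,
        # zero-point-corrected weight values per output channel (assumed to be a
        # hardware scaling limit; the check above rejects anything larger).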
        # check batch size
        if ifm_tensor.shape[0] != 1:
            return False

        return True

    def check_depthwise_convolution_restrictions(self, op):
        # check depth
        ifm_tensor, _, _, ofm_tensor = op.get_ifm_ifm2_weights_ofm()
        if op.attrs["depth_multiplier"] > 1 and not (
            (ifm_tensor.shape[3] == 1) and (ofm_tensor.shape[3] == op.attrs["depth_multiplier"])
        ):
            return False
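        # Example: depth_multiplier == 8 is only accepted when the IFM has a
        # single channel (shape[3] == 1) and the OFM has exactly 8 channels.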
        return self.check_convolution_restrictions(op)

    def check_transpose_convolution_restrictions(self, op):
        # check stride, only 2x2 is supported
        stride_h, stride_w = op.attrs["stride_h"], op.attrs["stride_w"]
        if stride_h != 2 or stride_w != 2:
            return False

        # check output dimensions
        ifm_tensor, weight_tensor, _, ofm_tensor = op.get_ifm_weights_biases_ofm()
        ifm_h, ifm_w = ifm_tensor.shape[1], ifm_tensor.shape[2]
        ofm_h, ofm_w = ofm_tensor.shape[1], ofm_tensor.shape[2]
        if op.attrs["padding"] == b"SAME":
            if (ofm_h != ifm_h * stride_h) or (ofm_w != ifm_w * stride_w):
                return False
        elif op.attrs["padding"] == b"VALID":
            kernel_h, kernel_w = weight_tensor.shape[0], weight_tensor.shape[1]
            if (ofm_h != ifm_h * stride_h + max(kernel_h - stride_h, 0)) or (
                ofm_w != ifm_w * stride_w + max(kernel_w - stride_w, 0)
            ):
                return False
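        # Example: with stride 2, a 16x16 IFM must give a 32x32 OFM under SAME
        # padding, or a (16 * 2 + max(3 - 2, 0)) = 33x33 OFM under VALID padding
        # with a 3x3 kernel.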

        return self.check_convolution_restrictions(op)

    def check_pooling_restrictions(self, op):
        # check stride
        if op.attrs["stride_w"] > 3 or op.attrs["stride_h"] > 3:
            return False

        # check data type
        ifm_tensor, _, _, ofm_tensor = op.get_ifm_ifm2_weights_ofm()
        if ifm_tensor.dtype != ofm_tensor.dtype:
            if op.type != "ReduceSum":
                return False
            # TODO: else check ReduceSum restrictions.

        # check batch size
        if ifm_tensor.shape[0] != 1:
            return False

        if op.type in self.avg_pooling_ops:
            # check kernel size
            if op.attrs["padding"] == b"SAME" and (op.attrs["filter_width"] > 8 or op.attrs["filter_height"] > 8):
                return False
            if op.attrs["padding"] == b"VALID" and (
                op.attrs["filter_width"] * op.attrs["filter_height"] > 256 * 256 or op.attrs["filter_height"] > 256
            ):
                return False

        if op.type in self.max_pooling_ops:
            # check kernel size (any padding)
            if op.attrs["filter_width"] * op.attrs["filter_height"] > 256 * 256 or op.attrs["filter_height"] > 256:
                return False
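        # 256 * 256 = 65536 is the largest kernel area accepted above, and the
        # kernel height may not exceed 256 (average pooling with SAME padding is
        # limited further, to 8x8).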
        return True

    def check_resize_restrictions(self, op):
        # check unsupported upscaling factor
        if op.type == "ResizeBilinear":
            if op.inputs[0].shape[1] == 1 and op.inputs[0].shape[2] == 1:
                return True
            if op.inputs[0].shape == op.outputs[0].shape:
                return True
            upscaled_shape = np.array(op.inputs[0].shape[1:3])
            out_shape = np.array(op.outputs[0].shape[1:3])
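            # Only repeated 2x upscaling is accepted below: e.g. a 4x4 IFM may
            # produce an 8x8, 16x16, ... OFM, or a 7x7, 13x13, ... OFM when
            # align_corners is set (each doubling then subtracts one).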
            while (upscaled_shape < out_shape).all():
                upscaled_shape *= 2
                if op.attrs["align_corners"]:
                    upscaled_shape -= 1
                if np.array_equal(out_shape, upscaled_shape):
                    return True
        return False

    def check_vector_product_restrictions(self, op):
        # check data type
        _, _, weight_tensor, bias_tensor, _ = op.get_ifm_ifm2_weights_biases_ofm()
        if weight_tensor.element_size() > 1:
            return False

        if not self.check_bias_restrictions(bias_tensor):
            return False

        # check non const weights
        if weight_tensor.values is None:
            print("Warning:", op.type, "has non-const weights, placing on CPU")
            return False

        return True

    def check_element_wise_restrictions(self, op):
        # check data type
        ifm_tensor, ifm2_tensor, _, ofm_tensor = op.get_ifm_ifm2_weights_ofm()
        # input and output datatype must match for these operators
        if (
            op.type in self.binary_elem_wise_min_max_ops | self.unary_elem_wise_main_ops
            and ifm_tensor.dtype != ofm_tensor.dtype
        ):
            return False
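        # For Add/Mul/Sub both inputs must share a data type; a signed input
        # (e.g. int8) may only produce a signed 8/16/32-bit output, and an
        # unsigned input (e.g. uint8) only the same type or int32.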
        if op.type in self.binary_elem_wise_add_mul_sub:
            # both inputs must have same type
            if ifm_tensor.dtype != ifm2_tensor.dtype:
                return False
            # signed input check
            if ifm_tensor.dtype.type & BaseType.Signed:
                # output must be signed
                if ofm_tensor.dtype.type & BaseType.Unsigned:
                    return False
                # and 8, 16 or 32-bit
                if ofm_tensor.element_size() not in (1, 2, 4):
                    return False
            # unsigned input check, output must be same type or int32
            if ifm_tensor.dtype.type & BaseType.Unsigned and not (
                ifm_tensor.dtype == ofm_tensor.dtype or ofm_tensor.dtype == DataType.int32
            ):
                return False
        elif op.type in self.binary_elem_wise_shift_ops | set(("CLZ",)):
            # CLZ is unary, so ifm2_tensor may be None for it
            if ifm_tensor.dtype != DataType.int32 or (
                ifm2_tensor is not None and ifm2_tensor.dtype != DataType.int32
            ):
                return False
            if op.type in ("CLZ", "SHL") and ofm_tensor.dtype != DataType.int32:
                return False

        # check batch size
        if len(ifm_tensor.shape) > 2 and ifm_tensor.shape[0] != 1:
            return False
        if op.type in self.binary_elem_wise_main_ops:  # if op type is unary, ifm2_tensor is None
            if len(ifm2_tensor.shape) > 2 and ifm2_tensor.shape[0] != 1:
                return False

        # negative alpha values are not supported
        if op.type == "LeakyRelu" and op.attrs["alpha"] < 0:
            return False

        # check if ifm or ifm2 has ofm shape
        if ifm_tensor.shape != ofm_tensor.shape and ifm2_tensor.shape != ofm_tensor.shape:
            return False

        if op.type in self.binary_elem_wise_min_max_ops and not self.check_quantization_restrictions_binary_elem_wise(
            op
        ):
            return False

        return True

    def check_memory_only_restrictions(self, op):
        if op.type == "StridedSlice":
            if len(op.inputs) != 4:
                warn_cpu(op, "has {} input tensors, only 4 inputs are supported".format(len(op.inputs)))
                return False
            input_tens, begin_tens, end_tens, strides_tens = op.inputs
            if begin_tens.values is None or end_tens.values is None or strides_tens.values is None:
                warn_cpu(op, "has a non-constant begin, end, or stride input tensor, which is not supported")
                return False
            if not (
                len(input_tens.shape)
                == len(op.outputs[0].shape)
                == len(begin_tens.values)
                == len(end_tens.values)
                == len(strides_tens.values)
            ):
                warn_cpu(op, "has input tensors with shapes that are not supported")
                return False
            # check stride size
            if any(stride != 1 for stride in strides_tens.values):
                warn_cpu(op, "has stride values {}, only stride 1 values are supported".format(strides_tens.values))
                return False
            # check ellipsis_mask
            if op.attrs["ellipsis_mask"] != 0:
                warn_cpu(op, "ellipsis_mask is {}, only 0 is supported".format(op.attrs["ellipsis_mask"]))
                return False
            # check if both new_axis_mask and shrink_axis_mask have bit set
            if op.attrs["new_axis_mask"] != 0 and op.attrs["shrink_axis_mask"] != 0:
                warn_cpu(op, "new_axis_mask and shrink_axis_mask are both non-zero, which is not supported")
                return False
            # Calculate offset start/end
            offset_start = get_slice_offsets(input_tens.shape, begin_tens, op.attrs["begin_mask"], is_begin=True)
            offset_end = get_slice_offsets(input_tens.shape, end_tens, op.attrs["end_mask"], is_begin=False)
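            # get_slice_offsets (imported from .operation) is assumed here to
            # resolve the begin/end tensors into absolute per-dimension offsets,
            # taking the begin_mask/end_mask bits into account.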
            # check "end - begin" doesn't result in any zero or negative elements
            if any((end - begin) <= 0 for begin, end in zip(offset_start, offset_end)):
                warn_cpu(
                    op,
                    "has slice begin values {}, some of which are >= end values {}, which is illegal".format(
                        begin_tens.values, end_tens.values
                    ),
                )
                return False
        if op.type == "SplitV":
            # check that at most one size is set to -1, indicating that size should be inferred
            sizes = op.inputs[1].values
            num_to_be_inferred = 0
            for size in sizes:
                if size == -1:
                    num_to_be_inferred += 1

            if num_to_be_inferred > 1:
                print("Warning:", op.type, "has more than one size to be inferred, which is illegal, placing on CPU")
                return False
        if op.type.find("Concat") != -1:
            axis = op.attrs.get("axis", None)
            if axis is None:
                print("Warning:", op.type, "invalid or missing axis, placing on CPU")
                return False
            if axis < 0:
                axis += len(op.inputs[0].shape)
            if not 0 < axis < len(op.inputs[0].shape):
                print("Warning:", op.type, "invalid axis", axis, ", placing on CPU")
                return False
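            # Example: concatenating NHWC inputs of shape [1, 8, 8, 16] and
            # [1, 8, 8, 32] along axis 3 gives an OFM of [1, 8, 8, 48]; the loop
            # below checks that every non-axis dimension matches the OFM.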
            ofm = op.outputs[0]
            ofm_dims = len(ofm.shape)
            for ifm in op.inputs:
                if len(ifm.shape) != ofm_dims:
                    return False
                for i in range(ofm_dims):
                    if i != axis and ifm.shape[i] != ofm.shape[i]:
                        print(
                            "Warning:",
                            op.type,
                            "invalid ifm:",
                            ifm.name,
                            ifm.shape,
                            "mismatch in dimension",
                            i,
                            ", placing on CPU",
                        )
                        return False

        return True

    def check_quantization_restrictions_binary_elem_wise(self, op):
        # makes sure IFM1, IFM2 and OFM quantization are equal for binary ops
        assert len(op.inputs) >= 2 and len(op.outputs) == 1

        if (
            op.inputs[0].quantization is None
            or not op.inputs[0].is_scaling_equal(op.inputs[1])
            or not op.inputs[0].is_scaling_equal(op.outputs[0])
        ):
            print(
                "Warning: Input/output tensors with different quantization is unsupported for the", op.type, "operator"
            )
            return False

        return True

    def check_activation_ops(self, op):
        if op.type == "Softmax":
            ifm_tensor = op.inputs[0]
            ofm_tensor = op.outputs[0]

            # check data type
            if ifm_tensor.dtype != ofm_tensor.dtype:
                return False

            if ifm_tensor.dtype not in (DataType.uint8, DataType.int8, DataType.int16):
                return False

            # check shape
            if len(ifm_tensor.shape) > 4 or ifm_tensor.shape != ofm_tensor.shape:
                return False

        return True

    def check_bias_restrictions(self, bias_tensor):
        # check data type
        if bias_tensor is not None and bias_tensor.dtype not in (DataType.int32, DataType.int64):
            return False

        # check that the values fit in 40 bits
        if bias_tensor is not None and bias_tensor.dtype == DataType.int64:
            for quant_value in bias_tensor.quant_values:
                if not (-(1 << 39) <= quant_value < (1 << 39)):
                    return False
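        # 1 << 39 = 549_755_813_888, so int64 bias values must lie in the range
        # [-549_755_813_888, 549_755_813_887] to pass the 40-bit check above.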

        return True