# Copyright (C) 2020 Arm Limited or its affiliates. All rights reserved.
#
# SPDX-License-Identifier: Apache-2.0
#
# Licensed under the Apache License, Version 2.0 (the License); you may
# not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an AS IS BASIS, WITHOUT
# WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
# Description:
# Internal representation of a Neural Network Tensor.
import copy
import enum
import uuid
from collections import defaultdict
from enum import auto
from functools import lru_cache
from functools import total_ordering
from typing import Dict
from typing import List
from typing import Optional
from typing import Tuple
from typing import Union
from uuid import UUID

import numpy as np

from . import numeric_util
from .data_type import BaseType
from .data_type import DataType
from .errors import UnsupportedFeatureError
from .errors import VelaError
from .ethos_u55_regs.ethos_u55_regs import resampling_mode
from .operation import Op
from .operation import Operation

Shape = List


class MemType(enum.IntFlag):
    Unknown = 0
    Permanent_NPU = 1
    Permanent_CPU = 2
    Scratch = 3
    Scratch_fast = 4
    Size = Scratch_fast + 1

    def display_name(self) -> str:
        return ("Unknown", "Permanent_NPU", "Permanent_CPU", "Scratch", "Scratch_fast", "Size")[self.value]

    def identifier_name(self) -> str:
        return ("unknown", "permanent_npu", "permanent_cpu", "scratch", "scratch_fast", "size")[self.value]

    @staticmethod
    def all():
        return (MemType.Permanent_NPU, MemType.Permanent_CPU, MemType.Scratch, MemType.Scratch_fast)

    def __str__(self):
        return self.name


class BandwidthDirection(enum.IntEnum):
    Read = 0
    Write = auto()
    Size = auto()

    def display_name(self):
        return self.name

    def identifier_name(self):
        return self.name.lower()

    @staticmethod
    def all():
        return (BandwidthDirection.Read, BandwidthDirection.Write)


class MemArea(enum.IntFlag):
    Unknown = 0
    Sram = 1
    Dram = 2
    OnChipFlash = 3
    OffChipFlash = 4
    Shram = 5  # for LUT
    Size = Shram + 1

    def display_name(self) -> str:
        return ("Unknown", "SRAM", "DRAM", "On-chip Flash", "Off-chip Flash", "SHRAM", "Size")[self.value]

    def identifier_name(self) -> str:
        return ("unknown", "sram", "dram", "on_chip_flash", "off_chip_flash", "shram", "size")[self.value]

    @staticmethod
    def all():
        return (MemArea.Sram, MemArea.Dram, MemArea.OnChipFlash, MemArea.OffChipFlash, MemArea.Shram)

    def __str__(self):
        return self.name


class TensorPurpose(enum.IntFlag):
    Unknown = 0
    Weights = 1
    FeatureMap = 2
    Scratch = 3
    LUT = 4
    FSBias = 5
    Size = 6

    def display_name(self) -> str:
        return ("Unknown", "Weights", "FeatureMap", "Scratch", "LUT", "FastStorageBias", "Size")[self.value]

    def identifier_name(self) -> str:
        return ("unknown", "weights", "feature_map", "scratch", "lut", "fast_storage_bias", "size")[self.value]

    @staticmethod
    def all():
        return (TensorPurpose.Weights, TensorPurpose.FeatureMap, TensorPurpose.FSBias)


class TensorSubPurpose(enum.Enum):
    Standard = 0
    DoubleBuffer = 1
    RollingBufferX = 2
    RollingBufferY = 3
    RollingBufferXY = 4

    def display_name(self) -> str:
        return ("Standard", "Double Buffer", "Rolling Buffer X", "Rolling Buffer Y", "Rolling Buffer XY")[self.value]

    def identifier_name(self) -> str:
        return ("standard", "double_buffer", "rolling_buffer_x", "rolling_buffer_y", "rolling_buffer_xy")[self.value]

    @staticmethod
    def all():
        return (
            TensorSubPurpose.Standard,
            TensorSubPurpose.DoubleBuffer,
            TensorSubPurpose.RollingBufferX,
            TensorSubPurpose.RollingBufferY,
            TensorSubPurpose.RollingBufferXY,
        )


class TensorFormat(enum.Flag):
    Unknown = 0
    WeightsCompressed = 1
    NHWC = 2
    NHCWB16 = 3

    def __str__(self):
        return self.name


class TensorBlockTraversal(enum.Enum):
    Default = 0
    DepthWise = 1
    DepthFirst = 2
    PartKernelFirst = 3


def shape_num_elements(shp: Shape) -> Optional[int]:
    elems = 1
    if shp is None:
        return None
    for d in shp:
        if d is None:
            return None
        elems *= d
    return elems
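
# Illustrative examples of shape_num_elements (values chosen for this sketch):
#   shape_num_elements([1, 8, 8, 16]) == 1024
#   shape_num_elements([1, None, 8, 16]) is None  # a None dimension is unknown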


def shape_fully_defined(shp: Shape) -> bool:
    if shp is None:
        return False
    for d in shp:
        if d is None:
            return False
    return True


def shape_round_to_quantum(shp: Shape, quantum: Tuple) -> Shape:
    new_shp = list(shp)

    # Traverse backwards using length of shape since there may be more rounding quantums than shape elements
    for i in range(-1, -len(shp) - 1, -1):
        if new_shp[i] is not None:
            new_shp[i] = numeric_util.round_up(new_shp[i], quantum[i])
    return new_shp
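
# Illustrative example of shape_round_to_quantum: the quantum is applied from
# the innermost dimension outwards and may be longer than the shape:
#   shape_round_to_quantum([9, 20], (1, 1, 1, 16)) == [9, 32]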


@lru_cache(maxsize=None)
def create_equivalence_id(key) -> UUID:
    # Generates equivalence_id based on the given key.
    return uuid.uuid4()
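
# Illustrative example: because of the lru_cache, calls with an equal
# (hashable) key return the same id, so tensors built from identical
# constant data can share an equivalence_id:
#   assert create_equivalence_id(("bias", 42)) == create_equivalence_id(("bias", 42))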


class QuantizationParameters:
    __slots__ = "min", "max", "num_bits", "narrow_range", "scale_f32", "zero_point", "quant_min", "quant_max"

    def __init__(
        self,
        min: Union[float, np.ndarray, None] = None,
        max: Union[float, np.ndarray, None] = None,
        num_bits=None,
        narrow_range=None,
    ):
        self.min = min
        self.max = max

        self.num_bits = num_bits
        self.narrow_range = narrow_range

        self.scale_f32: Union[float, np.ndarray, None] = None
        self.zero_point: Union[int, np.ndarray, None] = None
        self.quant_min: Optional[float] = None
        self.quant_max: Optional[float] = None

    def __str__(self):
        return "<nng.QuantizationParameters min=%s max=%s, num_bits=%s, scale=%s, zero_point=%s>" % (
            self.min,
            self.max,
            self.num_bits,
            self.scale_f32,
            self.zero_point,
        )

    __repr__ = __str__

    def clone(self) -> "QuantizationParameters":
        res = QuantizationParameters()
        res.min = self.min
        res.max = self.max

        res.num_bits = self.num_bits
        res.narrow_range = self.narrow_range

        res.scale_f32 = self.scale_f32
        res.zero_point = self.zero_point
        res.quant_min = self.quant_min
        res.quant_max = self.quant_max
        return res

    def dequantize(self, values):
        if self.zero_point.size == 1 and self.scale_f32.size == 1:
            # same scale is used for all values
            res = (values.astype(np.float64) - self.zero_point) * self.scale_f32
        else:
            # a different scale is used for different sets of values, but this
            # is not compatible with the format of depthwise weights, where the
            # input is at index 3 (Output, Kh, Kw, Input), so return the
            # quantized values unscaled (as float)
            return values.astype(np.float64)

        return res
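
    # Illustrative example of dequantize, assuming scalar (per-tensor) numpy
    # quantisation parameters; values are chosen for this sketch:
    #   with scale_f32 = np.float32(0.5) and zero_point = np.int32(128),
    #   dequantize(np.array([128, 130])) returns array([0.0, 1.0])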

    def is_scaling_equal(self, other: Optional["QuantizationParameters"]) -> bool:
        # quantisation parameter scaling is not equal if 'other' is None because
        # it implies that the tensor it belongs to is not quantised. otherwise,
        # it depends upon whether the scale and zero point are equal

        if not isinstance(other, QuantizationParameters):
            return False

        return self.scale_f32 == other.scale_f32 and self.zero_point == other.zero_point

    def is_valid(self) -> bool:
        # quantisation parameters are considered valid if they have a scale and zero point

        return None not in (self.scale_f32, self.zero_point)

    def is_per_axis(self) -> bool:
        """Returns True if either the scale, zero point, minimum or maximum values are arrays"""
        for attr in ("scale_f32", "zero_point", "min", "max"):
            if isinstance(getattr(self, attr), np.ndarray):
                return True
        return False


def create_const_tensor(
    name: str,
    shape: Shape,
    dtype: DataType,
    values: np.ndarray,
    value_dtype: np.dtype = None,
    purpose: TensorPurpose = TensorPurpose.Unknown,
    quantization: QuantizationParameters = None,
):
    # Tensor
    const_tensor = Tensor(shape, dtype, name + "_0")
    const_tensor.purpose = purpose
    const_tensor.quantization = quantization
    const_tensor.values = np.array(values, dtype=value_dtype)
    const_tensor.quant_values = np.frombuffer(const_tensor.values.tobytes(), dtype=np.uint8)
    # Operator
    const_op = Operation(Op.Const, name)
    const_op.set_output_tensor(const_tensor)
    return const_tensor
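
# Illustrative usage of create_const_tensor (names invented for this sketch):
#   shape_tens = create_const_tensor("new_shape", [2], DataType.int32, [1, 64])
#   assert shape_tens.ops[0].type == Op.Const  # driven by a Const operation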


def create_reshape_tensor(tens, shape, ifm_reshape=True):
    if shape == tens.shape:
        return tens
    # Tensors
    name = tens.name + "_reshape"
    reshape_ifm = tens
    reshape_ofm = tens.clone("_reshaped")
    reshape_ofm.set_all_shapes(shape)
    if not ifm_reshape:
        reshape_ifm, reshape_ofm = reshape_ofm, reshape_ifm
    # Operator
    reshape_op = Operation(Op.Reshape, name)
    reshape_op.attrs["new_shape"] = shape
    reshape_op.add_input_tensor(reshape_ifm)
    reshape_op.add_input_tensor(create_const_tensor(name + "_shape", [1], DataType.int32, shape))
    reshape_op.set_output_tensor(reshape_ofm)
    return reshape_ofm if ifm_reshape else reshape_ifm
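
# Illustrative usage of create_reshape_tensor, for some existing tensor `tens`:
#   reshaped = create_reshape_tensor(tens, [1, 1, 1, 64])
# wires `tens` through a Reshape operation and returns the reshaped OFM clone
# (or, with ifm_reshape=False, reshapes on the input side instead).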


# class that keeps track of all tensor addresses in the different memory types
class TensorAddressMap:
    address_map: Dict = defaultdict(dict)  # dict (tens.equivalence_id -> dict (mem_type -> address))

    @classmethod
    def get_address_for_tens(cls, tens_id: UUID, mem_type: MemType) -> int:
        return cls.address_map[tens_id].get(mem_type)

    @classmethod
    def set_address_for_tens(cls, tens_id: UUID, mem_type: MemType, address: int):
        # Check previous address if there is one
        previous_address = cls.address_map[tens_id].get(mem_type)
        if address is not None and previous_address is not None:
            assert previous_address == address, "Two different addresses cannot be assigned to the same tensor."

        # Set tensor's address for memory type
        cls.address_map[tens_id][mem_type] = address
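
# Note on the map above: because addresses are keyed on equivalence_id, a
# shallow clone of a tensor (which keeps the same equivalence_id) observes
# any address assigned through the other tensor's `address` property.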


@total_ordering
class Tensor:
    __slots__ = (
        "shape",
        "storage_shape",
        "bandwidth_shape",
        "dtype",
        "name",
        "ops",
        "consumer_list",
        "values",
        "quant_values",
        "compressed_values",
        "compressed_values_substream_offsets",
        "mem_area",
        "mem_type",
        "format",
        "purpose",
        "sub_purpose",
        "alignment",
        "weight_transpose_depthwise",
        "storage_compression_scale",
        "bandwidth_compression_scale",
        "compression_scale_for_worst_weight_stream",
        "weight_compression_scales",
        "weight_compression_config",
        "value_id",
        "storage_rounding_quantum",
        "brick_size",
        "quantization",
        "weight_compressed_offsets",
        "element_size_bytes",
        "block_traversal",
        "equivalence_id",
        "resampling_mode",
        "avoid_NHCWB16",
    )
    AllocationQuantum = 16

    def __init__(self, shape: Shape, dtype: DataType, name: str):
        self.shape = shape
        self.storage_shape = shape
        self.bandwidth_shape = shape
        self.dtype = dtype
        self.name = name
        self.equivalence_id: UUID = uuid.uuid4()

        self.ops: List[Operation] = []
        self.consumer_list: List[Operation] = []

        self.values: Optional[np.ndarray] = None
        self.quant_values: Optional[np.ndarray] = None
        self.compressed_values: Optional[np.ndarray] = None
        self.compressed_values_substream_offsets: Optional[List] = None
        self.mem_area: MemArea = MemArea.Unknown
        self.mem_type: MemType = MemType.Unknown
        self.format: TensorFormat = TensorFormat.Unknown
        self.purpose: TensorPurpose = TensorPurpose.Unknown
        self.sub_purpose: TensorSubPurpose = TensorSubPurpose.Standard
        self.alignment: int = Tensor.AllocationQuantum
        self.weight_transpose_depthwise: bool = False

        self.storage_compression_scale: float = 1.0
        self.bandwidth_compression_scale: float = 1.0
        self.compression_scale_for_worst_weight_stream: float = 1.0
        self.weight_compression_scales: Optional[np.ndarray] = None
        # if two tensors have the same weight_compression_config, then they have the same compressed values
        self.weight_compression_config = None
        # if two tensors have the same value_id, then they have the same values
        self.value_id: UUID = uuid.uuid4()
        self.weight_compressed_offsets: List = []
        self.storage_rounding_quantum: Tuple = (1, 1, 1, 1)
        self.brick_size: Tuple = (1, 1, 1, 1)
        self.element_size_bytes: int = 0

        # quantization parameters
        self.quantization: Optional[QuantizationParameters] = None
        self.block_traversal: TensorBlockTraversal = TensorBlockTraversal.Default
        self.resampling_mode: resampling_mode = resampling_mode.NONE

        self.avoid_NHCWB16: bool = False

    @property
    def address(self) -> int:
        return TensorAddressMap.get_address_for_tens(self.equivalence_id, self.mem_type)

    @address.setter
    def address(self, address: int):
        TensorAddressMap.set_address_for_tens(self.equivalence_id, self.mem_type, address)

    def element_size(self) -> int:
        if self.element_size_bytes == 0:
            return self.dtype.size_in_bits() / 8
        return self.element_size_bytes

    # Returns a copy, renamed to self.name + suffix
    # The references to Operators will be empty when returned
    # Depending on set_unique, the copy is shallow, or deep
    # For set_unique == True, a new equivalence_id will be set
    def clone(self, suffix="_clone", set_unique: bool = False) -> "Tensor":
        if set_unique:
            res = copy.deepcopy(self)
            res.equivalence_id = uuid.uuid4()
        else:
            res = copy.copy(self)
            res.storage_shape = list(self.storage_shape)
            res.bandwidth_shape = list(self.bandwidth_shape)
            if self.quantization is not None:
                res.quantization = self.quantization.clone()

        res.name = res.name + suffix
        res.ops = []
        res.consumer_list = []

        return res
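
    # Illustrative example of clone: `t.clone()` shares t's equivalence_id (and
    # therefore its allocated address), whereas `t.clone(set_unique=True)` is a
    # deep copy with a fresh equivalence_id.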

    def clone_into_fast_storage(self, arch) -> "Tensor":
        res = self.clone(suffix="_fast_storage")
        res.mem_area = arch.fast_storage_mem_area
        res.mem_type = MemType.Scratch_fast
        return res

    def copy_compressed_weight_info(self, src_tens: "Tensor"):
        # Copies compressed values + all related weight compression info from the given tensor
        self.equivalence_id = src_tens.equivalence_id
        self.compressed_values = src_tens.compressed_values
        self.compressed_values_substream_offsets = src_tens.compressed_values_substream_offsets
        self.storage_shape = src_tens.storage_shape
        self.brick_size = src_tens.brick_size
        self.weight_compression_scales = src_tens.weight_compression_scales
        self.weight_compressed_offsets = src_tens.weight_compressed_offsets
        self.weight_transpose_depthwise = src_tens.weight_transpose_depthwise
        self.compression_scale_for_worst_weight_stream = src_tens.compression_scale_for_worst_weight_stream
        self.storage_compression_scale = src_tens.storage_compression_scale
        self.bandwidth_compression_scale = src_tens.bandwidth_compression_scale
        self.block_traversal = src_tens.block_traversal
        self.weight_compression_config = src_tens.weight_compression_config
        self.value_id = src_tens.value_id

    def set_format(self, fmt: TensorFormat, arch):
        self.format = fmt
        shape_len = 0
        try:
            shape_len = len(self.shape)
        except TypeError:
            pass

        if shape_len > 4:
            return
        self.storage_rounding_quantum = arch.storage_rounding_quantums[self.format]
        self.storage_rounding_quantum = tuple(self.storage_rounding_quantum[-shape_len:])
        self.brick_size = arch.brick_sizes[self.format]
        self.brick_size = tuple(self.brick_size[-shape_len:])
        if self.shape is None:
            return

        self.bandwidth_shape = shape_round_to_quantum(self.shape, self.brick_size)
        self.storage_shape = shape_round_to_quantum(self.shape, self.storage_rounding_quantum)

        if fmt == TensorFormat.WeightsCompressed:
            compression_ratio = 5 / 8
            self.storage_compression_scale = compression_ratio
            self.bandwidth_compression_scale = compression_ratio
            self.compression_scale_for_worst_weight_stream = compression_ratio
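
    # Illustrative example of set_format, assuming an architecture whose
    # NHCWB16 storage rounding quantum is (1, 1, 1, 16): a tensor of shape
    # [1, 8, 8, 20] gets storage_shape [1, 8, 8, 32], i.e. the C-dimension
    # is padded up to a multiple of 16.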

    def storage_elements(self) -> int:
        elems = shape_num_elements(self.storage_shape)
        if elems is None:
            return 0
        return elems

    def elements(self) -> int:
        elems = shape_num_elements(self.shape)
        if elems is None:
            return 0
        return elems

    def has_fully_defined_shape(self) -> bool:
        return shape_fully_defined(self.shape)

    def storage_size(self, scale: float = 1.0) -> int:
        raw_size = self.storage_elements() * self.element_size() * scale
        if raw_size == 0:
            raw_size = 1  # force it to take up space
        rounded_size = numeric_util.round_up(numeric_util.round_up_to_int(raw_size), self.alignment)
        return rounded_size
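
    # Illustrative example of storage_size: an int8 tensor with storage_shape
    # [1, 1, 1, 10] has a raw size of 10 bytes, rounded up to the tensor's
    # alignment (Tensor.AllocationQuantum == 16 by default), giving 16.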

    def storage_size_for_sub_purpose(
        self, arch, sub_purpose: TensorSubPurpose, param_a: Optional[int] = None, param_b: Optional[int] = None
    ) -> int:
        alt_shape = self.storage_shape_for_sub_purpose(sub_purpose, param_a, param_b)
        elems = shape_num_elements(alt_shape)
        if elems is None:
            return 0
        if sub_purpose == TensorSubPurpose.DoubleBuffer:
            raw_size = (
                elems
                * self.element_size()
                * self.compression_scale_for_worst_weight_stream
                * arch.weight_estimation_scaling
            )
        else:
            # Rolling buffers are used for intermediate data in ifm streaming
            # These will all use the NHCWB16 format, and need to be aligned to 16 in the C-dimension
            if alt_shape[-1] % 16 != 0:
                nhcwb16_shape = alt_shape[0:-1] + [numeric_util.round_up(alt_shape[-1], 16)]
                elems = shape_num_elements(nhcwb16_shape)

            raw_size = elems * self.element_size() * self.storage_compression_scale
        rounded_size = numeric_util.round_up(numeric_util.round_up_to_int(raw_size), self.alignment)
        return rounded_size

    def storage_shape_for_sub_purpose(
        self, sub_purpose: TensorSubPurpose, param_a: Optional[int], param_b: Optional[int]
    ) -> Shape:
        if sub_purpose == TensorSubPurpose.DoubleBuffer:
            shp = list(self.shape)
            assert len(shp) >= 2
            assert param_a is not None
            shp[-1] = min(shp[-1], param_a * 2)
        else:
            shp = list(self.storage_shape)
            if sub_purpose == TensorSubPurpose.RollingBufferX:
                assert len(shp) == 4
                assert param_a is not None
                shp[0] = 1
                shp[2] = min(shp[2], param_a)
            elif sub_purpose == TensorSubPurpose.RollingBufferY:
                assert len(shp) == 4
                assert param_a is not None
                shp[0] = 1
                shp[1] = min(shp[1], param_a)
            elif sub_purpose == TensorSubPurpose.RollingBufferXY:
                assert len(shp) == 4
                assert param_a is not None
                assert param_b is not None
                shp[0] = 1
                shp[2] = min(shp[2], param_a)
                shp[1] = min(shp[1], param_b)
            elif sub_purpose == TensorSubPurpose.Standard:
                pass
            else:
                assert 0, "did not expect new sub purpose %s" % (sub_purpose,)

        return shp

    def set_new_sub_purpose(self, sub_purpose: TensorSubPurpose, param_a=None, param_b=None):
        self.storage_shape = self.storage_shape_for_sub_purpose(sub_purpose, param_a, param_b)
        self.sub_purpose = sub_purpose
        if sub_purpose == TensorSubPurpose.DoubleBuffer:
            self.storage_compression_scale = self.compression_scale_for_worst_weight_stream

    def bandwidth(self) -> float:
        elems = shape_num_elements(self.bandwidth_shape)
        if elems is None:
            return 0
        return elems * self.element_size() * self.bandwidth_compression_scale

    def consumers(self) -> List[Operation]:
        return self.consumer_list

    def addresses_for_rolling_buffer(self, start_coord: Shape, end_coord: Shape) -> Tuple:
        # returns ( box_height0, box_height1, box_width, [address_tl, address_tr, address_bl, address_br] )

        if len(start_coord) < 4:
            box_height0 = 1
            box_width = 1

            if len(start_coord) >= 2:
                box_width = end_coord[-2] - start_coord[-2]

            return box_height0, box_height0, box_width, [self.address_for_coordinate(start_coord), None, None, None]

        crossing_y = numeric_util.round_up(start_coord[1] + 1, self.storage_shape[1])
        crossing_x = numeric_util.round_up(start_coord[2] + 1, self.storage_shape[2])

        crossing_y = min(crossing_y, end_coord[1])
        crossing_x = min(crossing_x, end_coord[2])

        box_height0 = crossing_y - start_coord[1]
        box_width = crossing_x - start_coord[2]

        addresses: List = [None] * 4
        addresses[0] = self.address_for_coordinate(start_coord)

        if end_coord[2] > crossing_x:
            addresses[1] = self.address_for_coordinate([start_coord[0], start_coord[1], crossing_x, start_coord[3]])
            raise UnsupportedFeatureError("Striping in vertical direction is not supported")
        if end_coord[1] > crossing_y:
            addresses[2] = self.address_for_coordinate([start_coord[0], crossing_y, start_coord[2], start_coord[3]])
        if end_coord[1] > crossing_y and end_coord[2] > crossing_x:
            addresses[3] = self.address_for_coordinate([start_coord[0], crossing_y, crossing_x, start_coord[3]])

        return box_height0, box_height0, box_width, addresses

    def address_for_coordinate(self, coord: Shape, is_top_box: bool = False) -> int:
        offset = self.address_offset_for_coordinate(coord, is_top_box)
        assert offset is not None
        return self.address + offset

    def get_strides_and_coord(self, coord: Optional[Shape] = None) -> Tuple[Optional[Shape], Optional[Shape]]:
        if coord is None:
            coord = [0] * len(self.storage_shape)

        augmented_coord = coord
        augmented_shape = self.storage_shape
        while len(augmented_shape) < 4:
            augmented_shape = [1] + augmented_shape

        while len(augmented_coord) < 4:
            augmented_coord = [0] + augmented_coord

        assert len(augmented_coord) == len(augmented_shape)

        if self.format == TensorFormat.NHWC:
            augmented_shape = [augmented_shape[0], augmented_shape[3]] + augmented_shape[1:3] + [1]
            augmented_coord = [augmented_coord[0], augmented_coord[3]] + augmented_coord[1:3] + [0]

        elif self.format == TensorFormat.NHCWB16:
            channel_divisor = 16
            augmented_shape = augmented_shape[0:4] + [1]
            augmented_coord = (
                [augmented_coord[0], augmented_coord[3] // channel_divisor]
                + augmented_coord[1:3]
                + [augmented_coord[3] % channel_divisor]
            )

            if augmented_shape[1] == 0:
                augmented_shape[1] = 1

        else:
            assert self.format in (TensorFormat.Unknown, TensorFormat.WeightsCompressed)
            return None, None

        strides: List = [0] * len(augmented_shape)
        stride = self.element_size() * self.storage_compression_scale

        if self.format != TensorFormat.NHCWB16:
            stride_order = [4, 1, 3, 2, 0]
            for i in stride_order:
                strides[i] = stride
                stride *= augmented_shape[i]
        else:
            assert len(strides) == 5
            strides[4] = stride
            strides[3] = 16 * stride  # STRIDE_X
            strides[1] = strides[3] * augmented_shape[2]  # STRIDE_C
            strides[2] = augmented_shape[2] * augmented_shape[3] * stride  # STRIDE_Y
            strides[0] = strides[2] * augmented_shape[1]  # STRIDE_N

        return strides, augmented_coord
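
    # Illustrative example of get_strides_and_coord (NHWC, 1-byte elements,
    # storage_shape [1, 2, 3, 4]): the augmented shape is [1, 4, 2, 3, 1]
    # (N, C, H, W, 1) and the returned strides are [24, 1, 12, 4, 1], i.e.
    # channels are contiguous in memory.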

    def get_strides(self) -> Shape:
        strides, _ = self.get_strides_and_coord()
        assert strides is not None
        return strides

    def needs_dma(self) -> bool:
        return len(self.ops) == 1 and self.ops[0].type == Op.DMA

    def get_dma_src_tensor(self) -> "Optional[Tensor]":
        # For weight tensors that need DMA: returns the source tensor in Flash, else None
        # Note: for DMA ops, Pass.weight_tensor is referring to the SRAM weight tensor
        return self.ops[0].inputs[0] if self.needs_dma() else None

    def find_npu_op(self) -> Optional[Operation]:
        # Returns the NPU operator that uses this tensor, excluding DMA operators.
        for op in self.consumers():
            if op.type == Op.DMA:
                return op.outputs[0].find_npu_op()
            if op.run_on_npu:
                return op
        return None

    def compressed_stream_index_from_coord(self, coord: Shape) -> int:
        assert self.format == TensorFormat.WeightsCompressed
        assert self.compressed_values is not None
        assert len(self.compressed_values) > 0
        assert len(self.compressed_values) + 1 == len(self.weight_compressed_offsets)

        depth = coord[-1]
        brick_depth = self.brick_size[-1]
        # Clamp position at final element index
        if depth > self.shape[-1]:
            depth = self.shape[-1]

        # Always round up to next boundary
        index = numeric_util.round_up_divide(depth, brick_depth)

        # Check boundaries on all but last weight set (which may be shorter
        # than the brick we divided it up into)
        if index < len(self.weight_compressed_offsets) - 1:
            # There are no half-way points in the weights
            if (depth % brick_depth) != 0:
                raise UnsupportedFeatureError("Offset into weights must be aligned to a brick")

        return index

    def size_of_compressed_stream(self, index: int) -> int:
        assert self.compressed_values is not None
        assert 0 <= index < len(self.compressed_values)
        return len(self.compressed_values[index])

    def is_last_index_in_compressed_stream(self, index: int) -> bool:
        assert self.compressed_values is not None
        assert 0 <= index < len(self.compressed_values)
        return index == len(self.compressed_values) - 1

    def address_offset_for_coordinate(self, orig_coord: Shape, is_top_box: bool = False) -> Optional[int]:
        address_offset = 0
        coord = orig_coord

        coord = coord[-len(self.storage_shape) :]

        if self.sub_purpose == TensorSubPurpose.Standard:
            for idx, c in enumerate(coord):
                if is_top_box:
                    assert c > 0 and c <= self.shape[idx]
                else:
                    assert c >= 0 and c < self.shape[idx]

        if self.format == TensorFormat.WeightsCompressed:
            if len(self.weight_compressed_offsets) == 0:
                return 0

            if self.needs_dma() and self.sub_purpose == TensorSubPurpose.DoubleBuffer:
                depth = orig_coord[-1]
                brick_depth = self.brick_size[-1]
                # Clamp position at final element index
                if depth > self.shape[-1]:
                    depth = self.shape[-1]

                # Always round up to next boundary
                index = numeric_util.round_up_divide(depth, brick_depth)
                index = index % 2
                assert self.compressed_values is not None

                if len(self.compressed_values) <= 2:
                    if is_top_box and index == 0:
                        for cv in self.compressed_values:
                            address_offset += len(cv)
                    else:
                        address_offset = index * len(self.compressed_values[0])
                else:
                    if is_top_box and index == 0:
                        address_offset = self.storage_shape[-1]
                    else:
                        address_offset = index * (self.storage_shape[-1] // 2)
            else:
                index = self.compressed_stream_index_from_coord(orig_coord)
                assert index < len(self.weight_compressed_offsets)
                address_offset = self.weight_compressed_offsets[index]
        else:
            if is_top_box:
                coord = [c - 1 for c in coord]

            # handle wraparound for partial buffers. make sure to do this after subtracting top box:
            coord = [c % self.storage_shape[idx] for idx, c in enumerate(coord)]

            strides, augmented_coord = self.get_strides_and_coord(coord)
            if strides is None:
                return None

            if is_top_box:
                address_offset += 1 * strides[-1]  # one element

            address_offset += np.dot(augmented_coord, strides)

        assert address_offset >= 0
        assert address_offset <= self.storage_size()
        return address_offset

    def is_allocated_in_tensor_arena(self, scratch_tensor_mem_area: MemArea) -> bool:
        return (self.mem_area == scratch_tensor_mem_area) and (self.mem_type in (MemType.Scratch, MemType.Scratch_fast))

    def equivalent(self, tens: "Tensor") -> bool:
        return self.equivalence_id == tens.equivalence_id

    def set_all_shapes(self, shape: Shape):
        self.shape = shape
        self.storage_shape = shape
        self.bandwidth_shape = shape

    def get_full_shape(self) -> Shape:
        d = len(self.shape)
        if d in (1, 3):
            return numeric_util.full_shape(4, self.shape, 1)
        elif d == 2:
            return [self.shape[0], 1, 1, self.shape[1]]
        else:
            return self.shape.copy()
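
    # Illustrative examples of get_full_shape:
    #   shape [10] yields [1, 1, 1, 10]
    #   shape [10, 20] yields [10, 1, 1, 20]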

    def is_quantized(self) -> bool:
        # a tensor is quantized if it has an integral type and it contains valid quantization params

        if not isinstance(self.quantization, QuantizationParameters):
            return False

        return (self.dtype.type & BaseType.Int) != 0 and self.quantization.is_valid()

    def __lt__(self, other: "Tensor") -> bool:
        return self.equivalence_id < other.equivalence_id

    def __str__(self):
        return "<nng.Tensor '%s' shape=%s dtype=%s>" % (self.name, self.shape, self.dtype)

    __repr__ = __str__

    def error(self, msg):
        """
        Raises a VelaError exception for errors encountered when parsing a Tensor

        :param self: Tensor object that resulted in the error
        :param msg: str object that contains a description of the specific error encountered
        """

        def _print_operators(ops):
            lines = []
            for idx, op in enumerate(ops):
                op_type = getattr(op, "type", "Not an Operation")
                op_id = getattr(op, "op_index", "-")
                lines.append(f"        {idx} = {op_type} ({op_id})")
            return lines

        lines = [f"Invalid {self.name} tensor. {msg}"]

        lines += ["    Driving operators:"]
        lines += _print_operators(self.ops)

        lines += ["    Consuming operators:"]
        lines += _print_operators(self.consumer_list)

        raise VelaError("\n".join(lines))


def check_quantized_tens_scaling_equal(tens_a: Tensor, tens_b: Tensor) -> bool:
    # checks that the scaling of two quantized tensors is equal

    return tens_a.is_quantized() and tens_b.is_quantized() and tens_a.quantization.is_scaling_equal(tens_b.quantization)