# Copyright (C) 2020 Arm Limited or its affiliates. All rights reserved.
#
# SPDX-License-Identifier: Apache-2.0
#
# Licensed under the Apache License, Version 2.0 (the License); you may
# not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an AS IS BASIS, WITHOUT
# WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
# Description:
# Internal representation of a Neural Network Tensor.
import copy
import enum
import uuid
from collections import defaultdict
from enum import auto
from functools import lru_cache
from functools import total_ordering
from typing import Dict
from typing import List
from typing import Optional
from typing import Tuple
from typing import Union
from uuid import UUID

import numpy as np

from . import numeric_util
from .data_type import BaseType
from .data_type import DataType
from .errors import UnsupportedFeatureError
from .errors import VelaError
from .ethos_u55_regs.ethos_u55_regs import resampling_mode
from .numeric_util import full_shape
from .operation import Op
from .operation import Operation

Shape = List


class MemType(enum.IntFlag):
    Unknown = 0
    Permanent_NPU = 1
    Permanent_CPU = 2
    Scratch = 3
    Scratch_fast = 4
    Size = Scratch_fast + 1

    def display_name(self) -> str:
        return ("Unknown", "Permanent_NPU", "Permanent_CPU", "Scratch", "Scratch_fast", "Size")[self.value]

    def identifier_name(self) -> str:
        return ("unknown", "permanent_npu", "permanent_cpu", "scratch", "scratch_fast", "size")[self.value]

    @staticmethod
    def all():
        return (MemType.Permanent_NPU, MemType.Permanent_CPU, MemType.Scratch, MemType.Scratch_fast)

    def __str__(self):
        return self.name


class BandwidthDirection(enum.IntEnum):
    Read = 0
    Write = auto()
    Size = auto()

    def display_name(self):
        return self.name

    def identifier_name(self):
        return self.name.lower()

    @staticmethod
    def all():
        return (BandwidthDirection.Read, BandwidthDirection.Write)


class MemArea(enum.IntFlag):
    Unknown = 0
    Sram = 1
    Dram = 2
    OnChipFlash = 3
    OffChipFlash = 4
    Shram = 5  # for LUT
    Size = Shram + 1

    def display_name(self) -> str:
        return ("Unknown", "SRAM", "DRAM", "On-chip Flash", "Off-chip Flash", "SHRAM", "Size")[self.value]

    def identifier_name(self) -> str:
        return ("unknown", "sram", "dram", "on_chip_flash", "off_chip_flash", "shram", "size")[self.value]

    @staticmethod
    def all():
        return (MemArea.Sram, MemArea.Dram, MemArea.OnChipFlash, MemArea.OffChipFlash, MemArea.Shram)

    def __str__(self):
        return self.name


class TensorPurpose(enum.IntFlag):
    Unknown = 0
    Weights = 1
    FeatureMap = 2
    Scratch = 3
    LUT = 4
    FSBias = 5
    Size = 6

    def display_name(self) -> str:
        return ("Unknown", "Weights", "FeatureMap", "Scratch", "LUT", "FastStorageBias", "Size")[self.value]

    def identifier_name(self) -> str:
        return ("unknown", "weights", "feature_map", "scratch", "lut", "fast_storage_bias", "size")[self.value]

    @staticmethod
    def all():
        return (TensorPurpose.Weights, TensorPurpose.FeatureMap, TensorPurpose.FSBias)


class TensorSubPurpose(enum.Enum):
    Standard = 0
    DoubleBuffer = 1
    RollingBufferX = 2
    RollingBufferY = 3
    RollingBufferXY = 4

    def display_name(self) -> str:
        return ("Standard", "Double Buffer", "Rolling Buffer X", "Rolling Buffer Y", "Rolling Buffer XY")[self.value]

    def identifier_name(self) -> str:
        return ("standard", "double_buffer", "rolling_buffer_x", "rolling_buffer_y", "rolling_buffer_xy")[self.value]

    @staticmethod
    def all():
        return (
            TensorSubPurpose.Standard,
            TensorSubPurpose.DoubleBuffer,
            TensorSubPurpose.RollingBufferX,
            TensorSubPurpose.RollingBufferY,
            TensorSubPurpose.RollingBufferXY,
        )


class TensorFormat(enum.Flag):
    Unknown = 0
    WeightsCompressed = 1
    NHWC = 2
    NHCWB16 = 3

    def __str__(self):
        return self.name


class TensorBlockTraversal(enum.Enum):
    Default = 0
    DepthWise = 1
    DepthFirst = 2
    PartKernelFirst = 3


def shape_num_elements(shp: Shape) -> Optional[int]:
    elems = 1
    if shp is None:
        return None
    for d in shp:
        if d is None:
            return None
        elems *= d
    return elems


def shape_fully_defined(shp: Shape) -> bool:
    if shp is None:
        return False
    for d in shp:
        if d is None:
            return False
    return True


def shape_round_to_quantum(shp: Shape, quantum: Tuple) -> Shape:
    new_shp = list(shp)

    # Traverse backwards using length of shape since there may be more rounding quantums than shape elements
    for i in range(-1, -len(shp) - 1, -1):
        if new_shp[i] is not None:
            new_shp[i] = numeric_util.round_up(new_shp[i], quantum[i])
    return new_shp

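# Usage sketch (illustrative, not part of the original file): rounding a shape
# to the NHCWB16 brick quantum pads the innermost (depth) axis up to a
# multiple of 16 and leaves already-aligned axes untouched:
#
#     shape_round_to_quantum([1, 8, 8, 25], (1, 1, 1, 16))  # -> [1, 8, 8, 32]
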
@lru_cache(maxsize=None)
def create_equivalence_id(key) -> UUID:
    # Generates equivalence_id based on the given key.
    return uuid.uuid4()

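# Note on the caching above (an illustrative aside, not in the original file):
# the lru_cache makes the id deterministic per key, so repeated calls with an
# equal key return the same UUID, while distinct keys get unrelated ones:
#
#     a = create_equivalence_id(("bias", 1.0))
#     b = create_equivalence_id(("bias", 1.0))
#     assert a == b
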
class QuantizationParameters:
    __slots__ = "min", "max", "num_bits", "narrow_range", "scale_f32", "zero_point", "quant_min", "quant_max"

    def __init__(
        self,
        min: Union[float, np.ndarray, None] = None,
        max: Union[float, np.ndarray, None] = None,
        num_bits=None,
        narrow_range=None,
    ):
        self.min = min
        self.max = max

        self.num_bits = num_bits
        self.narrow_range = narrow_range

        self.scale_f32: Union[float, np.ndarray, None] = None
        self.zero_point: Union[int, np.ndarray, None] = None
        self.quant_min: Optional[float] = None
        self.quant_max: Optional[float] = None

    def __str__(self):
        return "<nng.QuantizationParameters min=%s max=%s, num_bits=%s, scale=%s, zero_point=%s>" % (
            self.min,
            self.max,
            self.num_bits,
            self.scale_f32,
            self.zero_point,
        )

    __repr__ = __str__

    def clone(self) -> "QuantizationParameters":
        res = QuantizationParameters()
        res.min = self.min
        res.max = self.max

        res.num_bits = self.num_bits
        res.narrow_range = self.narrow_range

        res.scale_f32 = self.scale_f32
        res.zero_point = self.zero_point
        res.quant_min = self.quant_min
        res.quant_max = self.quant_max
        return res

    def dequantize(self, values):
        if self.zero_point.size == 1 and self.scale_f32.size == 1:
            # same scale is used for all values
            res = (values.astype(np.float64) - self.zero_point) * self.scale_f32
        else:
            # a different scale is used for different sets of values
            values_as_float = values.astype(np.float64)

            # this is not compatible with the format of depthwise weights,
            # where input is at index 3 (Output, Kh, Kw, Input)
            # return the quantized values
            return np.ndarray((values_as_float.shape))

        return res

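    # Minimal sketch of the per-tensor dequantize path (illustrative values):
    # the result is (values - zero_point) * scale_f32, computed in float64:
    #
    #     qp = QuantizationParameters()
    #     qp.scale_f32 = np.array(0.5)
    #     qp.zero_point = np.array(128)
    #     qp.dequantize(np.array([128, 130]))  # -> array([0., 1.])
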
    def is_scaling_equal(self, other: Optional["QuantizationParameters"]) -> bool:
        # quantisation parameter scaling is not equal if 'other' is None because
        # it implies that the tensor it belongs to is not quantised. otherwise,
        # it depends upon whether the scale and zero point are equal

        if not isinstance(other, QuantizationParameters):
            return False

        return self.scale_f32 == other.scale_f32 and self.zero_point == other.zero_point

    def is_valid(self) -> bool:
        # quantisation parameters are considered valid if they have a scale and zero point

        return None not in (self.scale_f32, self.zero_point)

    def is_per_axis(self) -> bool:
        """Returns True if either the scale, zero point, minimum or maximum values are arrays"""
        for attr in ("scale_f32", "zero_point", "min", "max"):
            if isinstance(getattr(self, attr), np.ndarray):
                return True
        return False


def create_const_tensor(
    name: str,
    shape: Shape,
    dtype: DataType,
    values: np.ndarray,
    value_dtype: np.dtype = None,
    purpose: TensorPurpose = TensorPurpose.Unknown,
    quantization: QuantizationParameters = None,
):
    # Tensor
    const_tensor = Tensor(shape, dtype, name + "_0")
    const_tensor.purpose = purpose
    const_tensor.quantization = quantization
    const_tensor.values = np.array(values, dtype=value_dtype)
    const_tensor.quant_values = np.frombuffer(const_tensor.values.tobytes(), dtype=np.uint8)
    # Operator
    const_op = Operation(Op.Const, name)
    const_op.set_output_tensor(const_tensor)
    return const_tensor

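# Usage sketch (hypothetical name and values, not from the original file):
#
#     t = create_const_tensor("bias", [1], DataType.int32, [42])
#     assert t.ops[0].type == Op.Const  # the helper wires up a producing Const op
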
def create_reshape_tensor(tens, shape, ifm_reshape=True):
    if shape == tens.shape:
        return tens
    # Tensors
    name = tens.name + "_reshape"
    reshape_ifm = tens
    reshape_ofm = tens.clone("_reshaped")
    reshape_ofm.set_all_shapes(shape)
    if not ifm_reshape:
        reshape_ifm, reshape_ofm = reshape_ofm, reshape_ifm
    # Operator
    reshape_op = Operation(Op.Reshape, name)
    reshape_op.attrs["new_shape"] = shape
    reshape_op.add_input_tensor(reshape_ifm)
    reshape_op.add_input_tensor(create_const_tensor(name + "_shape", [1], DataType.int32, shape))
    reshape_op.set_output_tensor(reshape_ofm)
    reshape_op.ifm_shapes.append(full_shape(4, reshape_ifm.shape, 1))
    reshape_op.ofm_shapes.append(full_shape(4, reshape_ofm.shape, 1))
    return reshape_ofm if ifm_reshape else reshape_ifm


# class that keeps track of all tensor addresses in the different memory types
class TensorAddressMap:
    address_map: Dict = defaultdict(dict)  # dict (tens.equivalence_id -> dict (mem_type -> address))

    @classmethod
    def get_address_for_tens(cls, tens_id: UUID, mem_type: MemType) -> int:
        return cls.address_map[tens_id].get(mem_type)

    @classmethod
    def set_address_for_tens(cls, tens_id: UUID, mem_type: MemType, address: int):
        # Check previous address if there is one
        previous_address = cls.address_map[tens_id].get(mem_type)
        if address is not None and previous_address is not None:
            assert previous_address == address, "Two different addresses cannot be assigned to the same tensor."

        # Set tensor's address for memory type
        cls.address_map[tens_id][mem_type] = address

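# Illustrative use of the address book (tens is a hypothetical Tensor):
# addresses are keyed by equivalence_id, so tensors that share an
# equivalence_id also share their allocated address, which is why
# Tensor.address below is a property rather than a plain attribute:
#
#     TensorAddressMap.set_address_for_tens(tens.equivalence_id, MemType.Scratch, 64)
#     TensorAddressMap.get_address_for_tens(tens.equivalence_id, MemType.Scratch)  # -> 64
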
@total_ordering
class Tensor:
    __slots__ = (
        "shape",
        "storage_shape",
        "bandwidth_shape",
        "dtype",
        "name",
        "ops",
        "consumer_list",
        "values",
        "quant_values",
        "compressed_values",
        "compressed_values_substream_offsets",
        "mem_area",
        "mem_type",
        "format",
        "purpose",
        "sub_purpose",
        "alignment",
        "weight_transpose_depthwise",
        "storage_compression_scale",
        "bandwidth_compression_scale",
        "compression_scale_for_worst_weight_stream",
        "weight_compression_scales",
        "weight_compression_config",
        "value_id",
        "storage_rounding_quantum",
        "brick_size",
        "quantization",
        "weight_compressed_offsets",
        "element_size_bytes",
        "block_traversal",
        "equivalence_id",
        "resampling_mode",
        "avoid_NHCWB16",
    )
    AllocationQuantum = 16

    def __init__(self, shape: Shape, dtype: DataType, name: str):
        self.shape = shape
        self.storage_shape = shape
        self.bandwidth_shape = shape
        self.dtype = dtype
        self.name = name
        self.equivalence_id: UUID = uuid.uuid4()

        self.ops: List[Operation] = []
        self.consumer_list: List[Operation] = []

        self.values: Optional[np.ndarray] = None
        self.quant_values: Optional[np.ndarray] = None
        self.compressed_values: Optional[np.ndarray] = None
        self.compressed_values_substream_offsets: Optional[List] = None
        self.mem_area: MemArea = MemArea.Unknown
        self.mem_type: MemType = MemType.Unknown
        self.format: TensorFormat = TensorFormat.Unknown
        self.purpose: TensorPurpose = TensorPurpose.Unknown
        self.sub_purpose: TensorSubPurpose = TensorSubPurpose.Standard
        self.alignment: int = Tensor.AllocationQuantum
        self.weight_transpose_depthwise: bool = False

        self.storage_compression_scale: float = 1.0
        self.bandwidth_compression_scale: float = 1.0
        self.compression_scale_for_worst_weight_stream: float = 1.0
        self.weight_compression_scales: Optional[np.ndarray] = None
        # if two tensors have the same weight_compression_config, then they have the same compressed values
        self.weight_compression_config = None
        # if two tensors have the same value_id, then they have the same values
        self.value_id: UUID = uuid.uuid4()
        self.weight_compressed_offsets: List = []
        self.storage_rounding_quantum: Tuple = (1, 1, 1, 1)
        self.brick_size: Tuple = (1, 1, 1, 1)
        self.element_size_bytes: int = 0

        # quantization parameters
        self.quantization: Optional[QuantizationParameters] = None
        self.block_traversal: TensorBlockTraversal = TensorBlockTraversal.Default
        self.resampling_mode: resampling_mode = resampling_mode.NONE

        self.avoid_NHCWB16: bool = False

    @property
    def address(self) -> int:
        return TensorAddressMap.get_address_for_tens(self.equivalence_id, self.mem_type)

    @address.setter
    def address(self, address: int):
        TensorAddressMap.set_address_for_tens(self.equivalence_id, self.mem_type, address)

    def element_size(self) -> int:
        if self.element_size_bytes == 0:
            return self.dtype.size_in_bits() / 8
        return self.element_size_bytes

    # Returns a copy, renamed to self.name + suffix
    # The references to Operators will be empty when returned
    # Depending on set_unique, the copy is shallow, or deep
    # For set_unique==True, a new equivalence_id will be set
    def clone(self, suffix="_clone", set_unique: bool = False) -> "Tensor":
        if set_unique:
            res = copy.deepcopy(self)
            res.equivalence_id = uuid.uuid4()
        else:
            res = copy.copy(self)
            res.storage_shape = list(self.storage_shape)
            res.bandwidth_shape = list(self.bandwidth_shape)
            if self.quantization is not None:
                res.quantization = self.quantization.clone()

        res.name = res.name + suffix
        res.ops = []
        res.consumer_list = []

        return res

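    # Illustrative behaviour of clone() (not part of the original file): a
    # plain clone keeps the equivalence_id, and therefore shares any assigned
    # address, while set_unique=True deep-copies and assigns a fresh id:
    #
    #     alias = tens.clone()                 # alias.equivalent(tens) -> True
    #     fresh = tens.clone(set_unique=True)  # fresh.equivalent(tens) -> False
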
    def clone_into_fast_storage(self, arch) -> "Tensor":
        res = self.clone(suffix="_fast_storage")
        res.mem_area = arch.fast_storage_mem_area
        res.mem_type = MemType.Scratch_fast
        return res

    def copy_compressed_weight_info(self, src_tens: "Tensor"):
        # Copies compressed values + all related weight compression info from the given tensor
        self.equivalence_id = src_tens.equivalence_id
        self.compressed_values = src_tens.compressed_values
        self.compressed_values_substream_offsets = src_tens.compressed_values_substream_offsets
        self.storage_shape = src_tens.storage_shape
        self.brick_size = src_tens.brick_size
        self.weight_compression_scales = src_tens.weight_compression_scales
        self.weight_compressed_offsets = src_tens.weight_compressed_offsets
        self.weight_transpose_depthwise = src_tens.weight_transpose_depthwise
        self.compression_scale_for_worst_weight_stream = src_tens.compression_scale_for_worst_weight_stream
        self.storage_compression_scale = src_tens.storage_compression_scale
        self.bandwidth_compression_scale = src_tens.bandwidth_compression_scale
        self.block_traversal = src_tens.block_traversal
        self.weight_compression_config = src_tens.weight_compression_config
        self.value_id = src_tens.value_id

    def set_format(self, fmt: TensorFormat, arch):
        self.format = fmt
        shape_len = 0
        try:
            shape_len = len(self.shape)
        except TypeError:
            pass

        if shape_len > 4:
            return
        self.storage_rounding_quantum = arch.storage_rounding_quantums[self.format]
        self.storage_rounding_quantum = tuple(self.storage_rounding_quantum[-shape_len:])
        self.brick_size = arch.brick_sizes[self.format]
        self.brick_size = tuple(self.brick_size[-shape_len:])
        if self.shape is None:
            return

        self.bandwidth_shape = shape_round_to_quantum(self.shape, self.brick_size)
        self.storage_shape = shape_round_to_quantum(self.shape, self.storage_rounding_quantum)

        if fmt == TensorFormat.WeightsCompressed:
            compression_ratio = 5 / 8
            self.storage_compression_scale = compression_ratio
            self.bandwidth_compression_scale = compression_ratio
            self.compression_scale_for_worst_weight_stream = compression_ratio

    def storage_elements(self) -> int:
        elems = shape_num_elements(self.storage_shape)
        if elems is None:
            return 0
        return elems

    def elements(self) -> int:
        elems = shape_num_elements(self.shape)
        if elems is None:
            return 0
        return elems

    def has_fully_defined_shape(self) -> bool:
        return shape_fully_defined(self.shape)

    def storage_size(self, scale: float = 1.0) -> int:
        raw_size = self.storage_elements() * self.element_size() * scale
        if raw_size == 0:
            raw_size = 1  # force it to take up space
        rounded_size = numeric_util.round_up(numeric_util.round_up_to_int(raw_size), self.alignment)
        return rounded_size

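    # Worked example (illustrative numbers): an int8 tensor with storage_shape
    # [1, 5, 5, 3] has 75 one-byte elements; round_up(75, 16) pads the
    # allocation to the 16-byte AllocationQuantum, so storage_size() -> 80.
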
    def storage_size_for_sub_purpose(
        self, arch, sub_purpose: TensorSubPurpose, param_a: Optional[int] = None, param_b: Optional[int] = None
    ) -> int:
        alt_shape = self.storage_shape_for_sub_purpose(sub_purpose, param_a, param_b)
        elems = shape_num_elements(alt_shape)
        if elems is None:
            return 0
        if sub_purpose == TensorSubPurpose.DoubleBuffer:
            raw_size = (
                elems
                * self.element_size()
                * self.compression_scale_for_worst_weight_stream
                * arch.weight_estimation_scaling
            )
        else:
            # Rolling buffers are used for intermediate data in ifm streaming
            # These will all use the NHCWB16 format, and need to be aligned to 16 in the C-dimension
            if alt_shape[-1] % 16 != 0:
                nhcwb16_shape = alt_shape[0:-1] + [numeric_util.round_up(alt_shape[-1], 16)]
                elems = shape_num_elements(nhcwb16_shape)

            raw_size = elems * self.element_size() * self.storage_compression_scale
        rounded_size = numeric_util.round_up(numeric_util.round_up_to_int(raw_size), self.alignment)
        return rounded_size

    def storage_shape_for_sub_purpose(
        self, sub_purpose: TensorSubPurpose, param_a: Optional[int], param_b: Optional[int]
    ) -> Shape:
        if sub_purpose == TensorSubPurpose.DoubleBuffer:
            shp = list(self.shape)
            assert len(shp) >= 2
            assert param_a is not None
            shp[-1] = min(shp[-1], param_a * 2)
        else:
            shp = list(self.storage_shape)
            if sub_purpose == TensorSubPurpose.RollingBufferX:
                assert len(shp) == 4
                assert param_a is not None
                shp[0] = 1
                shp[2] = min(shp[2], param_a)
            elif sub_purpose == TensorSubPurpose.RollingBufferY:
                assert len(shp) == 4
                assert param_a is not None
                shp[0] = 1
                shp[1] = min(shp[1], param_a)
            elif sub_purpose == TensorSubPurpose.RollingBufferXY:
                assert len(shp) == 4
                assert param_a is not None
                assert param_b is not None
                shp[0] = 1
                shp[2] = min(shp[2], param_a)
                shp[1] = min(shp[1], param_b)
            elif sub_purpose == TensorSubPurpose.Standard:
                pass
            else:
                assert 0, "did not expect new sub purpose %s" % (sub_purpose,)

        return shp

    def set_new_sub_purpose(self, sub_purpose: TensorSubPurpose, param_a=None, param_b=None):
        self.storage_shape = self.storage_shape_for_sub_purpose(sub_purpose, param_a, param_b)
        self.sub_purpose = sub_purpose
        if sub_purpose == TensorSubPurpose.DoubleBuffer:
            self.storage_compression_scale = self.compression_scale_for_worst_weight_stream

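    # Illustrative effect of set_new_sub_purpose() (hypothetical numbers): for
    # DoubleBuffer with param_a == 32 the storage depth is capped at 64 (two
    # buffers of 32), so a [1, 1, 1, 512] weight tensor ends up with
    # storage_shape [1, 1, 1, 64].
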
    def bandwidth(self) -> float:
        elems = shape_num_elements(self.bandwidth_shape)
        if elems is None:
            return 0
        return elems * self.element_size() * self.bandwidth_compression_scale

    def consumers(self) -> List[Operation]:
        return self.consumer_list

    def addresses_for_rolling_buffer(self, start_coord: Shape, end_coord: Shape, fm_shape: Shape) -> Tuple:
        # returns ( box_height0, box_height1, box_width, [address_tl, address_tr, address_bl, address_br] )

        if self.storage_shape == []:
            return (
                1,
                1,
                1,
                [self.address_for_coordinate(start_coord, shape=fm_shape), None, None, None],
            )

        storage_shape_4D = full_shape(4, self.storage_shape, 1)
        crossing_y = numeric_util.round_up(start_coord[1] + 1, storage_shape_4D[1])
        crossing_x = numeric_util.round_up(start_coord[2] + 1, storage_shape_4D[2])

        crossing_y = min(crossing_y, end_coord[1])
        crossing_x = min(crossing_x, end_coord[2])

        box_height0 = crossing_y - start_coord[1]
        box_width = crossing_x - start_coord[2]

        addresses: List = [None] * 4
        addresses[0] = self.address_for_coordinate(start_coord, shape=fm_shape)

        if end_coord[2] > crossing_x:
            addresses[1] = self.address_for_coordinate(
                [start_coord[0], start_coord[1], crossing_x, start_coord[3]], shape=fm_shape
            )
            raise UnsupportedFeatureError("Striping in vertical direction is not supported")
        if end_coord[1] > crossing_y:
            addresses[2] = self.address_for_coordinate(
                [start_coord[0], crossing_y, start_coord[2], start_coord[3]], shape=fm_shape
            )
        if end_coord[1] > crossing_y and end_coord[2] > crossing_x:
            addresses[3] = self.address_for_coordinate(
                [start_coord[0], crossing_y, crossing_x, start_coord[3]], shape=fm_shape
            )

        return box_height0, box_height0, box_width, addresses

    def address_for_coordinate(self, coord: Shape, is_top_box: bool = False, shape: Shape = None) -> int:
        if shape is None:
            shape = self.shape
        offset = self.address_offset_for_coordinate(coord, shape, is_top_box)
        assert offset is not None
        return self.address + offset

    def get_strides_and_coord(self, coord: Optional[Shape] = None) -> Tuple[Optional[Shape], Optional[Shape]]:
        if coord is None:
            coord = [0] * len(self.storage_shape)

        augmented_coord = coord
        augmented_shape = self.storage_shape
        while len(augmented_shape) < 4:
            augmented_shape = [1] + augmented_shape

        while len(augmented_coord) < 4:
            augmented_coord = [0] + augmented_coord

        assert len(augmented_coord) == len(augmented_shape)

        if self.format == TensorFormat.NHWC:
            augmented_shape = [augmented_shape[0], augmented_shape[3]] + augmented_shape[1:3] + [1]
            augmented_coord = [augmented_coord[0], augmented_coord[3]] + augmented_coord[1:3] + [0]

        elif self.format == TensorFormat.NHCWB16:
            channel_divisor = 16
            augmented_shape = augmented_shape[0:4] + [1]
            augmented_coord = (
                [augmented_coord[0], augmented_coord[3] // channel_divisor]
                + augmented_coord[1:3]
                + [augmented_coord[3] % channel_divisor]
            )

            if augmented_shape[1] == 0:
                augmented_shape[1] = 1

        else:
            assert self.format in (TensorFormat.Unknown, TensorFormat.WeightsCompressed)
            return None, None

        strides: List = [0] * len(augmented_shape)
        stride = self.element_size() * self.storage_compression_scale

        if self.format != TensorFormat.NHCWB16:
            stride_order = [4, 1, 3, 2, 0]
            for i in stride_order:
                strides[i] = stride
                stride *= augmented_shape[i]
        else:
            assert len(strides) == 5
            strides[4] = stride
            strides[3] = 16 * stride  # STRIDE_X
            strides[1] = strides[3] * augmented_shape[2]  # STRIDE_C
            strides[2] = augmented_shape[2] * augmented_shape[3] * stride  # STRIDE_Y
            strides[0] = strides[2] * augmented_shape[1]  # STRIDE_N

        return strides, augmented_coord

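    # Illustrative stride layout (derived by hand, not from the original file):
    # for NHWC with storage_shape [1, 8, 8, 16] and one-byte elements, the
    # augmented [N, C, H, W, 1] strides come out as [1024, 1, 128, 16, 1]:
    # channels are contiguous, then width, then height, then batch.
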
    def get_strides(self) -> Shape:
        strides, _ = self.get_strides_and_coord()
        assert strides is not None
        return strides

    def needs_dma(self) -> bool:
        return len(self.ops) == 1 and self.ops[0].type == Op.DMA

    def get_dma_src_tensor(self) -> "Optional[Tensor]":
        # For weight tensors that need DMA: returns the source tensor in Flash, else None
        # Note: for DMA ops, Pass.weight_tensor is referring to the SRAM weight tensor
        return self.ops[0].inputs[0] if self.needs_dma() else None

    def find_npu_op(self) -> Optional[Operation]:
        # Returns the NPU operator that uses this tensor, excluding DMA operators.
        for op in self.consumers():
            if op.type == Op.DMA:
                return op.outputs[0].find_npu_op()
            if op.run_on_npu:
                return op
        return None

    def compressed_stream_index_from_coord(self, coord: Shape) -> int:
        assert self.format == TensorFormat.WeightsCompressed
        assert self.compressed_values is not None
        assert len(self.compressed_values) > 0
        assert len(self.compressed_values) + 1 == len(self.weight_compressed_offsets)

        depth = coord[-1]
        brick_depth = self.brick_size[-1]
        # Clamp position at final element index
        if depth > self.shape[-1]:
            depth = self.shape[-1]

        # Always round up to next boundary
        index = numeric_util.round_up_divide(depth, brick_depth)

        # Check boundaries on all but last weight set (which may be shorter
        # than the brick we divided it up into)
        if index < len(self.weight_compressed_offsets) - 1:
            # There are no half-way points in the weights
            if (depth % brick_depth) != 0:
                raise UnsupportedFeatureError("Offset into weights must be aligned to a brick")

        return index

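    # Illustrative mapping (hand-derived): with a brick depth of 16, a
    # coordinate at depth 32 selects stream index round_up_divide(32, 16) == 2;
    # unaligned depths raise UnsupportedFeatureError unless they fall inside
    # the final, shorter weight set.
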
    def size_of_compressed_stream(self, index: int) -> int:
        assert self.compressed_values is not None
        assert 0 <= index < len(self.compressed_values)
        return len(self.compressed_values[index])

    def is_last_index_in_compressed_stream(self, index: int) -> bool:
        assert self.compressed_values is not None
        assert 0 <= index < len(self.compressed_values)
        return index == len(self.compressed_values) - 1

    def address_offset_for_coordinate(self, orig_coord: Shape, shape: Shape, is_top_box: bool = False) -> Optional[int]:
        address_offset = 0
        coord = orig_coord

        coord = coord[-len(self.storage_shape) :]

        if self.sub_purpose == TensorSubPurpose.Standard:
            for idx, c in enumerate(orig_coord):
                if is_top_box:
                    assert c > 0 and c <= shape[idx]
                else:
                    assert c >= 0 and c < shape[idx]

        if self.format == TensorFormat.WeightsCompressed:
            if len(self.weight_compressed_offsets) == 0:
                return 0

            if self.needs_dma() and self.sub_purpose == TensorSubPurpose.DoubleBuffer:
                depth = orig_coord[-1]
                brick_depth = self.brick_size[-1]
                # Clamp position at final element index
                if depth > self.shape[-1]:
                    depth = self.shape[-1]

                # Always round up to next boundary
                index = numeric_util.round_up_divide(depth, brick_depth)
                index = index % 2
                assert self.compressed_values is not None

                if len(self.compressed_values) <= 2:
                    if is_top_box and index == 0:
                        for cv in self.compressed_values:
                            address_offset += len(cv)
                    else:
                        address_offset = index * len(self.compressed_values[0])
                else:
                    if is_top_box and index == 0:
                        address_offset = self.storage_shape[-1]
                    else:
                        address_offset = index * (self.storage_shape[-1] // 2)
            else:
                index = self.compressed_stream_index_from_coord(orig_coord)
                assert index < len(self.weight_compressed_offsets)
                address_offset = self.weight_compressed_offsets[index]
        else:
            if is_top_box:
                coord = [c - 1 for c in coord]

            # handle wraparound for partial buffers. make sure to do this after subtracting top box:
            coord = [c % self.storage_shape[idx] for idx, c in enumerate(coord)]

            strides, augmented_coord = self.get_strides_and_coord(coord)
            if strides is None:
                return None

            if is_top_box:
                address_offset += 1 * strides[-1]  # one element

            address_offset += np.dot(augmented_coord, strides)

        assert address_offset >= 0
        assert address_offset <= self.storage_size()
        return address_offset

    def is_allocated_in_tensor_arena(self, scratch_tensor_mem_area: MemArea) -> bool:
        return (self.mem_area == scratch_tensor_mem_area) and (self.mem_type in (MemType.Scratch, MemType.Scratch_fast))

    def equivalent(self, tens: "Tensor") -> bool:
        return self.equivalence_id == tens.equivalence_id

    def set_all_shapes(self, shape: Shape):
        self.shape = shape
        self.storage_shape = shape
        self.bandwidth_shape = shape

    def get_full_shape(self) -> Shape:
        d = len(self.shape)
        if d in (1, 3):
            return full_shape(4, self.shape, 1)
        elif d == 2:
            return [self.shape[0], 1, 1, self.shape[1]]
        else:
            return self.shape.copy()

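    # Illustrative mapping of get_full_shape() (hand-derived examples): 1D and
    # 3D shapes are left-padded with ones, while 2D is treated as [N, C], e.g.
    # [24] -> [1, 1, 1, 24] and [2, 24] -> [2, 1, 1, 24].
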
    def is_quantized(self) -> bool:
        # a tensor is quantized if it has an integral type and it contains valid quantization params

        if not isinstance(self.quantization, QuantizationParameters):
            return False

        return (self.dtype.type & BaseType.Int) != 0 and self.quantization.is_valid()

    def __lt__(self, other: "Tensor") -> bool:
        return self.equivalence_id < other.equivalence_id

    def __str__(self):
        return "<nng.Tensor '%s' shape=%s dtype=%s>" % (self.name, self.shape, self.dtype)

    __repr__ = __str__

    def error(self, msg):
        """
        Raises a VelaError exception for errors encountered when parsing a Tensor

        :param self: Tensor object that resulted in the error
        :param msg: str object that contains a description of the specific error encountered
        """

        def _print_operators(ops):
            lines = []
            for idx, op in enumerate(ops):
                op_type = getattr(op, "type", "Not an Operation")
                op_id = getattr(op, "op_index", "-")
                lines.append(f"        {idx} = {op_type} ({op_id})")
            return lines

        lines = [f"Invalid {self.name} tensor. {msg}"]

        lines += ["    Driving operators:"]
        lines += _print_operators(self.ops)

        lines += ["    Consuming operators:"]
        lines += _print_operators(self.consumer_list)

        raise VelaError("\n".join(lines))


def check_quantized_tens_scaling_equal(tens_a: Tensor, tens_b: Tensor) -> bool:
    # checks that the scaling of two quantized tensors is equal

    return tens_a.is_quantized() and tens_b.is_quantized() and tens_a.quantization.is_scaling_equal(tens_b.quantization)
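

# Typical use (an illustrative sketch; op.ifm/op.ofm are assumed accessors):
# guard a graph rewrite that is only safe when scaling matches on both sides:
#
#     if check_quantized_tens_scaling_equal(op.ifm, op.ofm):
#         ...  # the operation preserves scaling and can be treated as such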