Blame - ethosu/vela/tensor.py - ml/ethos-u/ethos-u-vela

2020-04-27 18:20:16 +0100

[diff] [blame]

#
# SPDX-License-Identifier: Apache-2.0
#
# Licensed under the Apache License, Version 2.0 (the License); you may
# not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an AS IS BASIS, WITHOUT
# WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

# Description:
# Internal representation of a Neural Network Tensor.

Patrik Gustavsson

2020-11-04 12:43:50 +0100

[diff] [blame]

18

import copy

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

19

import enum

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

20

import uuid

Jacob Bohlin

2020-09-11 10:04:15 +0200

[diff] [blame]

21

from collections import defaultdict

Diqing Zhong

f842b69

2020-12-11 13:07:37 +0100

[diff] [blame]

22

from enum import auto

Louis Verhaard

2020-09-23 10:27:11 +0200

[diff] [blame]

23

from functools import lru_cache

Louis Verhaard

6c74c3b

2020-12-17 13:54:09 +0100

[diff] [blame]

24

from functools import total_ordering

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

25

from typing import Dict

26

from typing import List

27

from typing import Optional

28

from typing import Tuple

29

from typing import Union

30

from uuid import UUID

Diego Russo

ea6111a

2020-04-14 18:41:58 +0100

[diff] [blame]

import numpy as np

from . import numeric_util

Tim Hall

2020-09-09 21:58:15 +0100

[diff] [blame]

35

from .data_type import BaseType

Michael McGeagh

2020-08-06 17:31:02 +0100

[diff] [blame]

36

from .data_type import DataType

Michael McGeagh

2020-12-16 11:33:21 +0000

[diff] [blame]

37

from .errors import UnsupportedFeatureError

38

from .errors import VelaError

Dwight Lidman

a9390f7

2020-05-13 12:00:08 +0200

[diff] [blame]

39

from .ethos_u55_regs.ethos_u55_regs import resampling_mode

Patrik Gustavsson

2020-12-01 16:02:29 +0100

[diff] [blame]

40

from .numeric_util import full_shape

Louis Verhaard

aee5d75

2020-09-30 09:01:52 +0200

[diff] [blame]

41

from .operation import Op

Michael McGeagh

2020-08-06 17:31:02 +0100

[diff] [blame]

42

from .operation import Operation

patrik.gustavsson

eeb8515

2020-12-21 17:10:40 +0000

[diff] [blame]

43

from .shape4d import Shape4D

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

44

45

# Alias used to annotate tensor shapes: a list of dimension sizes (the shape helpers
# in this file tolerate None entries, and a shape that is None altogether).
Shape = List

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

46

47

Patrik Gustavsson

2020-05-27 09:15:11 +0200

[diff] [blame]

48

class MemType(enum.IntFlag):
    """Kind of memory a tensor is allocated in.

    The values are consecutive ordinals (not independent bit flags): they are
    used directly as indices into the name tuples below, and ``Size`` is one
    past the last real member.
    """

    Unknown = 0
    Permanent_NPU = 1
    Permanent_CPU = 2
    Scratch = 3
    Scratch_fast = 4
    Size = Scratch_fast + 1

    def display_name(self) -> str:
        """Return the human readable name of this member."""
        return ("Unknown", "Permanent_NPU", "Permanent_CPU", "Scratch", "Scratch_fast", "Size")[self.value]

    def identifier_name(self) -> str:
        """Return the lower-case identifier form of this member's name."""
        return ("unknown", "permanent_npu", "permanent_cpu", "scratch", "scratch_fast", "size")[self.value]

    @staticmethod
    def all():
        """Return the real memory types, i.e. everything except Unknown and Size."""
        return (MemType.Permanent_NPU, MemType.Permanent_CPU, MemType.Scratch, MemType.Scratch_fast)

    def __str__(self):
        return self.name

Diqing Zhong

2020-12-11 13:07:37 +0100

[diff] [blame]

70

class BandwidthDirection(enum.IntEnum):
    """Direction of a memory transfer; ``Size`` is one past the last real member."""

    Read = 0
    Write = auto()
    Size = auto()

    def display_name(self):
        """Return the member name unchanged."""
        return self.name

    def identifier_name(self):
        """Return the member name in lower case."""
        return self.name.lower()

    @staticmethod
    def all():
        """Return the real directions, i.e. everything except Size."""
        return (BandwidthDirection.Read, BandwidthDirection.Write)

84

85

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

86

class MemArea(enum.IntFlag):
    """Physical memory area a tensor can live in.

    The values are consecutive ordinals (not independent bit flags): they are
    used directly as indices into the name tuples below, and ``Size`` is one
    past the last real member.
    """

    Unknown = 0
    Sram = 1
    Dram = 2
    OnChipFlash = 3
    OffChipFlash = 4
    Shram = 5  # for LUT
    Size = Shram + 1

    def display_name(self) -> str:
        """Return the human readable name of this member."""
        return ("Unknown", "SRAM", "DRAM", "On-chip Flash", "Off-chip Flash", "SHRAM", "Size")[self.value]

    def identifier_name(self) -> str:
        """Return the lower-case identifier form of this member's name."""
        return ("unknown", "sram", "dram", "on_chip_flash", "off_chip_flash", "shram", "size")[self.value]

    @staticmethod
    def all():
        """Return the real memory areas, i.e. everything except Unknown and Size."""
        return (MemArea.Sram, MemArea.Dram, MemArea.OnChipFlash, MemArea.OffChipFlash, MemArea.Shram)

    def __str__(self):
        return self.name

class TensorPurpose(enum.IntFlag):
    """What a tensor is used for.

    The values are consecutive ordinals (not independent bit flags): they are
    used directly as indices into the name tuples below.
    """

    Unknown = 0
    Weights = 1
    FeatureMap = 2
    Scratch = 3
    ScratchFast = 4
    LUT = 5
    FSBias = 6
    Size = 7

    def display_name(self) -> str:
        """Return the human readable name of this member."""
        return ("Unknown", "Weights", "FeatureMap", "Scratch", "ScratchFast", "LUT", "FastStorageBias", "Size")[
            self.value
        ]

    def identifier_name(self) -> str:
        """Return the lower-case identifier form of this member's name."""
        return ("unknown", "weights", "feature_map", "scratch", "scratch_fast", "lut", "fast_storage_bias", "size")[
            self.value
        ]

    @staticmethod
    def all():
        """Return the subset (Weights, FeatureMap, FSBias)."""
        return (TensorPurpose.Weights, TensorPurpose.FeatureMap, TensorPurpose.FSBias)

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

132

133

134

class TensorSubPurpose(enum.Enum):
    """Buffering scheme of a tensor; values index into the name tuples below."""

    Standard = 0
    DoubleBuffer = 1
    RollingBufferX = 2
    RollingBufferY = 3
    RollingBufferXY = 4

    def display_name(self) -> str:
        """Return the human readable name of this member."""
        return ("Standard", "Double Buffer", "Rolling Buffer X", "Rolling Buffer Y", "Rolling Buffer XY")[self.value]

    def identifier_name(self) -> str:
        """Return the lower-case identifier form of this member's name."""
        return ("standard", "double_buffer", "rolling_buffer_x", "rolling_buffer_y", "rolling_buffer_xy")[self.value]

    @staticmethod
    def all():
        """Return every member, in declaration order."""
        return (
            TensorSubPurpose.Standard,
            TensorSubPurpose.DoubleBuffer,
            TensorSubPurpose.RollingBufferX,
            TensorSubPurpose.RollingBufferY,
            TensorSubPurpose.RollingBufferXY,
        )

class TensorFormat(enum.Flag):
    """Storage format of a tensor.

    NOTE: the values are plain ordinals even though the base class is Flag,
    so NHCWB16 (3) has the same bits as WeightsCompressed | NHWC.
    """

    Unknown = 0
    WeightsCompressed = 1
    NHWC = 2
    NHCWB16 = 3

    def __str__(self):
        return self.name

class TensorBlockTraversal(enum.Enum):
    """Block traversal order recorded on a tensor."""

    Default = 0
    DepthWise = 1
    DepthFirst = 2
    PartKernelFirst = 3

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

175

def shape_num_elements(shp: Shape) -> Optional[int]:
    """Return the product of all dimensions of shp.

    Returns None when shp itself is None or when any dimension is None.
    An empty shape yields 1.
    """
    if shp is None:
        return None
    elems = 1
    for d in shp:
        if d is None:
            return None
        elems *= d
    return elems

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

186

def shape_fully_defined(shp: Shape) -> bool:
    """Return True when shp is not None and none of its dimensions is None."""
    if shp is None:
        return False
    return all(d is not None for d in shp)

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

195

def shape_round_to_quantum(shp: Shape, quantum: Tuple) -> Shape:
    """Return a copy of shp with each defined dimension rounded up to its quantum.

    Dimensions that are None are left as None. shp itself is not modified.
    """
    new_shp = list(shp)

    # Traverse backwards using length of shape since there may be more rounding quantums than shape elements
    for i in range(-1, -len(shp) - 1, -1):
        if new_shp[i] is not None:
            new_shp[i] = numeric_util.round_up(new_shp[i], quantum[i])
    return new_shp

Louis Verhaard

2020-09-23 10:27:11 +0200

[diff] [blame]

205

@lru_cache(maxsize=None)
def create_equivalence_id(key) -> UUID:
    """Generate an equivalence_id based on the given key.

    The id itself is a random UUID; the unbounded cache is what ties it to the
    key, so repeated calls with an equal (hashable) key return the same id.
    """
    return uuid.uuid4()

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

211

class QuantizationParameters:
    """Quantisation parameters of a tensor.

    min, max, scale_f32 and zero_point may each be a scalar or a numpy array
    (see is_per_axis).
    """

    __slots__ = "min", "max", "num_bits", "narrow_range", "scale_f32", "zero_point", "quant_min", "quant_max"

    def __init__(
        self,
        min: Union[float, np.ndarray, None] = None,
        max: Union[float, np.ndarray, None] = None,
        num_bits=None,
        narrow_range=None,
    ):
        self.min = min
        self.max = max

        self.num_bits = num_bits
        self.narrow_range = narrow_range

        self.scale_f32: Union[float, np.ndarray, None] = None
        self.zero_point: Union[int, np.ndarray, None] = None
        self.quant_min: Optional[float] = None
        self.quant_max: Optional[float] = None

    def __str__(self):
        return "<nng.QuantizationParameters min=%s max=%s, num_bits=%s, scale=%s, zero_point=%s>" % (
            self.min,
            self.max,
            self.num_bits,
            self.scale_f32,
            self.zero_point,
        )

    __repr__ = __str__

    def clone(self) -> "QuantizationParameters":
        """Return a new object carrying the same attribute values (arrays are shared, not copied)."""
        res = QuantizationParameters()
        res.min = self.min
        res.max = self.max

        res.num_bits = self.num_bits
        res.narrow_range = self.narrow_range

        res.scale_f32 = self.scale_f32
        res.zero_point = self.zero_point
        res.quant_min = self.quant_min
        res.quant_max = self.quant_max
        return res

    def dequantize(self, values):
        """Convert quantized values to float64 using scale_f32 and zero_point.

        With a single scale and zero point the result is
        (values - zero_point) * scale_f32. With per-axis parameters the
        quantized values are returned unchanged, converted to float64.
        """
        values_as_float = values.astype(np.float64)
        # np.size also accepts plain Python scalars, which have no .size attribute
        if np.size(self.zero_point) == 1 and np.size(self.scale_f32) == 1:
            # same scale is used for all values
            return (values_as_float - self.zero_point) * self.scale_f32

        # a different scale is used for different sets of values
        # this is not compatible with the format of depthwise weights,
        # where input is at index 3 (Output, Kh, Kw, Input)
        # return the quantized values
        # (previously this returned np.ndarray(shape), i.e. uninitialised memory)
        return values_as_float

    @staticmethod
    def _values_equal(a, b) -> bool:
        """Compare two scalar-or-array parameters without ambiguous array truthiness."""
        if a is None or b is None:
            return a is None and b is None
        try:
            return bool(np.all(np.equal(a, b)))
        except ValueError:
            # shapes that cannot be broadcast against each other are not equal
            return False

    def is_scaling_equal(self, other: Optional["QuantizationParameters"]) -> bool:
        """Return True if scale and zero point of self and other are equal.

        quantisation parameter scaling is not equal if 'other' is None because
        it implies that the tensor it belongs to is not quantised. otherwise,
        it depends upon whether the scale and zero point are equal
        """
        if not isinstance(other, QuantizationParameters):
            return False

        return self._values_equal(self.scale_f32, other.scale_f32) and self._values_equal(
            self.zero_point, other.zero_point
        )

    def is_valid(self) -> bool:
        """Return True if the parameters have both a scale and a zero point."""
        # identity checks: "None in (...)" would compare arrays elementwise and raise
        return self.scale_f32 is not None and self.zero_point is not None

    def is_per_axis(self) -> bool:
        """Returns True if either the scale, zero point, minimum or maximum values are arrays"""
        for attr in ("scale_f32", "zero_point", "min", "max"):
            if isinstance(getattr(self, attr), np.ndarray):
                return True
        return False

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

294

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

295

def create_const_tensor(
    name: str,
    shape: Shape,
    dtype: DataType,
    values: np.ndarray,
    value_dtype: np.dtype = None,
    purpose: TensorPurpose = TensorPurpose.Unknown,
    quantization: QuantizationParameters = None,
    quant_value_dtype: np.dtype = None,
):
    """Create a constant tensor together with the Const operation that produces it.

    The tensor is named name + "_0" and the operation is named name.
    values is converted with np.array(values, dtype=value_dtype); quant_values
    is the same raw buffer reinterpreted as quant_value_dtype (np.uint8 when
    not given). Returns the new tensor.
    """
    # Tensor
    const_tensor = Tensor(shape, dtype, name + "_0")
    const_tensor.purpose = purpose
    const_tensor.quantization = quantization
    const_tensor.values = np.array(values, dtype=value_dtype)
    # Test against None explicitly: relying on the truthiness of a dtype object
    # could silently discard a dtype the caller passed in
    const_tensor.quant_values = np.frombuffer(
        const_tensor.values.tobytes(), dtype=np.uint8 if quant_value_dtype is None else quant_value_dtype
    )
    # Operator
    const_op = Operation(Op.Const, name)
    const_op.set_output_tensor(const_tensor)
    const_op.set_ifm_ofm_shapes()
    return const_tensor

Jacob Bohlin

2020-09-11 10:04:15 +0200

[diff] [blame]

320

# class that keeps track of all tensor addresses in the different memory types
class TensorAddressMap:
    """Class-level registry of tensor addresses, shared by every user of the class."""

    address_map: Dict = defaultdict(dict)  # dict (tens.equivalence_id -> dict (mem_type -> address))

    @classmethod
    def get_address_for_tens(cls, tens_id: UUID, mem_type: MemType) -> Optional[int]:
        """Return the address stored for (tens_id, mem_type), or None if there is none."""
        return cls.address_map[tens_id].get(mem_type)

    @classmethod
    def set_address_for_tens(cls, tens_id: UUID, mem_type: MemType, address: int):
        """Store address for (tens_id, mem_type).

        Asserts that an already stored non-None address is not replaced by a
        different non-None address. Storing None is always accepted.
        """
        # Check previous address if there is one
        previous_address = cls.address_map[tens_id].get(mem_type)
        if address is not None and previous_address is not None:
            assert previous_address == address, "Two different addresses cannot be assigned to the same tensor."

        # Set tensor's address for memory type
        cls.address_map[tens_id][mem_type] = address

337

338

Louis Verhaard

6c74c3b

2020-12-17 13:54:09 +0100

[diff] [blame]

339

@total_ordering

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

class Tensor:

# Every instance attribute of Tensor must be listed here
__slots__ = (
    "shape",
    "storage_shape",
    "bandwidth_shape",
    "dtype",
    "name",
    "is_variable",
    "pre_buffer",
    "ops",
    "consumer_list",
    "values",
    "quant_values",
    "compressed_values",
    "compressed_values_substream_offsets",
    "mem_area",
    "mem_type",
    "format",
    "purpose",
    "sub_purpose",
    "alignment",
    "weight_transpose_depthwise",
    "storage_compression_scale",
    "bandwidth_compression_scale",
    "compression_scale_for_worst_weight_stream",
    "weight_compression_scales",
    "weight_compression_config",
    "value_id",
    "storage_rounding_quantum",
    "brick_size",
    "quantization",
    "weight_compressed_offsets",
    "element_size_bytes",
    "block_traversal",
    "equivalence_id",
    "resampling_mode",
    "src_tensor",
    "needs_linear_format",
)
# Default value of Tensor.alignment
AllocationQuantum = 16

380

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

381

def __init__(self, shape: Shape, dtype: DataType, name: str):
    """Create a tensor with the given shape, data type and name.

    storage_shape and bandwidth_shape start out as the same object as shape;
    every other attribute gets a neutral default.
    """
    self.shape = shape
    self.storage_shape = shape
    self.bandwidth_shape = shape
    self.dtype = dtype
    self.name = name
    self.is_variable = False
    self.pre_buffer = False
    self.equivalence_id: UUID = uuid.uuid4()

    self.ops: List[Operation] = []
    self.consumer_list: List[Operation] = []

    self.values: Optional[np.ndarray] = None
    self.quant_values: Optional[np.ndarray] = None
    self.compressed_values: Optional[np.ndarray] = None
    self.compressed_values_substream_offsets: Optional[List] = None
    self.mem_area: MemArea = MemArea.Unknown
    self.mem_type: MemType = MemType.Unknown
    self.format: TensorFormat = TensorFormat.Unknown
    self.purpose: TensorPurpose = TensorPurpose.Unknown
    self.sub_purpose: TensorSubPurpose = TensorSubPurpose.Standard
    self.alignment: int = Tensor.AllocationQuantum
    self.weight_transpose_depthwise: bool = False

    self.storage_compression_scale: float = 1.0
    self.bandwidth_compression_scale: float = 1.0
    self.compression_scale_for_worst_weight_stream: float = 1.0
    self.weight_compression_scales: Optional[np.ndarray] = None
    # if two tensors have the same weight_compression_config, then they have the same compressed values
    self.weight_compression_config = None
    # if two tensors have the same value_id, then they have the same values
    self.value_id: UUID = uuid.uuid4()
    self.weight_compressed_offsets: List = []
    self.storage_rounding_quantum: Tuple = (1, 1, 1, 1)
    self.brick_size: Tuple = (1, 1, 1, 1)
    self.element_size_bytes: int = 0

    # quantization parameters
    self.quantization: Optional[QuantizationParameters] = None
    self.block_traversal: TensorBlockTraversal = TensorBlockTraversal.Default
    self.resampling_mode: resampling_mode = resampling_mode.NONE

    self.needs_linear_format = True

    # Reference to parent-tensor if this tensor is a clone
    self.src_tensor = None

428

Jacob Bohlin

2020-09-11 10:04:15 +0200

[diff] [blame]

429

@property
def address(self) -> int:
    """Address registered in TensorAddressMap for this tensor's equivalence_id and mem_type.

    The lookup goes through dict.get, so the result is None when no address has been set.
    """
    return TensorAddressMap.get_address_for_tens(self.equivalence_id, self.mem_type)

@address.setter
def address(self, address: int):
    # Stored per (equivalence_id, mem_type) in TensorAddressMap rather than on the tensor itself
    TensorAddressMap.set_address_for_tens(self.equivalence_id, self.mem_type, address)

436

Patrik Gustavsson

2021-01-21 08:28:55 +0100

[diff] [blame]

437

@property
def is_standard_fm(self) -> bool:
    """True when the tensor is a feature map with the Standard sub purpose."""
    return self.sub_purpose == TensorSubPurpose.Standard and self.purpose == TensorPurpose.FeatureMap

440

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

441

def element_size(self) -> int:
    """Return the size of one element in bytes.

    An explicit element_size_bytes (non-zero) takes precedence; otherwise the
    size is derived from the data type.
    """
    if self.element_size_bytes == 0:
        # NOTE: true division, so this path yields a float despite the int annotation
        return self.dtype.size_in_bits() / 8
    return self.element_size_bytes

445

Patrik Gustavsson

2020-11-04 12:43:50 +0100

[diff] [blame]

446

def clone(self, suffix="_clone", set_unique: bool = False) -> "Tensor":
    """Return a copy of this tensor, renamed to self.name + suffix.

    The copy is made with copy.copy (shallow); on top of that storage_shape
    and bandwidth_shape become new lists and quantization, when present, is
    cloned. ops and consumer_list are empty on the returned tensor.
    With set_unique=True the copy gets a new equivalence_id; otherwise it
    keeps the one of this tensor.
    """
    res = copy.copy(self)
    if set_unique:
        res.equivalence_id = uuid.uuid4()
    res.storage_shape = list(self.storage_shape)
    res.bandwidth_shape = list(self.bandwidth_shape)
    if self.quantization is not None:
        res.quantization = self.quantization.clone()

    res.name = res.name + suffix
    res.ops = []
    res.consumer_list = []

    return res

464

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

465

def clone_into_fast_storage(self, arch) -> "Tensor":
    """Return a clone (suffix "_fast_storage") placed in arch.fast_storage_mem_area.

    The clone gets mem_type Scratch_fast and keeps a reference to this tensor
    in src_tensor.
    """
    res = self.clone(suffix="_fast_storage")
    res.mem_area = arch.fast_storage_mem_area
    res.mem_type = MemType.Scratch_fast
    res.src_tensor = self
    return res

471

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

472

def copy_compressed_weight_info(self, src_tens: "Tensor"):
    """Copy compressed values + all related weight compression info from src_tens.

    The attributes are assigned by reference (nothing is deep copied), and
    equivalence_id and value_id are taken over from src_tens as well.
    """
    copied_attrs = (
        "equivalence_id",
        "compressed_values",
        "compressed_values_substream_offsets",
        "storage_shape",
        "brick_size",
        "weight_compression_scales",
        "weight_compressed_offsets",
        "weight_transpose_depthwise",
        "compression_scale_for_worst_weight_stream",
        "storage_compression_scale",
        "bandwidth_compression_scale",
        "block_traversal",
        "weight_compression_config",
        "value_id",
    )
    for attr in copied_attrs:
        setattr(self, attr, getattr(src_tens, attr))

Louis Verhaard

2020-05-07 08:12:58 +0200

[diff] [blame]

488

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

489

def set_format(self, fmt: TensorFormat, arch):
    """Set the tensor format and derive rounding quantum, brick size and shapes from arch.

    Tensors with more than 4 dimensions only get their format updated.
    When shape is None the quantum and brick size are set but the shapes are
    left alone.
    """
    self.format = fmt
    shape_len = 0
    try:
        shape_len = len(self.shape)
    except TypeError:
        # shape has no length (e.g. it is None); keep shape_len at 0
        pass

    if shape_len > 4:
        return
    # Keep only the trailing shape_len entries; with shape_len == 0 the slice
    # [-0:] keeps the whole tuple
    self.storage_rounding_quantum = arch.storage_rounding_quantums[self.format]
    self.storage_rounding_quantum = tuple(self.storage_rounding_quantum[-shape_len:])
    self.brick_size = arch.brick_sizes[self.format]
    self.brick_size = tuple(self.brick_size[-shape_len:])
    if self.shape is None:
        return

    self.bandwidth_shape = shape_round_to_quantum(self.shape, self.brick_size)
    self.storage_shape = shape_round_to_quantum(self.shape, self.storage_rounding_quantum)

    if fmt == TensorFormat.WeightsCompressed:
        compression_ratio = 5 / 8
        self.storage_compression_scale = compression_ratio
        self.bandwidth_compression_scale = compression_ratio
        self.compression_scale_for_worst_weight_stream = compression_ratio

514

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

515

def storage_elements(self) -> int:
    """Return the number of elements in storage_shape, or 0 when it is not fully defined."""
    elems = shape_num_elements(self.storage_shape)
    if elems is None:
        return 0
    return elems

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

521

def elements(self) -> int:
    """Return the number of elements in shape, or 0 when it is not fully defined."""
    elems = shape_num_elements(self.shape)
    if elems is None:
        return 0
    return elems

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

527

def has_fully_defined_shape(self) -> bool:
    """Return True when shape is not None and contains no None dimension."""
    return shape_fully_defined(self.shape)

529

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

530

def storage_size(self, scale: float = 1.0) -> int:
    """Return the storage size in bytes, scaled by scale and rounded up to alignment.

    A tensor that would otherwise be empty is treated as occupying one byte
    before rounding.
    """
    raw_size = self.storage_elements() * self.element_size() * scale
    if raw_size == 0:
        raw_size = 1  # force it to take up space
    rounded_size = numeric_util.round_up(numeric_util.round_up_to_int(raw_size), self.alignment)
    return rounded_size

536

Patrik Gustavsson

2021-01-21 08:28:55 +0100

[diff] [blame]

537

def storage_size_for_shape(self, op_storage_shape: Shape) -> int:
    """Return the size in bytes needed for op_storage_shape, rounded up to alignment.

    A shape that is not fully defined counts as 0 elements, and an empty
    result is treated as occupying one byte before rounding.
    """
    elems = shape_num_elements(op_storage_shape)
    elems = elems if elems else 0
    raw_size = elems * self.element_size()
    if raw_size == 0:
        raw_size = 1  # force it to take up space
    rounded_size = numeric_util.round_up(numeric_util.round_up_to_int(raw_size), self.alignment)
    return rounded_size

545

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

546

def storage_shape_for_sub_purpose(
    self, sub_purpose: TensorSubPurpose, param_a: Optional[int], param_b: Optional[int]
) -> Shape:
    """Return the storage shape this tensor would have for the given sub purpose.

    The tensor itself is not modified. DoubleBuffer starts from shape and
    limits the last dimension to 2 * param_a; all other sub purposes start
    from storage_shape. The rolling buffer variants require a 4 element shape,
    set dimension 0 to 1 and limit dimension 2 (X) and/or dimension 1 (Y):
    RollingBufferX and RollingBufferY use param_a, RollingBufferXY uses
    param_a for dimension 2 and param_b for dimension 1.
    """
    if sub_purpose == TensorSubPurpose.DoubleBuffer:
        shp = list(self.shape)
        assert len(shp) >= 2
        assert param_a is not None
        shp[-1] = min(shp[-1], param_a * 2)
    else:
        shp = list(self.storage_shape)
        if sub_purpose == TensorSubPurpose.RollingBufferX:
            assert len(shp) == 4
            assert param_a is not None
            shp[0] = 1
            shp[2] = min(shp[2], param_a)
        elif sub_purpose == TensorSubPurpose.RollingBufferY:
            assert len(shp) == 4
            assert param_a is not None
            shp[0] = 1
            shp[1] = min(shp[1], param_a)
        elif sub_purpose == TensorSubPurpose.RollingBufferXY:
            assert len(shp) == 4
            assert param_a is not None
            assert param_b is not None
            shp[0] = 1
            shp[2] = min(shp[2], param_a)
            shp[1] = min(shp[1], param_b)
        elif sub_purpose == TensorSubPurpose.Standard:
            pass
        else:
            assert 0, "did not expect new sub purpose %s" % (sub_purpose,)

    return shp

579

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

580

def set_new_sub_purpose(self, sub_purpose: TensorSubPurpose, param_a=None, param_b=None):
    """Switch the tensor to sub_purpose and update storage_shape to match.

    For DoubleBuffer the storage compression scale is additionally set to
    compression_scale_for_worst_weight_stream.
    """
    self.storage_shape = self.storage_shape_for_sub_purpose(sub_purpose, param_a, param_b)
    self.sub_purpose = sub_purpose
    if sub_purpose == TensorSubPurpose.DoubleBuffer:
        self.storage_compression_scale = self.compression_scale_for_worst_weight_stream

585

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

586

def bandwidth(self) -> float:
    """Return elements in bandwidth_shape * element size * bandwidth_compression_scale.

    Returns 0 when bandwidth_shape is not fully defined.
    """
    elems = shape_num_elements(self.bandwidth_shape)
    if elems is None:
        return 0
    return elems * self.element_size() * self.bandwidth_compression_scale

591

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

592

def consumers(self) -> List[Operation]:
    """Return the list of operations that consume this tensor.

    The stored ``consumer_list`` object itself is returned, not a copy.
    """
    consuming_ops = self.consumer_list
    return consuming_ops

594

Patrik Gustavsson

2021-01-21 08:28:55 +0100

[diff] [blame]

595

def get_4D_storage_shape_for_shape(self, op_shape4D: Shape4D) -> Shape4D:
    """Return ``op_shape4D`` rounded to this tensor's storage rounding quantum.

    The rounding quantum is first expanded to four entries with ``full_shape``
    (fill value 1) before being applied through ``shape_round_to_quantum``.
    """
    quantum_4d = full_shape(4, list(self.storage_rounding_quantum), 1)
    rounded_dims = shape_round_to_quantum(op_shape4D.as_list(), quantum_4d)
    return Shape4D(rounded_dims)

598

599

def addresses_for_rolling_buffer(self, start_coord: Shape, end_coord: Shape, op_shape4D: Shape4D) -> Tuple:
    """Compute the box dimensions and addresses for a region of a rolling buffer.

    Returns ``(box_height0, box_height1, box_width, addresses)`` where
    ``addresses`` is ``[address_tl, address_tr, address_bl, address_br]``;
    entries that are not needed stay ``None``.

    Raises:
        UnsupportedFeatureError: if the region extends past the buffer
            wrap-around point along index 2 of the coordinates.
    """
    if self.storage_shape == []:
        only_address = self.address_for_coordinate(start_coord, op_shape4D=op_shape4D)
        return (1, 1, 1, [only_address, None, None, None])

    storage_shape_4D = (
        self.get_4D_storage_shape_for_shape(op_shape4D) if self.is_standard_fm else Shape4D(self.storage_shape)
    )

    # First positions after the start where the buffer wraps around.
    start_y = start_coord[1]
    wrap_y = numeric_util.round_up(start_y + 1, storage_shape_4D.height)
    start_x = start_coord[2]
    wrap_x = numeric_util.round_up(start_x + 1, storage_shape_4D.width)

    # Never cross further than the end of the requested region.
    crossing_y = min(wrap_y, end_coord[1])
    crossing_x = min(wrap_x, end_coord[2])

    box_height0 = crossing_y - start_y
    box_width = crossing_x - start_x

    addresses: List = [None, None, None, None]
    addresses[0] = self.address_for_coordinate(start_coord, op_shape4D=op_shape4D)

    crosses_x = end_coord[2] > crossing_x
    if crosses_x:
        addresses[1] = self.address_for_coordinate(
            [start_coord[0], start_coord[1], crossing_x, start_coord[3]], op_shape4D=op_shape4D
        )
        raise UnsupportedFeatureError("Striping in vertical direction is not supported")

    crosses_y = end_coord[1] > crossing_y
    if crosses_y:
        addresses[2] = self.address_for_coordinate(
            [start_coord[0], crossing_y, start_coord[2], start_coord[3]], op_shape4D=op_shape4D
        )
    # Unreachable while the x-crossing case above raises; kept to mirror the address layout.
    if end_coord[1] > crossing_y and end_coord[2] > crossing_x:
        addresses[3] = self.address_for_coordinate(
            [start_coord[0], crossing_y, crossing_x, start_coord[3]], op_shape4D=op_shape4D
        )

    # box_height0 is reported for both height slots.
    return box_height0, box_height0, box_width, addresses

642

Patrik Gustavsson

2021-01-21 08:28:55 +0100

[diff] [blame]

643

def address_for_coordinate(self, coord: Shape, is_top_box: bool = False, op_shape4D: Shape4D = None) -> int:
    """Return the absolute address of ``coord``: ``self.address`` plus the coordinate's offset.

    The offset comes from ``address_offset_for_coordinate`` and is asserted
    not to be ``None``.
    """
    relative_offset = self.address_offset_for_coordinate(coord, op_shape4D=op_shape4D, is_top_box=is_top_box)
    assert relative_offset is not None
    base_address = self.address
    return base_address + relative_offset

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

647

Patrik Gustavsson

2021-01-21 08:28:55 +0100

[diff] [blame]

648

def get_strides_and_coord(
    self, coord: Optional[Shape] = None, shape4D: Optional[Shape4D] = None
) -> Tuple[Optional[Shape], Optional[Shape]]:
    """Return ``(strides, augmented_coord)`` for this tensor's storage format.

    ``coord`` defaults to all zeros (one per storage dimension) and is
    left-padded with zeros to at least four entries. Both the shape and the
    coordinate are then rearranged into five entries according to
    ``self.format``. For formats other than NHWC and NHCWB16 the result is
    ``(None, None)``.
    """
    if coord is None:
        coord = [0] * len(self.storage_shape)

    shape_4d = (
        self.get_4D_storage_shape_for_shape(shape4D).as_list()
        if shape4D and self.is_standard_fm
        else full_shape(4, self.storage_shape, 1)
    )

    coord_4d = coord
    while len(coord_4d) < 4:
        coord_4d = [0] + coord_4d

    assert len(coord_4d) == len(shape_4d)

    brick_format = self.format == TensorFormat.NHCWB16
    if self.format == TensorFormat.NHWC:
        # Move index 3 next to index 0 and append a trailing unit dimension.
        shape_5d = [shape_4d[0], shape_4d[3], *shape_4d[1:3], 1]
        coord_5d = [coord_4d[0], coord_4d[3], *coord_4d[1:3], 0]
    elif brick_format:
        channel_divisor = 16
        shape_5d = [*shape_4d[0:4], 1]
        # Split index 3 of the coordinate into (brick index, position inside the brick).
        brick_index = coord_4d[3] // channel_divisor
        position_in_brick = coord_4d[3] % channel_divisor
        coord_5d = [coord_4d[0], brick_index, *coord_4d[1:3], position_in_brick]
        if shape_5d[1] == 0:
            shape_5d[1] = 1
    else:
        assert self.format in (TensorFormat.Unknown, TensorFormat.WeightsCompressed)
        return None, None

    element_stride = self.element_size() * self.storage_compression_scale
    strides: List = [0] * len(shape_5d)

    if brick_format:
        assert len(strides) == 5
        strides[4] = element_stride
        strides[3] = 16 * element_stride  # STRIDE_X
        strides[1] = strides[3] * shape_5d[2]  # STRIDE_C
        strides[2] = shape_5d[2] * shape_5d[3] * element_stride  # STRIDE_Y
        strides[0] = strides[2] * shape_5d[1]  # STRIDE_N
    else:
        # Accumulate strides starting from the fastest-varying index.
        running_stride = element_stride
        for axis in (4, 1, 3, 2, 0):
            strides[axis] = running_stride
            running_stride *= shape_5d[axis]

    return strides, coord_5d

703

Patrik Gustavsson

2021-01-21 08:28:55 +0100

[diff] [blame]

704

def get_strides(self, shape4D: Optional[Shape4D] = None) -> Shape:
    """Return only the strides computed by ``get_strides_and_coord``.

    Asserts that strides are available, i.e. that ``get_strides_and_coord``
    did not return ``None`` for them.
    """
    computed_strides, _unused_coord = self.get_strides_and_coord(shape4D=shape4D)
    assert computed_strides is not None
    return computed_strides

708

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

709

def find_npu_op(self) -> Optional[Operation]:
    """Return the first consumer of this tensor that runs on the NPU, or ``None`` if there is none."""
    npu_consumers = (consumer for consumer in self.consumers() if consumer.run_on_npu)
    return next(npu_consumers, None)

Louis Verhaard

2020-06-04 15:51:24 +0200

[diff] [blame]

715

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

716

def compressed_stream_index_from_coord(self, coord: Shape) -> int:
    """Map the last entry of ``coord`` to an index into the compressed weight streams.

    Only valid for tensors in ``WeightsCompressed`` format that hold compressed
    values. The depth is clamped to the last dimension of ``self.shape`` and
    divided (rounding up) by the last dimension of ``self.brick_size``.

    Raises:
        UnsupportedFeatureError: if the depth is not a multiple of the brick
            depth for any stream other than the last one.
    """
    assert self.format == TensorFormat.WeightsCompressed
    assert self.compressed_values is not None
    assert len(self.compressed_values) > 0
    assert len(self.compressed_values) + 1 == len(self.weight_compressed_offsets)

    requested_depth = coord[-1]
    brick_depth = self.brick_size[-1]
    # Clamp position at final element index
    depth = min(requested_depth, self.shape[-1])

    # Always round up to next boundary
    index = numeric_util.round_up_divide(depth, brick_depth)

    # Only the last weight set may be shorter than a full brick, so every
    # other position has to sit exactly on a brick boundary.
    final_stream_index = len(self.weight_compressed_offsets) - 1
    if index < final_stream_index and (depth % brick_depth) != 0:
        raise UnsupportedFeatureError("Offset into weights must be aligned to a brick")

    return index

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

740

def size_of_compressed_stream(self, index: int) -> int:
    """Return the length of the compressed stream stored at ``index``.

    Asserts that compressed values exist and that ``index`` is within range.
    """
    streams = self.compressed_values
    assert streams is not None
    assert 0 <= index < len(streams)
    selected_stream = streams[index]
    return len(selected_stream)

744

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

745

def is_last_index_in_compressed_stream(self, index: int) -> bool:
    """Return whether ``index`` refers to the final compressed stream.

    Asserts that compressed values exist and that ``index`` is within range.
    """
    streams = self.compressed_values
    assert streams is not None
    stream_count = len(streams)
    assert 0 <= index < stream_count
    return index == stream_count - 1

749

Patrik Gustavsson

2021-01-21 08:28:55 +0100

[diff] [blame]

750

def address_offset_for_coordinate(
    self, orig_coord: Shape, op_shape4D: Optional[Shape4D] = None, is_top_box: bool = False
) -> Optional[int]:
    """Return the offset of ``orig_coord`` relative to the start of this tensor's storage.

    Must not be called on weight tensors (asserted). With ``is_top_box`` set,
    every coordinate entry is reduced by one before wrap-around is applied and
    the size of one element (``strides[-1]``) is added to the result.
    Returns ``None`` when ``get_strides_and_coord`` provides no strides.
    """
    assert self.purpose != TensorPurpose.Weights

    if self.sub_purpose == TensorSubPurpose.Standard:
        # Range-check each coordinate entry; a top-box coordinate is one past the element.
        bounds = op_shape4D.as_list() if op_shape4D else self.shape
        for axis, position in enumerate(orig_coord):
            if is_top_box:
                assert 0 < position <= bounds[axis]
            else:
                assert 0 <= position < bounds[axis]

    if op_shape4D and self.is_standard_fm:
        wrap_shape = self.get_4D_storage_shape_for_shape(op_shape4D).as_list()
        size_limit = self.storage_size_for_shape(wrap_shape)
        coord = orig_coord
    else:
        wrap_shape = self.storage_shape
        # Keep only the trailing entries that match the rank of the storage shape.
        coord = orig_coord[-len(wrap_shape) :]
        size_limit = self.storage_size()

    if is_top_box:
        coord = [position - 1 for position in coord]

    # handle wraparound for partial buffers. make sure to do this after subtracting top box:
    coord = [position % wrap_shape[axis] for axis, position in enumerate(coord)]

    strides, augmented_coord = self.get_strides_and_coord(coord, op_shape4D)
    if strides is None:
        return None

    address_offset = 0
    if is_top_box:
        address_offset += 1 * strides[-1]  # one element
    address_offset += np.dot(augmented_coord, strides)

    assert address_offset >= 0
    assert address_offset <= size_limit
    return address_offset

790

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

791

def is_allocated_in_tensor_arena(self, scratch_tensor_mem_area: MemArea) -> bool:
    """Return whether this tensor lives in ``scratch_tensor_mem_area`` with a scratch memory type.

    Both ``MemType.Scratch`` and ``MemType.Scratch_fast`` count as scratch.
    """
    if not (self.mem_area == scratch_tensor_mem_area):
        return False
    scratch_types = (MemType.Scratch, MemType.Scratch_fast)
    return self.mem_type in scratch_types

Patrik Gustavsson

2020-05-27 09:15:11 +0200

[diff] [blame]

793

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

794

def equivalent(self, tens: "Tensor") -> bool:
    """Return whether ``tens`` has the same ``equivalence_id`` as this tensor."""
    own_id = self.equivalence_id
    other_id = tens.equivalence_id
    return own_id == other_id

796

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

797

def set_all_shapes(self, shape: Shape):
    """Set the shape, storage shape and bandwidth shape to ``shape``.

    All three attributes reference the same ``shape`` object; no copy is made.
    """
    self.shape = self.storage_shape = self.bandwidth_shape = shape

801

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

802

def get_full_shape(self) -> Shape:
    """Return this tensor's shape expanded towards four dimensions.

    * rank 2: ``[a, b]`` becomes ``[a, 1, 1, b]``
    * rank 1 or 3: expanded through ``full_shape(4, shape, 1)``
    * any other rank: a copy of the shape is returned unchanged
    """
    rank = len(self.shape)
    if rank == 2:
        first, last = self.shape
        return [first, 1, 1, last]
    if rank in (1, 3):
        return full_shape(4, self.shape, 1)
    return self.shape.copy()

Michael McGeagh

2020-08-06 17:31:02 +0100

[diff] [blame]

810

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

811

def is_quantized(self) -> bool:
    """Return whether this tensor is quantized.

    A tensor is quantized if it has an integral type and it contains valid
    quantization params.
    """
    quant = self.quantization
    if isinstance(quant, QuantizationParameters):
        has_integral_type = (self.dtype.type & BaseType.Int) != 0
        return has_integral_type and quant.is_valid()
    return False

Tim Hall

2020-09-09 21:58:15 +0100

[diff] [blame]

818

Louis Verhaard

6c74c3b

2020-12-17 13:54:09 +0100

[diff] [blame]

819

def __lt__(self, other: "Tensor") -> bool:
    """Order tensors by their ``equivalence_id``."""
    own_id = self.equivalence_id
    other_id = other.equivalence_id
    return own_id < other_id

821

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

822

def __str__(self):
    """Return a short description containing the tensor's name, shape and dtype."""
    template = "<nng.Tensor '%s' shape=%s dtype=%s>"
    return template % (self.name, self.shape, self.dtype)

# repr() and str() share the same text.
__repr__ = __str__

Tim Hall

2020-09-09 21:58:15 +0100

[diff] [blame]

826

Michael McGeagh

2020-12-16 11:33:21 +0000

[diff] [blame]

827

def error(self, msg):
    """Raise a ``VelaError`` describing a problem found while parsing this tensor.

    The message names the tensor, includes ``msg``, and lists the operators
    in ``self.ops`` (driving) and ``self.consumer_list`` (consuming).

    :param self: Tensor object that resulted in the error
    :param msg: str object that contains a description of the specific error encountered
    """

    def _describe(operators):
        # Objects lacking the expected attributes are still listed, with placeholders.
        return [
            " {} = {} ({})".format(
                position,
                getattr(operator, "type", "Not an Operation"),
                getattr(operator, "op_index", "-"),
            )
            for position, operator in enumerate(operators)
        ]

    report = [
        f"Invalid {self.name} tensor. {msg}",
        " Driving operators:",
        *_describe(self.ops),
        " Consuming operators:",
        *_describe(self.consumer_list),
    ]
    raise VelaError("\n".join(report))

852

Tim Hall

2020-09-09 21:58:15 +0100

[diff] [blame]

853

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

854

def check_quantized_tens_scaling_equal(tens_a: Tensor, tens_b: Tensor) -> bool:

Tim Hall

2020-09-09 21:58:15 +0100

[diff] [blame]

855

# checks that the scaling of two quantized tensors are equal

856

Tim Hall