# Copyright (C) 2020-2022 Arm Limited or its affiliates. All rights reserved.
#
# SPDX-License-Identifier: Apache-2.0
#
# Licensed under the Apache License, Version 2.0 (the License); you may
# not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an AS IS BASIS, WITHOUT
# WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
# Description:
# Internal representation of a Neural Network Tensor.
import copy
import enum
import uuid
from collections import defaultdict
from enum import auto
from functools import lru_cache
from functools import total_ordering
from typing import Dict
from typing import List
from typing import Optional
from typing import Tuple
from typing import Union
from uuid import UUID

import numpy as np

from . import numeric_util
from .data_type import BaseType
from .data_type import DataType
from .errors import UnsupportedFeatureError
from .errors import VelaError
from .numeric_util import full_shape
from .operation import Op
from .operation import Operation
from .shape4d import Shape4D

Shape = List


class MemType(enum.IntFlag):
    Unknown = 0
    Permanent_NPU = 1
    Permanent_CPU = 2
    Scratch = 3
    Scratch_fast = 4
    Size = Scratch_fast + 1

    def display_name(self) -> str:
        return ("Unknown", "Permanent_NPU", "Permanent_CPU", "Scratch", "Scratch_fast", "Size")[self.value]

    def identifier_name(self) -> str:
        return ("unknown", "permanent_npu", "permanent_cpu", "scratch", "scratch_fast", "size")[self.value]

    @staticmethod
    def all():
        return (MemType.Permanent_NPU, MemType.Permanent_CPU, MemType.Scratch, MemType.Scratch_fast)

    def __str__(self):
        return self.name


class BandwidthDirection(enum.IntEnum):
    Read = 0
    Write = auto()
    Size = auto()

    def display_name(self):
        return self.name

    def identifier_name(self):
        return self.name.lower()

    @staticmethod
    def all():
        return (BandwidthDirection.Read, BandwidthDirection.Write)


class MemArea(enum.IntFlag):
    Unknown = 0
    Sram = 1
    Dram = 2
    OnChipFlash = 3
    OffChipFlash = 4
    Shram = 5  # for LUT
    Size = Shram + 1

    def display_name(self) -> str:
        return ("Unknown", "SRAM", "DRAM", "On-chip Flash", "Off-chip Flash", "SHRAM", "Size")[self.value]

    def identifier_name(self) -> str:
        return ("unknown", "sram", "dram", "on_chip_flash", "off_chip_flash", "shram", "size")[self.value]

    @staticmethod
    def all():
        return (MemArea.Sram, MemArea.Dram, MemArea.OnChipFlash, MemArea.OffChipFlash, MemArea.Shram)

    def __str__(self):
        return self.name


class TensorPurpose(enum.IntFlag):
    Unknown = 0
    Weights = 1
    FeatureMap = 2
    Scratch = 3
    ScratchFast = 4
    LUT = 5
    FSBias = 6
    Size = 7

    def display_name(self) -> str:
        return ("Unknown", "Weights", "FeatureMap", "Scratch", "ScratchFast", "LUT", "FastStorageBias", "Size")[
            self.value
        ]

    def identifier_name(self) -> str:
        return ("unknown", "weights", "feature_map", "scratch", "scratch_fast", "lut", "fast_storage_bias", "size")[
            self.value
        ]

    @staticmethod
    def all():
        return (TensorPurpose.Weights, TensorPurpose.FeatureMap, TensorPurpose.FSBias)


class TensorSubPurpose(enum.Enum):
    Standard = 0
    DoubleBuffer = 1
    RollingBufferX = 2
    RollingBufferY = 3
    RollingBufferXY = 4

    def display_name(self) -> str:
        return ("Standard", "Double Buffer", "Rolling Buffer X", "Rolling Buffer Y", "Rolling Buffer XY")[self.value]

    def identifier_name(self) -> str:
        return ("standard", "double_buffer", "rolling_buffer_x", "rolling_buffer_y", "rolling_buffer_xy")[self.value]

    @staticmethod
    def all():
        return (
            TensorSubPurpose.Standard,
            TensorSubPurpose.DoubleBuffer,
            TensorSubPurpose.RollingBufferX,
            TensorSubPurpose.RollingBufferY,
            TensorSubPurpose.RollingBufferXY,
        )


class TensorFormat(enum.Flag):
    Unknown = 0
    WeightsCompressed = 1
    NHWC = 2
    NHCWB16 = 3

    def __str__(self):
        return self.name


class TensorBlockTraversal(enum.Enum):
    Default = 0
    DepthWise = 1
    DepthFirst = 2
    PartKernelFirst = 3


def shape_num_elements(shp: Shape) -> Optional[int]:
    elems = 1
    if shp is None:
        return None
    for d in shp:
        if d is None:
            return None
        elems *= d
    return elems


def shape_fully_defined(shp: Shape) -> bool:
    if shp is None:
        return False
    for d in shp:
        if d is None:
            return False
    return True


def shape_round_to_quantum(shp: Shape, quantum: Tuple) -> Shape:
    new_shp = list(shp)

    # Traverse backwards using length of shape since there may be more rounding quantums than shape elements
    for i in range(-1, -len(shp) - 1, -1):
        if new_shp[i] is not None:
            new_shp[i] = numeric_util.round_up(new_shp[i], quantum[i])
    return new_shp

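# A minimal illustration (not part of the original source): with a 16-channel
# rounding quantum, only the channel dimension of a NHWC shape is padded:
#
#   shape_round_to_quantum([1, 7, 7, 3], (1, 1, 1, 16))  # -> [1, 7, 7, 16]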

@lru_cache(maxsize=None)
def create_equivalence_id(key) -> UUID:
    # Generates an equivalence_id based on the given key; due to the lru_cache,
    # repeated calls with an equal key return the same UUID.
    return uuid.uuid4()

class QuantizationParameters:
    __slots__ = (
        "min",
        "max",
        "num_bits",
        "narrow_range",
        "next_after",
        "scale_f32",
        "zero_point",
        "quant_min",
        "quant_max",
        "quant_dim",
    )

    def __init__(
        self,
        min: Union[float, np.ndarray, None] = None,
        max: Union[float, np.ndarray, None] = None,
        num_bits=None,
        narrow_range=None,
    ):
        self.min = min
        self.max = max

        self.num_bits = num_bits
        self.narrow_range = narrow_range

        # Use the 'next after' float value of scale_f32 when converting to scale and shift. It can be combined with
        # natural rounding to perform rounding away from zero. This only affects the ofm scale and bias tensor; it has
        # no effect on global scaling, i.e. the ofm_scale register.
        self.next_after = False
        self.scale_f32: Union[float, np.ndarray, None] = None
        self.zero_point: Union[int, np.ndarray, None] = None
        self.quant_min: Optional[float] = None
        self.quant_max: Optional[float] = None
        self.quant_dim: Optional[int] = None

    def __str__(self):
        return (
            f"<nng.QuantizationParameters min={self.min}, max={self.max}, num_bits={self.num_bits}, "
            f"scale={self.scale_f32}, zero_point={self.zero_point}, next={self.next_after}>"
        )

    __repr__ = __str__

    def clone(self) -> "QuantizationParameters":
        res = QuantizationParameters()
        res.min = self.min
        res.max = self.max

        res.num_bits = self.num_bits
        res.narrow_range = self.narrow_range

        res.next_after = self.next_after
        res.scale_f32 = self.scale_f32
        res.zero_point = self.zero_point
        res.quant_min = self.quant_min
        res.quant_max = self.quant_max
        res.quant_dim = self.quant_dim
        return res

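    # A minimal illustration (not part of the original source): with zero_point=128
    # and scale_f32=0.5, a quantised value of 130 dequantises to (130 - 128) * 0.5 == 1.0.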
    def dequantize(self, values) -> np.ndarray:
        return np.subtract(values, self.zero_point) * self.scale_f32

    def is_scaling_equal(self, other: Optional["QuantizationParameters"]) -> bool:
        """
        Returns True if the scale and zero point of self and other are equal. If other is None, the scaling is
        not considered equal because the tensor is assumed not to be quantised, and False is returned.
        """

        if not isinstance(other, QuantizationParameters):
            return False

        return self.scale_f32 == other.scale_f32 and self.zero_point == other.zero_point

    def is_valid(self) -> bool:
        """Return True if the quantisation parameters have a scale and zero point"""

        return self.scale_f32 is not None and self.zero_point is not None

    def is_per_axis(self) -> bool:
        """Returns True if any of the scale, zero point, minimum or maximum values have more than one value"""

        for attr in ("scale_f32", "zero_point", "min", "max"):
            if np.size(getattr(self, attr)) > 1:
                return True
        return False

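# A minimal usage sketch (not part of the original source): a typical uint8
# affine quantisation of the real range [0.0, 6.0]:
#
#   q = QuantizationParameters(min=0.0, max=6.0, num_bits=8)
#   q.scale_f32 = 6.0 / 255
#   q.zero_point = 0
#   assert q.is_valid() and not q.is_per_axis()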

def create_const_tensor(
    name: str,
    shape: Shape,
    dtype: DataType,
    values: np.ndarray,
    value_dtype: np.dtype = None,
    purpose: TensorPurpose = TensorPurpose.Unknown,
    quantization: QuantizationParameters = None,
):
    # Tensor
    const_tensor = Tensor(shape, dtype, name + "_0")
    const_tensor.purpose = purpose
    const_tensor.quantization = quantization
    const_tensor.values = np.array(values, dtype=value_dtype)
    # Operator
    const_op = Operation(Op.Const, name)
    const_op.set_output_tensor(const_tensor)
    const_op.set_ifm_ofm_shapes()
    return const_tensor

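# A minimal usage sketch (not part of the original source): wrap a numpy array
# in a constant tensor driven by an Op.Const operation.
#
#   bias = create_const_tensor("bias", [1], DataType.int32, np.zeros(1, dtype=np.int32))
#   assert bias.is_const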

# class that keeps track of all tensor addresses in the different memory types
class TensorAddressMap:
    address_map: Dict = defaultdict(dict)  # dict (tens.equivalence_id -> dict (mem_type -> address))

    @classmethod
    def get_address_for_tens(cls, tens_id: UUID, mem_type: MemType) -> int:
        return cls.address_map[tens_id].get(mem_type)

    @classmethod
    def set_address_for_tens(cls, tens_id: UUID, mem_type: MemType, address: int):
        # Check previous address if there is one
        previous_address = cls.address_map[tens_id].get(mem_type)
        if address is not None and previous_address is not None:
            assert previous_address == address, "Two different addresses cannot be assigned to the same tensor."

        # Set tensor's address for memory type
        cls.address_map[tens_id][mem_type] = address

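# Note (not part of the original source): because addresses are keyed on
# equivalence_id rather than on the Tensor object itself, a tensor and a clone
# that kept the same equivalence_id resolve to the same address per memory type.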

@total_ordering
class Tensor:
    __slots__ = (
        "shape",
        "storage_shape",
        "bandwidth_shape",
        "dtype",
        "name",
        "is_variable",
        "pre_buffer",
        "ops",
        "consumer_list",
        "values",
        "compressed_values",
        "compressed_values_substream_offsets",
        "mem_area",
        "mem_type",
        "format",
        "purpose",
        "sub_purpose",
        "alignment",
        "weight_transpose_depthwise",
        "storage_compression_scale",
        "bandwidth_compression_scale",
        "compression_scale_for_worst_weight_stream",
        "weight_compression_scales",
        "weight_compression_config",
        "value_id",
        "storage_rounding_quantum",
        "brick_size",
        "quantization",
        "weight_compressed_offsets",
        "element_size_bytes",
        "block_traversal",
        "equivalence_id",
        "src_tensor",
        "needs_linear_format",
        "ifm_write_protected",
    )
    AllocationQuantum = 16

    def __init__(self, shape: Shape, dtype: DataType, name: str):
        self.shape = shape
        self.storage_shape = shape
        self.bandwidth_shape = shape
        self.dtype = dtype
        self.name = name
        self.is_variable = False
        self.pre_buffer = False
        self.equivalence_id: UUID = uuid.uuid4()

        self.ops: List[Operation] = []
        self.consumer_list: List[Operation] = []

        self.values: Optional[np.ndarray] = None  # elements are of type self.dtype
        self.compressed_values: Optional[np.ndarray] = None
        self.compressed_values_substream_offsets: Optional[List] = None
        self.mem_area: MemArea = MemArea.Unknown
        self.mem_type: MemType = MemType.Unknown
        self.format: TensorFormat = TensorFormat.Unknown
        self.purpose: TensorPurpose = TensorPurpose.Unknown
        self.sub_purpose: TensorSubPurpose = TensorSubPurpose.Standard
        self.alignment: int = Tensor.AllocationQuantum
        self.weight_transpose_depthwise: bool = False

        self.storage_compression_scale: float = 1.0
        self.bandwidth_compression_scale: float = 1.0
        self.compression_scale_for_worst_weight_stream: float = 1.0
        self.weight_compression_scales: Optional[np.ndarray] = None
        # if two tensors have the same weight_compression_config, then they have the same compressed values
        self.weight_compression_config = None
        # if two tensors have the same value_id, then they have the same values
        self.value_id: UUID = uuid.uuid4()
        self.weight_compressed_offsets: List = []
        self.storage_rounding_quantum: Tuple = (1, 1, 1, 1)
        self.brick_size: Tuple = (1, 1, 1, 1)
        self.element_size_bytes: int = 0

        # quantization parameters
        self.quantization: Optional[QuantizationParameters] = None
        self.block_traversal: TensorBlockTraversal = TensorBlockTraversal.Default

        self.needs_linear_format = True
        self.ifm_write_protected = False

        # Reference to parent-tensor if this tensor is a clone
        self.src_tensor: Optional[Tensor] = None

    @property
    def address(self) -> int:
        return TensorAddressMap.get_address_for_tens(self.equivalence_id, self.mem_type)

    @address.setter
    def address(self, address: int):
        TensorAddressMap.set_address_for_tens(self.equivalence_id, self.mem_type, address)

    @property
    def is_standard_fm(self) -> bool:
        return self.sub_purpose == TensorSubPurpose.Standard and self.purpose == TensorPurpose.FeatureMap

    @property
    def is_const(self) -> bool:
        return self.ops != [] and self.ops[0].type == Op.Const

    @property
    def is_scalar(self) -> bool:
        return self.shape == [] and self.elements() == 1

    def is_broadcast(self, ofm) -> bool:
        return self.shape != ofm.shape

    def element_size(self) -> int:
        if self.element_size_bytes == 0:
            return self.dtype.size_in_bits() // 8
        return self.element_size_bytes

    # Returns a copy, renamed to self.name + suffix
    # The references to Operators will be empty when returned
    # Depending on set_unique, the copy is shallow or deep
    # For set_unique==True, a new equivalence_id will be set
    def clone(self, suffix="_clone", set_unique: bool = False) -> "Tensor":
        res = copy.copy(self)
        if set_unique:
            res.equivalence_id = uuid.uuid4()
        res.storage_shape = list(self.storage_shape)
        res.bandwidth_shape = list(self.bandwidth_shape)
        if self.quantization is not None:
            res.quantization = self.quantization.clone()

        res.name = res.name + suffix
        res.ops = []
        res.consumer_list = []

        return res

    def clone_into_fast_storage(self, arch) -> "Tensor":
        res = self.clone(suffix="_fast_storage")
        res.mem_area = arch.fast_storage_mem_area
        res.mem_type = MemType.Scratch_fast
        res.src_tensor = self
        return res

    def copy_compressed_weight_info(self, src_tens: "Tensor"):
        # Copies compressed values + all related weight compression info from the given tensor
        self.equivalence_id = src_tens.equivalence_id
        self.compressed_values = src_tens.compressed_values
        self.compressed_values_substream_offsets = src_tens.compressed_values_substream_offsets
        self.storage_shape = src_tens.storage_shape
        self.brick_size = src_tens.brick_size
        self.weight_compression_scales = src_tens.weight_compression_scales
        self.weight_compressed_offsets = src_tens.weight_compressed_offsets
        self.weight_transpose_depthwise = src_tens.weight_transpose_depthwise
        self.compression_scale_for_worst_weight_stream = src_tens.compression_scale_for_worst_weight_stream
        self.storage_compression_scale = src_tens.storage_compression_scale
        self.bandwidth_compression_scale = src_tens.bandwidth_compression_scale
        self.block_traversal = src_tens.block_traversal
        self.weight_compression_config = src_tens.weight_compression_config
        self.value_id = src_tens.value_id

    def set_format(self, fmt: TensorFormat, arch):
        self.format = fmt
        shape_len = 0
        try:
            shape_len = len(self.shape)
        except TypeError:
            pass

        if shape_len > 4:
            return
        assert not (self.needs_linear_format and fmt == TensorFormat.NHCWB16)
        self.storage_rounding_quantum = arch.storage_rounding_quantums[self.format]
        self.storage_rounding_quantum = tuple(self.storage_rounding_quantum[-shape_len:])
        self.brick_size = arch.brick_sizes[self.format]
        self.brick_size = tuple(self.brick_size[-shape_len:])
        if self.shape is None:
            return

        self.bandwidth_shape = shape_round_to_quantum(self.shape, self.brick_size)
        self.storage_shape = shape_round_to_quantum(self.shape, self.storage_rounding_quantum)

        if fmt == TensorFormat.WeightsCompressed:
            compression_ratio = 5 / 8
            self.storage_compression_scale = compression_ratio
            self.bandwidth_compression_scale = compression_ratio
            self.compression_scale_for_worst_weight_stream = compression_ratio

    def storage_elements(self) -> int:
        elems = shape_num_elements(self.storage_shape)
        if elems is None:
            return 0
        return elems

    def elements(self) -> int:
        elems = shape_num_elements(self.shape)
        if elems is None:
            return 0
        return elems

    def has_fully_defined_shape(self) -> bool:
        return shape_fully_defined(self.shape)

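    # Illustrative note (not part of the original source): an int8 tensor with
    # storage_shape [1, 5, 5, 3] occupies 75 bytes, which storage_size() rounds up
    # to 80 with the default 16-byte AllocationQuantum alignment.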
    def storage_size(self, scale: float = 1.0) -> int:
        raw_size = self.storage_elements() * self.element_size() * scale
        if raw_size == 0:
            raw_size = 1  # force it to take up space
        rounded_size = numeric_util.round_up(numeric_util.round_up_to_int(raw_size), self.alignment)
        return rounded_size

    def storage_size_for_shape(self, op_storage_shape: Shape) -> int:
        elems = shape_num_elements(op_storage_shape)
        elems = elems if elems else 0
        raw_size = elems * self.element_size()
        if raw_size == 0:
            raw_size = 1  # force it to take up space
        rounded_size = numeric_util.round_up(numeric_util.round_up_to_int(raw_size), self.alignment)
        return rounded_size

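    # Illustrative note (not part of the original source): for DoubleBuffer the last
    # (depth) dimension is capped at 2 * param_a, so that two weight streams of depth
    # param_a can be held at once; the rolling-buffer variants cap height/width instead.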
    def storage_shape_for_sub_purpose(
        self, sub_purpose: TensorSubPurpose, param_a: Optional[int], param_b: Optional[int]
    ) -> Shape:
        if sub_purpose == TensorSubPurpose.DoubleBuffer:
            shp = list(self.shape)
            assert len(shp) >= 2
            assert param_a is not None
            shp[-1] = min(shp[-1], param_a * 2)
        else:
            shp = full_shape(4, self.storage_shape, 1)
            if sub_purpose == TensorSubPurpose.RollingBufferX:
                assert len(shp) == 4
                assert param_a is not None
                shp[0] = 1
                shp[2] = min(shp[2], param_a)
            elif sub_purpose == TensorSubPurpose.RollingBufferY:
                assert len(shp) == 4
                assert param_a is not None
                shp[0] = 1
                shp[1] = min(shp[1], param_a)
            elif sub_purpose == TensorSubPurpose.RollingBufferXY:
                assert len(shp) == 4
                assert param_a is not None
                assert param_b is not None
                shp[0] = 1
                shp[2] = min(shp[2], param_a)
                shp[1] = min(shp[1], param_b)
            elif sub_purpose == TensorSubPurpose.Standard:
                pass
            else:
                assert 0, "did not expect new sub purpose %s" % (sub_purpose,)

        return shp

    def set_new_sub_purpose(self, sub_purpose: TensorSubPurpose, param_a=None, param_b=None):
        self.storage_shape = self.storage_shape_for_sub_purpose(sub_purpose, param_a, param_b)
        self.sub_purpose = sub_purpose
        if sub_purpose == TensorSubPurpose.DoubleBuffer:
            self.storage_compression_scale = self.compression_scale_for_worst_weight_stream

    def bandwidth(self) -> float:
        elems = shape_num_elements(self.bandwidth_shape)
        if elems is None:
            return 0
        return elems * self.element_size() * self.bandwidth_compression_scale

    def consumers(self) -> List[Operation]:
        return self.consumer_list

    def get_4D_storage_shape_for_shape(self, op_shape4D: Shape4D) -> Shape4D:
        rounding_quantum = full_shape(4, list(self.storage_rounding_quantum), 1)
        return Shape4D(shape_round_to_quantum(op_shape4D.as_list(), rounding_quantum))

    def addresses_for_rolling_buffer(
        self, start_coord: Shape, end_coord: Shape, strides: List[int], op_shape4D: Shape4D
    ) -> Tuple:
        # returns ( box_height0, box_height1, box_width, [address_tl, address_tr, address_bl, address_br] )

        if self.storage_shape == []:
            return (
                1,
                1,
                1,
                [self.address_for_coordinate(start_coord, strides, op_shape4D), 0, 0, 0],
            )

        if self.is_standard_fm:
            storage_shape_4D = self.get_4D_storage_shape_for_shape(op_shape4D)
        else:
            storage_shape_4D = Shape4D(self.storage_shape)

        crossing_y = numeric_util.round_up(start_coord[1] + 1, storage_shape_4D.height)
        crossing_x = numeric_util.round_up(start_coord[2] + 1, storage_shape_4D.width)

        crossing_y = min(crossing_y, end_coord[1])
        crossing_x = min(crossing_x, end_coord[2])

        box_height0 = crossing_y - start_coord[1]
        box_width = crossing_x - start_coord[2]

        addresses: List = [0] * 4
        addresses[0] = self.address_for_coordinate(start_coord, strides, op_shape4D)

        if end_coord[2] > crossing_x:
            addresses[1] = self.address_for_coordinate(
                [start_coord[0], start_coord[1], crossing_x, start_coord[3]], strides, op_shape4D
            )
            raise UnsupportedFeatureError("Striping in vertical direction is not supported")
        if end_coord[1] > crossing_y:
            addresses[2] = self.address_for_coordinate(
                [start_coord[0], crossing_y, start_coord[2], start_coord[3]], strides, op_shape4D
            )
        if end_coord[1] > crossing_y and end_coord[2] > crossing_x:
            addresses[3] = self.address_for_coordinate(
                [start_coord[0], crossing_y, crossing_x, start_coord[3]], strides, op_shape4D
            )

        return box_height0, box_height0, box_width, addresses

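    # Illustrative note (not part of the original source): for an int8 NHWC feature
    # map the augmented shape is [N, C, H, W, 1], so get_strides() yields strides of
    # [C*H*W, 1, C*W, C, 1] bytes, i.e. the channel dimension is innermost.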
    def get_strides(self, shape4D: Optional[Shape4D]) -> List[int]:

        augmented_shape = self.get_augmented_shape(shape4D)
        assert len(augmented_shape) == 5
        strides: List = [0] * len(augmented_shape)
        stride = self.element_size() * self.storage_compression_scale

        if self.format != TensorFormat.NHCWB16:
            stride_order = [4, 1, 3, 2, 0]
            for i in stride_order:
                strides[i] = stride
                stride *= augmented_shape[i]
        else:
            strides[4] = stride
            strides[3] = 16 * stride  # STRIDE_X
            strides[1] = strides[3] * augmented_shape[2]  # STRIDE_C
            strides[2] = augmented_shape[2] * augmented_shape[3] * stride  # STRIDE_Y
            strides[0] = strides[2] * augmented_shape[1]  # STRIDE_N

        return strides

    def get_augmented_shape(self, shape4D: Optional[Shape4D] = None) -> Optional[Shape]:

        if shape4D and self.is_standard_fm:
            augmented_shape = self.get_4D_storage_shape_for_shape(shape4D).as_list()
        else:
            augmented_shape = full_shape(4, self.storage_shape, 1)

        if self.format == TensorFormat.NHWC:
            augmented_shape = [augmented_shape[0], augmented_shape[3]] + augmented_shape[1:3] + [1]

        elif self.format == TensorFormat.NHCWB16:
            augmented_shape = augmented_shape[0:4] + [1]

            if augmented_shape[1] == 0:
                augmented_shape[1] = 1

        else:
            assert self.format in (TensorFormat.Unknown, TensorFormat.WeightsCompressed)
            return None

        return augmented_shape

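    # Illustrative note (not part of the original source): in NHCWB16 the channel
    # coordinate c is split into a brick index c // 16 and a brick offset c % 16,
    # so an NHWC coordinate [0, 2, 3, 35] augments to [0, 2, 2, 3, 3].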
    def get_augmented_coord(self, coord: Optional[Shape] = None) -> Optional[Shape]:
        if coord is None:
            coord = [0] * min(len(self.storage_shape), 4)

        missing_len = 4 - len(coord)
        augmented_coord = ([0] * missing_len) + coord

        if self.format == TensorFormat.NHWC:
            augmented_coord = [augmented_coord[0], augmented_coord[3]] + augmented_coord[1:3] + [0]

        elif self.format == TensorFormat.NHCWB16:
            channel_divisor = 16
            augmented_coord = (
                [augmented_coord[0], augmented_coord[3] // channel_divisor]
                + augmented_coord[1:3]
                + [augmented_coord[3] % channel_divisor]
            )
        else:
            assert self.format in (TensorFormat.Unknown, TensorFormat.WeightsCompressed)
            return None

        return augmented_coord

    def find_npu_op(self) -> Optional[Operation]:
        # Returns the NPU operator that uses this tensor
        for op in self.consumers():
            if op.run_on_npu:
                return op
        return None

    def compressed_stream_index_from_coord(self, coord: Shape) -> int:
        assert self.format == TensorFormat.WeightsCompressed
        assert self.compressed_values is not None
        assert len(self.compressed_values) > 0
        assert len(self.compressed_values) + 1 == len(self.weight_compressed_offsets)

        depth = coord[-1]
        brick_depth = self.brick_size[-1]
        # Clamp position at final element index
        if depth > self.shape[-1]:
            depth = self.shape[-1]

        # Always round up to next boundary
        index = numeric_util.round_up_divide(depth, brick_depth)

        # Check boundaries on all but last weight set (which may be shorter
        # than the brick we divided it up into)
        if index < len(self.weight_compressed_offsets) - 1:
            # There are no half-way points in the weights
            if (depth % brick_depth) != 0:
                raise UnsupportedFeatureError("Offset into weights must be aligned to a brick")

        return index

    def size_of_compressed_stream(self, index: int) -> int:
        assert self.compressed_values is not None
        assert 0 <= index < len(self.compressed_values)
        return len(self.compressed_values[index])

    def is_last_index_in_compressed_stream(self, index: int) -> bool:
        assert self.compressed_values is not None
        assert 0 <= index < len(self.compressed_values)
        return index == len(self.compressed_values) - 1

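    # Illustrative note (not part of the original source): with is_top_box=True the
    # exclusive end coordinate is mapped onto the last element inside the box and one
    # element's stride is added back, giving the address just past the box.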
    def address_for_coordinate(
        self,
        orig_coord: Shape,
        strides: Optional[List[int]] = None,
        op_shape4D: Optional[Shape4D] = None,
        is_top_box: bool = False,
    ) -> Optional[int]:

        address_offset = 0
        assert self.purpose != TensorPurpose.Weights

        # Strides may be passed as an argument, for example when creating feature maps as the strides may be modified
        # by the "ofm_stride_multiplier" operation attribute. If not, they are calculated here.
        if not strides:
            strides = self.get_strides(op_shape4D)

        coord = orig_coord
        if is_top_box:
            coord = [c - 1 for c in orig_coord]
            address_offset += 1 * strides[-1]  # one element

        if self.sub_purpose == TensorSubPurpose.Standard:
            shape = op_shape4D.as_list() if op_shape4D else self.shape
            for _coord, _shape in zip(coord, shape):
                assert _coord >= 0 and _coord < _shape

        if op_shape4D and self.is_standard_fm:
            storage_shape = self.get_4D_storage_shape_for_shape(op_shape4D).as_list()
            storage_size = self.storage_size_for_shape(storage_shape)
        else:
            storage_shape = self.storage_shape
            coord = coord[-len(storage_shape) :]
            storage_size = self.storage_size()

        # Handle wraparound for partial buffers. Make sure to do this after subtracting top box
        coord = [_coord % _shape for _coord, _shape in zip(coord, storage_shape)]

        augmented_coord = self.get_augmented_coord(coord)
        assert augmented_coord is not None

        address_offset += np.dot(augmented_coord, strides)

        assert address_offset >= 0 and address_offset <= storage_size
        return self.address + address_offset

    def is_allocated_in_tensor_arena(self, scratch_tensor_mem_area: MemArea) -> bool:
        return (self.mem_area == scratch_tensor_mem_area) and (self.mem_type in (MemType.Scratch, MemType.Scratch_fast))

    def equivalent(self, tens: "Tensor") -> bool:
        return self.equivalence_id == tens.equivalence_id

    def set_all_shapes(self, shape: Shape):
        self.shape = shape
        self.storage_shape = shape
        self.bandwidth_shape = shape

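    # Illustrative note (not part of the original source): get_full_shape() pads to
    # 4D as [10] -> [1, 1, 1, 10] and [2, 8] -> [2, 1, 1, 8], while an already 4D
    # shape is returned as a copy.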
    def get_full_shape(self) -> Shape:
        d = len(self.shape)
        if d in (1, 3):
            return full_shape(4, self.shape, 1)
        elif d == 2:
            return [self.shape[0], 1, 1, self.shape[1]]
        else:
            return self.shape.copy()

    def is_quantized(self) -> bool:
        # a tensor is quantized if it has an integral type and it contains valid quantization params

        if not isinstance(self.quantization, QuantizationParameters):
            return False

        return (self.dtype.type & BaseType.Int) != 0 and self.quantization.is_valid()

    def get_scalar(self):
        """
        return: Unquantized or dequantized scalar value
        rtype: self.dtype (if unquantized) or float (if dequantized)
        """
        assert self.values.size == 1, "get_scalar called on non-scalar tensor"
        if self.is_quantized():
            return self.quantization.dequantize(self.values).item(0)
        else:
            return self.values.item(0)

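    # Illustrative note (not part of the original source): a [2, 3, 4] tensor with
    # dimension_2_size=4 has 24 elements and reduces to Shape4D([6, 1, 1, 4]); a
    # size that does not evenly divide the element count returns None.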
    def get_shape_as_2d(self, dimension_2_size: int) -> Optional[Shape4D]:

        elms = self.elements()
        dimension_1_size = elms // dimension_2_size
        # Checks if the reduction works and shape is not 1D
        is_reducible = dimension_1_size * dimension_2_size == elms and not (len(self.shape) == 1)

        new_shape = None
        if is_reducible:
            new_shape = Shape4D([dimension_1_size, 1, 1, dimension_2_size])

        return new_shape

    def __lt__(self, other: "Tensor") -> bool:
        return self.equivalence_id < other.equivalence_id

    def __str__(self):
        return "<nng.Tensor '%s' shape=%s dtype=%s>" % (self.name, self.shape, self.dtype)

    __repr__ = __str__

    def error(self, msg):
        """
        Raises a VelaError exception for errors encountered when parsing a Tensor

        :param self: Tensor object that resulted in the error
        :param msg: str object that contains a description of the specific error encountered
        """

        def _print_operators(ops):
            lines = []
            for idx, op in enumerate(ops):
                op_type = getattr(op, "type", "Not an Operation")
                op_id = getattr(op, "op_index", "-")
                lines.append(f"        {idx} = {op_type} ({op_id})")
            return lines

        lines = [f"Invalid {self.name} tensor. {msg}"]

        lines += ["    Driving operators:"]
        lines += _print_operators(self.ops)

        lines += ["    Consuming operators:"]
        lines += _print_operators(self.consumer_list)

        raise VelaError("\n".join(lines))


def check_quantized_tens_scaling_equal(tens_a: Tensor, tens_b: Tensor) -> bool:
    # Checks that the scaling of two quantized tensors is equal

    return tens_a.is_quantized() and tens_b.is_quantized() and tens_a.quantization.is_scaling_equal(tens_b.quantization)