# SPDX-FileCopyrightText: Copyright 2020-2022 Arm Limited and/or its affiliates <open-source-office@arm.com>
#
# SPDX-License-Identifier: Apache-2.0
#
# Licensed under the Apache License, Version 2.0 (the License); you may
# not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an AS IS BASIS, WITHOUT
# WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#
# Description:
# Internal representation of a Neural Network Tensor.
import copy
import enum
import uuid
from collections import defaultdict
from enum import auto
from functools import lru_cache
from functools import total_ordering
from typing import Dict
from typing import List
from typing import Optional
from typing import Tuple
from typing import Union
from uuid import UUID

import numpy as np

from . import numeric_util
from .data_type import BaseType
from .data_type import DataType
from .errors import UnsupportedFeatureError
from .errors import VelaError
from .numeric_util import full_shape
from .operation import Op
from .operation import Operation
from .shape4d import Shape4D

Shape = List


class MemType(enum.IntFlag):
    Unknown = 0
    Permanent_NPU = 1
    Permanent_CPU = 2
    Scratch = 3
    Scratch_fast = 4
    Size = Scratch_fast + 1

    def display_name(self) -> str:
        return ("Unknown", "Permanent_NPU", "Permanent_CPU", "Scratch", "Scratch_fast", "Size")[self.value]

    def identifier_name(self) -> str:
        return ("unknown", "permanent_npu", "permanent_cpu", "scratch", "scratch_fast", "size")[self.value]

    @staticmethod
    def all():
        return (MemType.Permanent_NPU, MemType.Permanent_CPU, MemType.Scratch, MemType.Scratch_fast)

    def __str__(self):
        return self.name


class BandwidthDirection(enum.IntEnum):
    Read = 0
    Write = auto()
    Size = auto()

    def display_name(self):
        return self.name

    def identifier_name(self):
        return self.name.lower()

    @staticmethod
    def all():
        return (BandwidthDirection.Read, BandwidthDirection.Write)


class MemArea(enum.IntFlag):
    Unknown = 0
    Sram = 1
    Dram = 2
    OnChipFlash = 3
    OffChipFlash = 4
    Shram = 5  # for LUT
    Size = Shram + 1

    def display_name(self) -> str:
        return ("Unknown", "SRAM", "DRAM", "On-chip Flash", "Off-chip Flash", "SHRAM", "Size")[self.value]

    def identifier_name(self) -> str:
        return ("unknown", "sram", "dram", "on_chip_flash", "off_chip_flash", "shram", "size")[self.value]

    @staticmethod
    def all():
        return (MemArea.Sram, MemArea.Dram, MemArea.OnChipFlash, MemArea.OffChipFlash, MemArea.Shram)

    def __str__(self):
        return self.name


class TensorPurpose(enum.IntFlag):
    Unknown = 0
    Weights = 1
    FeatureMap = 2
    Scratch = 3
    ScratchFast = 4
    LUT = 5
    FSBias = 6
    Size = 7

    def display_name(self) -> str:
        return ("Unknown", "Weights", "FeatureMap", "Scratch", "ScratchFast", "LUT", "FastStorageBias", "Size")[
            self.value
        ]

    def identifier_name(self) -> str:
        return ("unknown", "weights", "feature_map", "scratch", "scratch_fast", "lut", "fast_storage_bias", "size")[
            self.value
        ]

    @staticmethod
    def all():
        return (TensorPurpose.Weights, TensorPurpose.FeatureMap, TensorPurpose.FSBias)


class TensorSubPurpose(enum.Enum):
    Standard = 0
    DoubleBuffer = 1
    RollingBufferX = 2
    RollingBufferY = 3
    RollingBufferXY = 4

    def display_name(self) -> str:
        return ("Standard", "Double Buffer", "Rolling Buffer X", "Rolling Buffer Y", "Rolling Buffer XY")[self.value]

    def identifier_name(self) -> str:
        return ("standard", "double_buffer", "rolling_buffer_x", "rolling_buffer_y", "rolling_buffer_xy")[self.value]

    @staticmethod
    def all():
        return (
            TensorSubPurpose.Standard,
            TensorSubPurpose.DoubleBuffer,
            TensorSubPurpose.RollingBufferX,
            TensorSubPurpose.RollingBufferY,
            TensorSubPurpose.RollingBufferXY,
        )


class TensorFormat(enum.Flag):
    Unknown = 0
    WeightsCompressed = 1
    NHWC = 2
    NHCWB16 = 3

    def __str__(self):
        return self.name


class TensorBlockTraversal(enum.Enum):
    Default = 0
    DepthWise = 1
    DepthFirst = 2
    PartKernelFirst = 3


def shape_num_elements(shp: Shape) -> Optional[int]:
    elems = 1
    if shp is None:
        return None
    for d in shp:
        if d is None:
            return None
        elems *= d
    return elems


def shape_fully_defined(shp: Shape) -> bool:
    if shp is None:
        return False
    for d in shp:
        if d is None:
            return False
    return True


def shape_round_to_quantum(shp: Shape, quantum: Tuple) -> Shape:
    new_shp = list(shp)

    # Traverse backwards using length of shape since there may be more rounding quantums than shape elements
    for i in range(-1, -len(shp) - 1, -1):
        if new_shp[i] is not None:
            new_shp[i] = numeric_util.round_up(new_shp[i], quantum[i])
    return new_shp
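# Illustrative example (made-up numbers): rounding the shape [1, 5, 7, 31] to
# the quantum (1, 1, 1, 16) gives [1, 5, 7, 32]; each dimension is rounded up
# independently, starting from the innermost one.
#   shape_round_to_quantum([1, 5, 7, 31], (1, 1, 1, 16)) -> [1, 5, 7, 32]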


@lru_cache(maxsize=None)
def create_equivalence_id(key) -> UUID:
    # Generates a fresh equivalence_id the first time a given key is seen;
    # the lru_cache then returns that same id for every later call with the same key.
    return uuid.uuid4()
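# Example (the key here is made up; any hashable key works):
#   create_equivalence_id(("concat", 3)) == create_equivalence_id(("concat", 3))
# holds, so equivalent tensors can be given a shared equivalence_id without
# coordination between call sites.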


class QuantizationParameters:
    __slots__ = (
        "min",
        "max",
        "num_bits",
        "narrow_range",
        "next_after",
        "scale_f32",
        "zero_point",
        "quant_min",
        "quant_max",
        "quant_dim",
    )

    def __init__(
        self,
        min: Union[float, np.ndarray, None] = None,
        max: Union[float, np.ndarray, None] = None,
        num_bits=None,
        narrow_range=None,
    ):
        self.min = min
        self.max = max

        self.num_bits = num_bits
        self.narrow_range = narrow_range

        # Use the 'next after' float value of scale_f32 when converting to scale and shift. It can be combined with
        # natural rounding to perform rounding away from zero. This only affects the ofm scale and bias tensor; it has
        # no effect on global scaling, i.e. the ofm_scale register.
        self.next_after = False
        self.scale_f32: Union[float, np.ndarray, None] = None
        self.zero_point: Union[int, np.ndarray, None] = None
        self.quant_min: Optional[float] = None
        self.quant_max: Optional[float] = None
        self.quant_dim: Optional[int] = None

    def __str__(self):
        return (
            f"<nng.QuantizationParameters min={self.min}, max={self.max}, num_bits={self.num_bits}, "
            f"scale={self.scale_f32}, zero_point={self.zero_point}, next={self.next_after}>"
        )

    __repr__ = __str__

    def clone(self) -> "QuantizationParameters":
        res = QuantizationParameters()
        res.min = self.min
        res.max = self.max

        res.num_bits = self.num_bits
        res.narrow_range = self.narrow_range

        res.next_after = self.next_after
        res.scale_f32 = self.scale_f32
        res.zero_point = self.zero_point
        res.quant_min = self.quant_min
        res.quant_max = self.quant_max
        res.quant_dim = self.quant_dim
        return res

    def dequantize(self, values) -> np.ndarray:
        return np.subtract(values, self.zero_point) * self.scale_f32
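    # Illustrative example (made-up values): with zero_point=128 and
    # scale_f32=0.5, dequantize(np.array([128, 130])) -> array([0.0, 1.0]),
    # i.e. real_value = (quantized_value - zero_point) * scale.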

    def is_scaling_equal(self, other: Optional["QuantizationParameters"]) -> bool:
        """
        Returns True if the scale and zero point of self and other are equal. If other is None then the scaling is
        not considered equal because the tensor is assumed to not be quantised and False will be returned.
        """

        if not isinstance(other, QuantizationParameters):
            return False

        return self.scale_f32 == other.scale_f32 and self.zero_point == other.zero_point

    def is_valid(self) -> bool:
        """Return True if the quantisation parameters have a scale and zero point"""

        return self.scale_f32 is not None and self.zero_point is not None

    def is_per_axis(self) -> bool:
        """Returns True if either the scale, zero point, minimum or maximum values have more than one value"""

        for attr in ("scale_f32", "zero_point", "min", "max"):
            if np.size(getattr(self, attr)) > 1:
                return True
        return False


def create_const_tensor(
    name: str,
    shape: Shape,
    dtype: DataType,
    values: np.ndarray,
    value_dtype: np.dtype = None,
    purpose: TensorPurpose = TensorPurpose.Unknown,
    quantization: QuantizationParameters = None,
):
    # Tensor
    const_tensor = Tensor(shape, dtype, name + "_0")
    const_tensor.purpose = purpose
    const_tensor.quantization = quantization
    const_tensor.values = np.array(values, dtype=value_dtype)
    # Operator
    const_op = Operation(Op.Const, name)
    const_op.set_output_tensor(const_tensor)
    const_op.set_ifm_ofm_shapes()
    return const_tensor
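# Usage sketch (names and values are illustrative only):
#   bias = create_const_tensor("conv1_bias", [1], DataType.int32, [0])
# The returned tensor is driven by a freshly created Op.Const operation, so
# bias.is_const is True and bias.ops[0].type == Op.Const.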


# Class that keeps track of all tensor addresses in the different memory types
class TensorAddressMap:
    address_map: Dict = defaultdict(dict)  # dict (tens.equivalence_id -> dict (mem_type -> address))

    @classmethod
    def get_address_for_tens(cls, tens_id: UUID, mem_type: MemType) -> int:
        return cls.address_map[tens_id].get(mem_type)

    @classmethod
    def set_address_for_tens(cls, tens_id: UUID, mem_type: MemType, address: int):
        # Check previous address if there is one
        previous_address = cls.address_map[tens_id].get(mem_type)
        if address is not None and previous_address is not None:
            assert previous_address == address, "Two different addresses cannot be assigned to the same tensor."

        # Set tensor's address for memory type
        cls.address_map[tens_id][mem_type] = address
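
    # Note: addresses are keyed on equivalence_id rather than on the tensor
    # object, so a tensor and a clone made with clone(set_unique=False) share
    # any address assigned through the Tensor.address property further down.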


@total_ordering
class Tensor:
    __slots__ = (
        "shape",
        "_original_shape",
        "storage_shape",
        "bandwidth_shape",
        "dtype",
        "name",
        "is_variable",
        "pre_buffer",
        "ops",
        "consumer_list",
        "values",
        "compressed_values",
        "compressed_values_substream_offsets",
        "mem_area",
        "mem_type",
        "format",
        "purpose",
        "sub_purpose",
        "alignment",
        "weight_transpose_depthwise",
        "storage_compression_scale",
        "bandwidth_compression_scale",
        "compression_scale_for_worst_weight_stream",
        "weight_compression_scales",
        "weight_compression_config",
        "value_id",
        "storage_rounding_quantum",
        "brick_size",
        "quantization",
        "weight_compressed_offsets",
        "element_size_bytes",
        "block_traversal",
        "equivalence_id",
        "src_tensor",
        "needs_linear_format",
        "ifm_write_protected",
    )
    AllocationQuantum = 16

    def __init__(self, shape: Shape, dtype: DataType, name: str):
        self.shape = shape
        self._original_shape = shape
        self.storage_shape = shape
        self.bandwidth_shape = shape
        self.dtype = dtype
        self.name = name
        self.is_variable = False
        self.pre_buffer = False
        self.equivalence_id: UUID = uuid.uuid4()

        self.ops: List[Operation] = []
        self.consumer_list: List[Operation] = []

        self.values: Optional[np.ndarray] = None  # elements are of type self.dtype
        self.compressed_values: Optional[np.ndarray] = None
        self.compressed_values_substream_offsets: Optional[List] = None
        self.mem_area: MemArea = MemArea.Unknown
        self.mem_type: MemType = MemType.Unknown
        self.format: TensorFormat = TensorFormat.Unknown
        self.purpose: TensorPurpose = TensorPurpose.Unknown
        self.sub_purpose: TensorSubPurpose = TensorSubPurpose.Standard
        self.alignment: int = Tensor.AllocationQuantum
        self.weight_transpose_depthwise: bool = False

        self.storage_compression_scale: float = 1.0
        self.bandwidth_compression_scale: float = 1.0
        self.compression_scale_for_worst_weight_stream: float = 1.0
        self.weight_compression_scales: Optional[np.ndarray] = None
        # if two tensors have the same weight_compression_config, then they have the same compressed values
        self.weight_compression_config = None
        # if two tensors have the same value_id, then they have the same values
        self.value_id: UUID = uuid.uuid4()
        self.weight_compressed_offsets: List = []
        self.storage_rounding_quantum: Tuple = (1, 1, 1, 1)
        self.brick_size: Tuple = (1, 1, 1, 1)
        self.element_size_bytes: int = 0

        # quantization parameters
        self.quantization: Optional[QuantizationParameters] = None
        self.block_traversal: TensorBlockTraversal = TensorBlockTraversal.Default

        self.needs_linear_format = True
        self.ifm_write_protected = False

        # Reference to parent-tensor if this tensor is a clone
        self.src_tensor: Optional[Tensor] = None

    @property
    def original_shape(self):
        return self._original_shape

    @property
    def address(self) -> int:
        return TensorAddressMap.get_address_for_tens(self.equivalence_id, self.mem_type)

    @address.setter
    def address(self, address: int):
        TensorAddressMap.set_address_for_tens(self.equivalence_id, self.mem_type, address)

    @property
    def is_standard_fm(self) -> bool:
        return self.sub_purpose == TensorSubPurpose.Standard and self.purpose == TensorPurpose.FeatureMap

    @property
    def is_const(self) -> bool:
        return self.ops != [] and self.ops[0].type == Op.Const

    @property
    def is_scalar(self) -> bool:
        return self.shape == [] and self.elements() == 1

    def is_broadcast(self, ofm) -> bool:
        return self.shape != ofm.shape

    def element_size(self) -> int:
        if self.element_size_bytes == 0:
            return self.dtype.size_in_bits() // 8
        return self.element_size_bytes
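    # Example: an int16 tensor with element_size_bytes left at 0 reports
    # 16 // 8 = 2 bytes per element.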

    # Returns a copy, renamed to self.name + suffix.
    # The references to Operators will be empty when returned.
    # Depending on set_unique, the copy is shallow or deep.
    # For set_unique==True, a new equivalence_id will be set.
    def clone(self, suffix="_clone", set_unique: bool = False) -> "Tensor":
        res = copy.copy(self)
        if set_unique:
            res.equivalence_id = uuid.uuid4()
        res.storage_shape = list(self.storage_shape)
        res.bandwidth_shape = list(self.bandwidth_shape)
        if self.quantization is not None:
            res.quantization = self.quantization.clone()

        res.name = res.name + suffix
        res.ops = []
        res.consumer_list = []

        return res

    def clone_into_fast_storage(self, arch) -> "Tensor":
        res = self.clone(suffix="_fast_storage")
        res.mem_area = arch.fast_storage_mem_area
        res.mem_type = MemType.Scratch_fast
        res.src_tensor = self
        return res

    def as_1D(self):
        self.shape = [np.prod(self.shape)]
        if self.values is not None:
            self.values = self.values.reshape(self.shape)

    def transpose(self, reorder):
        self.shape = [self.shape[idx] for idx in reorder]
        self._original_shape = [self._original_shape[idx] for idx in reorder]
        if self.values is not None:
            self.values = self.values.transpose(reorder)

    def copy_compressed_weight_info(self, src_tens: "Tensor"):
        # Copies compressed values + all related weight compression info from the given tensor
        self.equivalence_id = src_tens.equivalence_id
        self.compressed_values = src_tens.compressed_values
        self.compressed_values_substream_offsets = src_tens.compressed_values_substream_offsets
        self.storage_shape = src_tens.storage_shape
        self.brick_size = src_tens.brick_size
        self.weight_compression_scales = src_tens.weight_compression_scales
        self.weight_compressed_offsets = src_tens.weight_compressed_offsets
        self.weight_transpose_depthwise = src_tens.weight_transpose_depthwise
        self.compression_scale_for_worst_weight_stream = src_tens.compression_scale_for_worst_weight_stream
        self.storage_compression_scale = src_tens.storage_compression_scale
        self.bandwidth_compression_scale = src_tens.bandwidth_compression_scale
        self.block_traversal = src_tens.block_traversal
        self.weight_compression_config = src_tens.weight_compression_config
        self.value_id = src_tens.value_id

    def set_format(self, fmt: TensorFormat, arch):
        self.format = fmt
        shape_len = 0
        try:
            shape_len = len(self.shape)
        except TypeError:
            pass

        if shape_len > 4:
            return
        assert not (self.needs_linear_format and fmt == TensorFormat.NHCWB16)
        self.storage_rounding_quantum = arch.storage_rounding_quantums[self.format]
        self.storage_rounding_quantum = tuple(self.storage_rounding_quantum[-shape_len:])
        self.brick_size = arch.brick_sizes[self.format]
        self.brick_size = tuple(self.brick_size[-shape_len:])
        if self.shape is None:
            return

        self.bandwidth_shape = shape_round_to_quantum(self.shape, self.brick_size)
        self.storage_shape = shape_round_to_quantum(self.shape, self.storage_rounding_quantum)

        if fmt == TensorFormat.WeightsCompressed:
            compression_ratio = 5 / 8
            self.storage_compression_scale = compression_ratio
            self.bandwidth_compression_scale = compression_ratio
            self.compression_scale_for_worst_weight_stream = compression_ratio

    def storage_elements(self) -> int:
        elems = shape_num_elements(self.storage_shape)
        if elems is None:
            return 0
        return elems

    def elements(self) -> int:
        elems = shape_num_elements(self.shape)
        if elems is None:
            return 0
        return elems

    def has_fully_defined_shape(self) -> bool:
        return shape_fully_defined(self.shape)

    def storage_size(self, scale: float = 1.0) -> int:
        raw_size = self.storage_elements() * self.element_size() * scale
        if raw_size == 0:
            raw_size = 1  # force it to take up space
        rounded_size = numeric_util.round_up(numeric_util.round_up_to_int(raw_size), self.alignment)
        return rounded_size
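    # Worked example (made-up numbers): an int8 tensor with storage_shape
    # [1, 3, 3, 3] occupies 27 raw bytes, which round_up(27, alignment=16)
    # pads to 32 bytes.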

    def storage_size_for_shape(self, op_storage_shape: Shape) -> int:
        elems = shape_num_elements(op_storage_shape)
        elems = elems if elems else 0
        raw_size = elems * self.element_size()
        if raw_size == 0:
            raw_size = 1  # force it to take up space
        rounded_size = numeric_util.round_up(numeric_util.round_up_to_int(raw_size), self.alignment)
        return rounded_size

    def storage_shape_for_sub_purpose(
        self, sub_purpose: TensorSubPurpose, param_a: Optional[int], param_b: Optional[int]
    ) -> Shape:
        if sub_purpose == TensorSubPurpose.DoubleBuffer:
            shp = list(self.shape)
            assert len(shp) >= 2
            assert param_a is not None
            shp[-1] = min(shp[-1], param_a * 2)
        else:
            shp = full_shape(4, self.storage_shape, 1)
            if sub_purpose == TensorSubPurpose.RollingBufferX:
                assert len(shp) == 4
                assert param_a is not None
                shp[0] = 1
                shp[2] = min(shp[2], param_a)
            elif sub_purpose == TensorSubPurpose.RollingBufferY:
                assert len(shp) == 4
                assert param_a is not None
                shp[0] = 1
                shp[1] = min(shp[1], param_a)
            elif sub_purpose == TensorSubPurpose.RollingBufferXY:
                assert len(shp) == 4
                assert param_a is not None
                assert param_b is not None
                shp[0] = 1
                shp[2] = min(shp[2], param_a)
                shp[1] = min(shp[1], param_b)
            elif sub_purpose == TensorSubPurpose.Standard:
                pass
            else:
                assert 0, "did not expect new sub purpose %s" % (sub_purpose,)

        return shp

    def set_new_sub_purpose(self, sub_purpose: TensorSubPurpose, param_a=None, param_b=None):
        self.storage_shape = self.storage_shape_for_sub_purpose(sub_purpose, param_a, param_b)
        self.sub_purpose = sub_purpose
        if sub_purpose == TensorSubPurpose.DoubleBuffer:
            self.storage_compression_scale = self.compression_scale_for_worst_weight_stream

    def bandwidth(self) -> float:
        elems = shape_num_elements(self.bandwidth_shape)
        if elems is None:
            return 0
        return elems * self.element_size() * self.bandwidth_compression_scale

    def consumers(self) -> List[Operation]:
        return self.consumer_list

    def get_4D_storage_shape_for_shape(self, op_shape4D: Shape4D) -> Shape4D:
        rounding_quantum = full_shape(4, list(self.storage_rounding_quantum), 1)
        return Shape4D(shape_round_to_quantum(op_shape4D.as_list(), rounding_quantum))

    def addresses_for_rolling_buffer(
        self, start_coord: Shape, end_coord: Shape, strides: List[int], op_shape4D: Shape4D
    ) -> Tuple:
        # returns ( box_height0, box_height1, box_width, [address_tl, address_tr, address_bl, address_br] )

        if self.storage_shape == []:
            return (
                1,
                1,
                1,
                [self.address_for_coordinate(start_coord, strides, op_shape4D), 0, 0, 0],
            )

        if self.is_standard_fm:
            storage_shape_4D = self.get_4D_storage_shape_for_shape(op_shape4D)
        else:
            storage_shape_4D = Shape4D(self.storage_shape)

        crossing_y = numeric_util.round_up(start_coord[1] + 1, storage_shape_4D.height)
        crossing_x = numeric_util.round_up(start_coord[2] + 1, storage_shape_4D.width)

        crossing_y = min(crossing_y, end_coord[1])
        crossing_x = min(crossing_x, end_coord[2])

        box_height0 = crossing_y - start_coord[1]
        box_width = crossing_x - start_coord[2]

        addresses: List = [0] * 4
        addresses[0] = self.address_for_coordinate(start_coord, strides, op_shape4D)

        if end_coord[2] > crossing_x:
            addresses[1] = self.address_for_coordinate(
                [start_coord[0], start_coord[1], crossing_x, start_coord[3]], strides, op_shape4D
            )
            raise UnsupportedFeatureError("Striping in vertical direction is not supported")
        if end_coord[1] > crossing_y:
            addresses[2] = self.address_for_coordinate(
                [start_coord[0], crossing_y, start_coord[2], start_coord[3]], strides, op_shape4D
            )
        if end_coord[1] > crossing_y and end_coord[2] > crossing_x:
            addresses[3] = self.address_for_coordinate(
                [start_coord[0], crossing_y, crossing_x, start_coord[3]], strides, op_shape4D
            )

        return box_height0, box_height0, box_width, addresses

    def get_strides(self, shape4D: Optional[Shape4D]) -> List[int]:

        augmented_shape = self.get_augmented_shape(shape4D)
        assert len(augmented_shape) == 5
        strides: List = [0] * len(augmented_shape)
        stride = self.element_size() * self.storage_compression_scale

        if self.format != TensorFormat.NHCWB16:
            stride_order = [4, 1, 3, 2, 0]
            for i in stride_order:
                strides[i] = stride
                stride *= augmented_shape[i]
        else:
            strides[4] = stride
            strides[3] = 16 * stride  # STRIDE_X
            strides[1] = strides[3] * augmented_shape[2]  # STRIDE_C
            strides[2] = augmented_shape[2] * augmented_shape[3] * stride  # STRIDE_Y
            strides[0] = strides[2] * augmented_shape[1]  # STRIDE_N

        return strides
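    # Worked example (made-up shape): for an NHWC int8 feature map with
    # augmented shape [1, 4, 2, 3, 1] (N, C, H, W, 1), the loop above gives
    # strides [24, 1, 12, 4, 1]: 1 byte per channel step, C=4 bytes per width
    # step, C*W=12 bytes per height step and C*W*H=24 bytes per batch step.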

    def get_augmented_shape(self, shape4D: Optional[Shape4D] = None) -> Optional[Shape]:

        if shape4D and self.is_standard_fm:
            augmented_shape = self.get_4D_storage_shape_for_shape(shape4D).as_list()
        else:
            augmented_shape = full_shape(4, self.storage_shape, 1)

        if self.format == TensorFormat.NHWC:
            augmented_shape = [augmented_shape[0], augmented_shape[3]] + augmented_shape[1:3] + [1]

        elif self.format == TensorFormat.NHCWB16:
            augmented_shape = augmented_shape[0:4] + [1]

            if augmented_shape[1] == 0:
                augmented_shape[1] = 1

        else:
            assert self.format in (TensorFormat.Unknown, TensorFormat.WeightsCompressed)
            return None

        return augmented_shape

    def get_augmented_coord(self, coord: Optional[Shape] = None) -> Optional[Shape]:
        if coord is None:
            coord = [0] * min(len(self.storage_shape), 4)

        missing_len = 4 - len(coord)
        augmented_coord = ([0] * missing_len) + coord

        if self.format == TensorFormat.NHWC:
            augmented_coord = [augmented_coord[0], augmented_coord[3]] + augmented_coord[1:3] + [0]

        elif self.format == TensorFormat.NHCWB16:
            channel_divisor = 16
            augmented_coord = (
                [augmented_coord[0], augmented_coord[3] // channel_divisor]
                + augmented_coord[1:3]
                + [augmented_coord[3] % channel_divisor]
            )
        else:
            assert self.format in (TensorFormat.Unknown, TensorFormat.WeightsCompressed)
            return None

        return augmented_coord
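    # Example (made-up coordinate): in NHCWB16 an (N, H, W, C) coordinate
    # [0, 2, 3, 21] maps to [0, 21 // 16, 2, 3, 21 % 16] = [0, 1, 2, 3, 5];
    # the channel index is split into a 16-channel brick index and an offset
    # within the brick.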

    def find_npu_op(self) -> Optional[Operation]:
        # Returns the NPU operator that uses this tensor
        for op in self.consumers():
            if op.run_on_npu:
                return op
        return None

    def compressed_stream_index_from_coord(self, coord: Shape) -> int:
        assert self.format == TensorFormat.WeightsCompressed
        assert self.compressed_values is not None
        assert len(self.compressed_values) > 0
        assert len(self.compressed_values) + 1 == len(self.weight_compressed_offsets)

        depth = coord[-1]
        brick_depth = self.brick_size[-1]
        # Clamp position at final element index
        if depth > self.shape[-1]:
            depth = self.shape[-1]

        # Always round up to next boundary
        index = numeric_util.round_up_divide(depth, brick_depth)

        # Check boundaries on all but last weight set (which may be shorter
        # than the brick we divided it up into)
        if index < len(self.weight_compressed_offsets) - 1:
            # There are no half-way points in the weights
            if (depth % brick_depth) != 0:
                raise UnsupportedFeatureError("Offset into weights must be aligned to a brick")

        return index

    def size_of_compressed_stream(self, index: int) -> int:
        assert self.compressed_values is not None
        assert 0 <= index < len(self.compressed_values)
        return len(self.compressed_values[index])

    def is_last_index_in_compressed_stream(self, index: int) -> bool:
        assert self.compressed_values is not None
        assert 0 <= index < len(self.compressed_values)
        return index == len(self.compressed_values) - 1

    def address_for_coordinate(
        self,
        orig_coord: Shape,
        strides: Optional[List[int]] = None,
        op_shape4D: Optional[Shape4D] = None,
        is_top_box: bool = False,
    ) -> Optional[int]:

        address_offset = 0
        assert self.purpose != TensorPurpose.Weights

        # Strides may be passed as an argument, for example when creating feature maps as the strides may be modified
        # by the "ofm_stride_multiplier" operation attribute. If not, they are calculated here.
        if not strides:
            strides = self.get_strides(op_shape4D)

        coord = orig_coord
        if is_top_box:
            coord = [c - 1 for c in orig_coord]
            address_offset += 1 * strides[-1]  # one element

        if self.sub_purpose == TensorSubPurpose.Standard:
            shape = op_shape4D.as_list() if op_shape4D else self.shape
            for _coord, _shape in zip(coord, shape):
                assert _coord >= 0 and _coord < _shape

        if op_shape4D and self.is_standard_fm:
            storage_shape = self.get_4D_storage_shape_for_shape(op_shape4D).as_list()
            storage_size = self.storage_size_for_shape(storage_shape)
        else:
            storage_shape = self.storage_shape
            coord = coord[-len(storage_shape) :]
            storage_size = self.storage_size()

        # Handle wraparound for partial buffers. Make sure to do this after subtracting top box
        coord = [_coord % _shape for _coord, _shape in zip(coord, storage_shape)]

        augmented_coord = self.get_augmented_coord(coord)
        assert augmented_coord is not None

        address_offset += np.dot(augmented_coord, strides)

        assert address_offset >= 0 and address_offset <= storage_size
        return self.address + address_offset
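    # Worked example (all numbers made up): reusing the NHWC strides
    # [24, 1, 12, 4, 1] from the get_strides example, coordinate [0, 1, 2, 3]
    # augments to [0, 3, 1, 2, 0], so the dot product adds
    # 3*1 + 1*12 + 2*4 = 23 bytes to the tensor's base address.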

    def is_allocated_in_tensor_arena(self, scratch_tensor_mem_area: MemArea) -> bool:
        return (self.mem_area == scratch_tensor_mem_area) and (self.mem_type in (MemType.Scratch, MemType.Scratch_fast))

    def equivalent(self, tens: "Tensor") -> bool:
        return self.equivalence_id == tens.equivalence_id

    def set_all_shapes(self, shape: Shape):
        self.shape = shape
        self.storage_shape = shape
        self.bandwidth_shape = shape

    def get_full_shape(self) -> Shape:
        d = len(self.shape)
        if d in (1, 3):
            return full_shape(4, self.shape, 1)
        elif d == 2:
            return [self.shape[0], 1, 1, self.shape[1]]
        else:
            return self.shape.copy()
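    # Examples: [10] -> [1, 1, 1, 10], [2, 3] -> [2, 1, 1, 3] and
    # [2, 3, 4] -> [1, 2, 3, 4]; shapes that are already 4D are returned
    # as a copy.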

    def is_quantized(self) -> bool:
        # a tensor is quantized if it has an integral type and it contains valid quantization params

        if not isinstance(self.quantization, QuantizationParameters):
            return False

        return (self.dtype.type & BaseType.Int) != 0 and self.quantization.is_valid()

    def get_scalar(self):
        """
        return: Unquantized or dequantized scalar value
        rtype: self.dtype (if unquantized) or float (if dequantized)
        """
        assert self.values.size == 1, "get_scalar called on non-scalar tensor"
        if self.is_quantized():
            return self.quantization.dequantize(self.values).item(0)
        else:
            return self.values.item(0)

    def get_shape_as_2d(self, dimension_2_size: int) -> Optional[Shape4D]:

        elms = self.elements()
        dimension_1_size = elms // dimension_2_size
        # Checks if the reduction works and shape is not 1D
        is_reducible = dimension_1_size * dimension_2_size == elms and not (len(self.shape) == 1)

        new_shape = None
        if is_reducible:
            new_shape = Shape4D([dimension_1_size, 1, 1, dimension_2_size])

        return new_shape
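    # Example (made-up shape): a [2, 3, 4] tensor (24 elements) with
    # dimension_2_size=4 becomes Shape4D([6, 1, 1, 4]); with
    # dimension_2_size=5 the 24 elements do not divide evenly, so None is
    # returned.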

    def __lt__(self, other: "Tensor") -> bool:
        return self.equivalence_id < other.equivalence_id

    def __str__(self):
        return "<nng.Tensor '%s' shape=%s dtype=%s>" % (self.name, self.shape, self.dtype)

    __repr__ = __str__

    def error(self, msg):
        """
        Raises a VelaError exception for errors encountered when parsing a Tensor

        :param self: Tensor object that resulted in the error
        :param msg: str object that contains a description of the specific error encountered
        """

        def _print_operators(ops):
            lines = []
            for idx, op in enumerate(ops):
                op_type = getattr(op, "type", "Not an Operation")
                op_id = getattr(op, "op_index", "-")
                lines.append(f"   {idx} = {op_type} ({op_id})")
            return lines

        lines = [f"Invalid {self.name} tensor. {msg}"]

        lines += ["   Driving operators:"]
        lines += _print_operators(self.ops)

        lines += ["   Consuming operators:"]
        lines += _print_operators(self.consumer_list)

        raise VelaError("\n".join(lines))


def check_quantized_tens_scaling_equal(tens_a: Tensor, tens_b: Tensor) -> bool:
    # Checks that the scaling of two quantized tensors is equal

    return tens_a.is_quantized() and tens_b.is_quantized() and tens_a.quantization.is_scaling_equal(tens_b.quantization)