# Copyright (C) 2020-2022 Arm Limited or its affiliates. All rights reserved.
#
# SPDX-License-Identifier: Apache-2.0
#
# Licensed under the Apache License, Version 2.0 (the License); you may
# not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an AS IS BASIS, WITHOUT
# WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
# Description:
# Internal representation of a Neural Network Tensor.
import copy
import enum
import uuid
from collections import defaultdict
from enum import auto
from functools import lru_cache
from functools import total_ordering
from typing import Dict
from typing import List
from typing import Optional
from typing import Tuple
from typing import Union
from uuid import UUID

import numpy as np

from . import numeric_util
from .data_type import BaseType
from .data_type import DataType
from .errors import UnsupportedFeatureError
from .errors import VelaError
from .numeric_util import full_shape
from .operation import Op
from .operation import Operation
from .shape4d import Shape4D

Shape = List


class MemType(enum.IntFlag):
    Unknown = 0
    Permanent_NPU = 1
    Permanent_CPU = 2
    Scratch = 3
    Scratch_fast = 4
    Size = Scratch_fast + 1

    def display_name(self) -> str:
        return ("Unknown", "Permanent_NPU", "Permanent_CPU", "Scratch", "Scratch_fast", "Size")[self.value]

    def identifier_name(self) -> str:
        return ("unknown", "permanent_npu", "permanent_cpu", "scratch", "scratch_fast", "size")[self.value]

    @staticmethod
    def all():
        return (MemType.Permanent_NPU, MemType.Permanent_CPU, MemType.Scratch, MemType.Scratch_fast)

    def __str__(self):
        return self.name


class BandwidthDirection(enum.IntEnum):
    Read = 0
    Write = auto()
    Size = auto()

    def display_name(self):
        return self.name

    def identifier_name(self):
        return self.name.lower()

    @staticmethod
    def all():
        return (BandwidthDirection.Read, BandwidthDirection.Write)


class MemArea(enum.IntFlag):
    Unknown = 0
    Sram = 1
    Dram = 2
    OnChipFlash = 3
    OffChipFlash = 4
    Shram = 5  # for LUT
    Size = Shram + 1

    def display_name(self) -> str:
        return ("Unknown", "SRAM", "DRAM", "On-chip Flash", "Off-chip Flash", "SHRAM", "Size")[self.value]

    def identifier_name(self) -> str:
        return ("unknown", "sram", "dram", "on_chip_flash", "off_chip_flash", "shram", "size")[self.value]

    @staticmethod
    def all():
        return (MemArea.Sram, MemArea.Dram, MemArea.OnChipFlash, MemArea.OffChipFlash, MemArea.Shram)

    def __str__(self):
        return self.name


class TensorPurpose(enum.IntFlag):
    Unknown = 0
    Weights = 1
    FeatureMap = 2
    Scratch = 3
    ScratchFast = 4
    LUT = 5
    FSBias = 6
    Size = 7

    def display_name(self) -> str:
        return ("Unknown", "Weights", "FeatureMap", "Scratch", "ScratchFast", "LUT", "FastStorageBias", "Size")[
            self.value
        ]

    def identifier_name(self) -> str:
        return ("unknown", "weights", "feature_map", "scratch", "scratch_fast", "lut", "fast_storage_bias", "size")[
            self.value
        ]

    @staticmethod
    def all():
        return (TensorPurpose.Weights, TensorPurpose.FeatureMap, TensorPurpose.FSBias)


class TensorSubPurpose(enum.Enum):
    Standard = 0
    DoubleBuffer = 1
    RollingBufferX = 2
    RollingBufferY = 3
    RollingBufferXY = 4

    def display_name(self) -> str:
        return ("Standard", "Double Buffer", "Rolling Buffer X", "Rolling Buffer Y", "Rolling Buffer XY")[self.value]

    def identifier_name(self) -> str:
        return ("standard", "double_buffer", "rolling_buffer_x", "rolling_buffer_y", "rolling_buffer_xy")[self.value]

    @staticmethod
    def all():
        return (
            TensorSubPurpose.Standard,
            TensorSubPurpose.DoubleBuffer,
            TensorSubPurpose.RollingBufferX,
            TensorSubPurpose.RollingBufferY,
            TensorSubPurpose.RollingBufferXY,
        )


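# Illustrative note: NHCWB16 is the Ethos-U "brick" feature map format, in which
# the channel axis is stored in bricks of 16 elements (see get_augmented_coord
# and get_strides below).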
class TensorFormat(enum.Flag):
    Unknown = 0
    WeightsCompressed = 1
    NHWC = 2
    NHCWB16 = 3

    def __str__(self):
        return self.name


class TensorBlockTraversal(enum.Enum):
    Default = 0
    DepthWise = 1
    DepthFirst = 2
    PartKernelFirst = 3


def shape_num_elements(shp: Shape) -> Optional[int]:
    elems = 1
    if shp is None:
        return None
    for d in shp:
        if d is None:
            return None
        elems *= d
    return elems


def shape_fully_defined(shp: Shape) -> bool:
    if shp is None:
        return False
    for d in shp:
        if d is None:
            return False
    return True


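# Example (illustrative): shape_round_to_quantum([1, 5, 5, 17], (1, 1, 1, 16))
# returns [1, 5, 5, 32].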
def shape_round_to_quantum(shp: Shape, quantum: Tuple) -> Shape:
    new_shp = list(shp)

    # Traverse backwards using length of shape since there may be more rounding quantums than shape elements
    for i in range(-1, -len(shp) - 1, -1):
        if new_shp[i] is not None:
            new_shp[i] = numeric_util.round_up(new_shp[i], quantum[i])
    return new_shp


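# Illustrative note: because of the lru_cache below, equal keys map to the same
# generated UUID, while distinct keys get independent random UUIDs.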
@lru_cache(maxsize=None)
def create_equivalence_id(key) -> UUID:
    # Generates equivalence_id based on the given key.
    return uuid.uuid4()


class QuantizationParameters:
    __slots__ = (
        "min",
        "max",
        "num_bits",
        "narrow_range",
        "next_after",
        "scale_f32",
        "zero_point",
        "quant_min",
        "quant_max",
        "quant_dim",
    )

    def __init__(
        self,
        min: Union[float, np.ndarray, None] = None,
        max: Union[float, np.ndarray, None] = None,
        num_bits=None,
        narrow_range=None,
    ):
        self.min = min
        self.max = max

        self.num_bits = num_bits
        self.narrow_range = narrow_range

        # Use the 'next after' float value of scale_f32 when converting to scale and shift. It can be combined with
        # natural rounding to perform rounding away from zero. This only affects the ofm scale and bias tensor, it has
        # no effect on global scaling i.e. the ofm_scale register
        self.next_after = False
        self.scale_f32: Union[float, np.ndarray, None] = None
        self.zero_point: Union[int, np.ndarray, None] = None
        self.quant_min: Optional[float] = None
        self.quant_max: Optional[float] = None
        self.quant_dim: Optional[int] = None

    def __str__(self):
        return (
            f"<nng.QuantizationParameters min={self.min}, max={self.max}, num_bits={self.num_bits}, "
            f"scale={self.scale_f32}, zero_point={self.zero_point}, next={self.next_after}>"
        )

    __repr__ = __str__

    def clone(self) -> "QuantizationParameters":
        res = QuantizationParameters()
        res.min = self.min
        res.max = self.max

        res.num_bits = self.num_bits
        res.narrow_range = self.narrow_range

        res.next_after = self.next_after
        res.scale_f32 = self.scale_f32
        res.zero_point = self.zero_point
        res.quant_min = self.quant_min
        res.quant_max = self.quant_max
        res.quant_dim = self.quant_dim
        return res

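    # Example (illustrative): with zero_point=128 and scale_f32=0.5,
    # dequantize([0, 128, 255]) returns [-64.0, 0.0, 63.5].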
    def dequantize(self, values) -> np.ndarray:
        return np.subtract(values, self.zero_point) * self.scale_f32

    def is_scaling_equal(self, other: Optional["QuantizationParameters"]) -> bool:
        """
        Returns True if the scale and zero point of self and other are equal. If other is None then the scaling is
        not considered equal because the tensor is assumed to not be quantised and False will be returned
        """

        if not isinstance(other, QuantizationParameters):
            return False

        return self.scale_f32 == other.scale_f32 and self.zero_point == other.zero_point

    def is_valid(self) -> bool:
        """Return True if the quantisation parameters have a scale and zero point"""

        return self.scale_f32 is not None and self.zero_point is not None

    def is_per_axis(self) -> bool:
        """Returns True if either the scale, zero point, minimum or maximum values have more than one value"""

        for attr in ("scale_f32", "zero_point", "min", "max"):
            if np.size(getattr(self, attr)) > 1:
                return True
        return False


def create_const_tensor(
    name: str,
    shape: Shape,
    dtype: DataType,
    values: np.ndarray,
    value_dtype: np.dtype = None,
    purpose: TensorPurpose = TensorPurpose.Unknown,
    quantization: QuantizationParameters = None,
):
    # Tensor
    const_tensor = Tensor(shape, dtype, name + "_0")
    const_tensor.purpose = purpose
    const_tensor.quantization = quantization
    const_tensor.values = np.array(values, dtype=value_dtype)
    # Operator
    const_op = Operation(Op.Const, name)
    const_op.set_output_tensor(const_tensor)
    const_op.set_ifm_ofm_shapes()
    return const_tensor

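# Example usage (illustrative; tensor name and values are hypothetical):
#   zero = create_const_tensor("zero", [1], DataType.int32, np.array([0]),
#                              purpose=TensorPurpose.FSBias)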

# class that keeps track of all tensor addresses in the different memory types
class TensorAddressMap:
    address_map: Dict = defaultdict(dict)  # dict (tens.equivalence_id -> dict (mem_type -> address))

    @classmethod
    def get_address_for_tens(cls, tens_id: UUID, mem_type: MemType) -> int:
        return cls.address_map[tens_id].get(mem_type)

    @classmethod
    def set_address_for_tens(cls, tens_id: UUID, mem_type: MemType, address: int):
        # Check previous address if there is one
        previous_address = cls.address_map[tens_id].get(mem_type)
        if address is not None and previous_address is not None:
            assert previous_address == address, "Two different addresses cannot be assigned to the same tensor."

        # Set tensor's address for memory type
        cls.address_map[tens_id][mem_type] = address


@total_ordering
class Tensor:
    __slots__ = (
        "shape",
        "_original_shape",
        "storage_shape",
        "bandwidth_shape",
        "dtype",
        "name",
        "is_variable",
        "pre_buffer",
        "ops",
        "consumer_list",
        "values",
        "compressed_values",
        "compressed_values_substream_offsets",
        "mem_area",
        "mem_type",
        "format",
        "purpose",
        "sub_purpose",
        "alignment",
        "weight_transpose_depthwise",
        "storage_compression_scale",
        "bandwidth_compression_scale",
        "compression_scale_for_worst_weight_stream",
        "weight_compression_scales",
        "weight_compression_config",
        "value_id",
        "storage_rounding_quantum",
        "brick_size",
        "quantization",
        "weight_compressed_offsets",
        "element_size_bytes",
        "block_traversal",
        "equivalence_id",
        "src_tensor",
        "needs_linear_format",
        "ifm_write_protected",
    )
    AllocationQuantum = 16

    def __init__(self, shape: Shape, dtype: DataType, name: str):
        self.shape = shape
        self._original_shape = shape
        self.storage_shape = shape
        self.bandwidth_shape = shape
        self.dtype = dtype
        self.name = name
        self.is_variable = False
        self.pre_buffer = False
        self.equivalence_id: UUID = uuid.uuid4()

        self.ops: List[Operation] = []
        self.consumer_list: List[Operation] = []

        self.values: Optional[np.ndarray] = None  # elements are of type self.dtype
        self.compressed_values: Optional[np.ndarray] = None
        self.compressed_values_substream_offsets: Optional[List] = None
        self.mem_area: MemArea = MemArea.Unknown
        self.mem_type: MemType = MemType.Unknown
        self.format: TensorFormat = TensorFormat.Unknown
        self.purpose: TensorPurpose = TensorPurpose.Unknown
        self.sub_purpose: TensorSubPurpose = TensorSubPurpose.Standard
        self.alignment: int = Tensor.AllocationQuantum
        self.weight_transpose_depthwise: bool = False

        self.storage_compression_scale: float = 1.0
        self.bandwidth_compression_scale: float = 1.0
        self.compression_scale_for_worst_weight_stream: float = 1.0
        self.weight_compression_scales: Optional[np.ndarray] = None
        # if two tensors have the same weight_compression_config, then they have the same compressed values
        self.weight_compression_config = None
        # if two tensors have the same value_id, then they have the same values
        self.value_id: UUID = uuid.uuid4()
        self.weight_compressed_offsets: List = []
        self.storage_rounding_quantum: Tuple = (1, 1, 1, 1)
        self.brick_size: Tuple = (1, 1, 1, 1)
        self.element_size_bytes: int = 0

        # quantization parameters
        self.quantization: Optional[QuantizationParameters] = None
        self.block_traversal: TensorBlockTraversal = TensorBlockTraversal.Default

        self.needs_linear_format = True
        self.ifm_write_protected = False

        # Reference to parent-tensor if this tensor is a clone
        self.src_tensor: Optional[Tensor] = None

    @property
    def original_shape(self):
        return self._original_shape

    @property
    def address(self) -> int:
        return TensorAddressMap.get_address_for_tens(self.equivalence_id, self.mem_type)

    @address.setter
    def address(self, address: int):
        TensorAddressMap.set_address_for_tens(self.equivalence_id, self.mem_type, address)

    @property
    def is_standard_fm(self) -> bool:
        return self.sub_purpose == TensorSubPurpose.Standard and self.purpose == TensorPurpose.FeatureMap

    @property
    def is_const(self) -> bool:
        return self.ops != [] and self.ops[0].type == Op.Const

    @property
    def is_scalar(self) -> bool:
        return self.shape == [] and self.elements() == 1

    def is_broadcast(self, ofm) -> bool:
        return self.shape != ofm.shape

    def element_size(self) -> int:
        if self.element_size_bytes == 0:
            return self.dtype.size_in_bits() // 8
        return self.element_size_bytes

    # Returns a copy, renamed to self.name + suffix
    # The references to Operators will be empty when returned
    # Depending on set_unique, the copy is shallow, or deep
    # For set_unique==True, a new equivalence_id will be set
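    # Example (illustrative): tens.clone("_copy") returns a copy that shares
    # tens's values, while tens.clone(set_unique=True) also gets a fresh
    # equivalence_id.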
    def clone(self, suffix="_clone", set_unique: bool = False) -> "Tensor":
        res = copy.copy(self)
        if set_unique:
            res.equivalence_id = uuid.uuid4()
        res.storage_shape = list(self.storage_shape)
        res.bandwidth_shape = list(self.bandwidth_shape)
        if self.quantization is not None:
            res.quantization = self.quantization.clone()

        res.name = res.name + suffix
        res.ops = []
        res.consumer_list = []

        return res

    def clone_into_fast_storage(self, arch) -> "Tensor":
        res = self.clone(suffix="_fast_storage")
        res.mem_area = arch.fast_storage_mem_area
        res.mem_type = MemType.Scratch_fast
        res.src_tensor = self
        return res

    def as_1D(self):
        self.shape = [np.prod(self.shape)]
        if self.values is not None:
            self.values = self.values.reshape(self.shape)

    def transpose(self, reorder):
        self.shape = [self.shape[idx] for idx in reorder]
        self._original_shape = [self._original_shape[idx] for idx in reorder]
        if self.values is not None:
            self.values = self.values.transpose(reorder)

    def copy_compressed_weight_info(self, src_tens: "Tensor"):
        # Copies compressed values + all related weight compression info from the given tensor
        self.equivalence_id = src_tens.equivalence_id
        self.compressed_values = src_tens.compressed_values
        self.compressed_values_substream_offsets = src_tens.compressed_values_substream_offsets
        self.storage_shape = src_tens.storage_shape
        self.brick_size = src_tens.brick_size
        self.weight_compression_scales = src_tens.weight_compression_scales
        self.weight_compressed_offsets = src_tens.weight_compressed_offsets
        self.weight_transpose_depthwise = src_tens.weight_transpose_depthwise
        self.compression_scale_for_worst_weight_stream = src_tens.compression_scale_for_worst_weight_stream
        self.storage_compression_scale = src_tens.storage_compression_scale
        self.bandwidth_compression_scale = src_tens.bandwidth_compression_scale
        self.block_traversal = src_tens.block_traversal
        self.weight_compression_config = src_tens.weight_compression_config
        self.value_id = src_tens.value_id

    def set_format(self, fmt: TensorFormat, arch):
        self.format = fmt
        shape_len = 0
        try:
            shape_len = len(self.shape)
        except TypeError:
            pass

        if shape_len > 4:
            return
        assert not (self.needs_linear_format and fmt == TensorFormat.NHCWB16)
        self.storage_rounding_quantum = arch.storage_rounding_quantums[self.format]
        self.storage_rounding_quantum = tuple(self.storage_rounding_quantum[-shape_len:])
        self.brick_size = arch.brick_sizes[self.format]
        self.brick_size = tuple(self.brick_size[-shape_len:])
        if self.shape is None:
            return

        self.bandwidth_shape = shape_round_to_quantum(self.shape, self.brick_size)
        self.storage_shape = shape_round_to_quantum(self.shape, self.storage_rounding_quantum)

        if fmt == TensorFormat.WeightsCompressed:
            compression_ratio = 5 / 8
            self.storage_compression_scale = compression_ratio
            self.bandwidth_compression_scale = compression_ratio
            self.compression_scale_for_worst_weight_stream = compression_ratio

    def storage_elements(self) -> int:
        elems = shape_num_elements(self.storage_shape)
        if elems is None:
            return 0
        return elems

    def elements(self) -> int:
        elems = shape_num_elements(self.shape)
        if elems is None:
            return 0
        return elems

    def has_fully_defined_shape(self) -> bool:
        return shape_fully_defined(self.shape)

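    # Example (illustrative): 10 int8 elements with the default 16-byte
    # alignment give storage_size() == 16.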
    def storage_size(self, scale: float = 1.0) -> int:
        raw_size = self.storage_elements() * self.element_size() * scale
        if raw_size == 0:
            raw_size = 1  # force it to take up space
        rounded_size = numeric_util.round_up(numeric_util.round_up_to_int(raw_size), self.alignment)
        return rounded_size

    def storage_size_for_shape(self, op_storage_shape: Shape) -> int:
        elems = shape_num_elements(op_storage_shape)
        elems = elems if elems else 0
        raw_size = elems * self.element_size()
        if raw_size == 0:
            raw_size = 1  # force it to take up space
        rounded_size = numeric_util.round_up(numeric_util.round_up_to_int(raw_size), self.alignment)
        return rounded_size

    def storage_shape_for_sub_purpose(
        self, sub_purpose: TensorSubPurpose, param_a: Optional[int], param_b: Optional[int]
    ) -> Shape:
        if sub_purpose == TensorSubPurpose.DoubleBuffer:
            shp = list(self.shape)
            assert len(shp) >= 2
            assert param_a is not None
            shp[-1] = min(shp[-1], param_a * 2)
        else:
            shp = full_shape(4, self.storage_shape, 1)
            if sub_purpose == TensorSubPurpose.RollingBufferX:
                assert len(shp) == 4
                assert param_a is not None
                shp[0] = 1
                shp[2] = min(shp[2], param_a)
            elif sub_purpose == TensorSubPurpose.RollingBufferY:
                assert len(shp) == 4
                assert param_a is not None
                shp[0] = 1
                shp[1] = min(shp[1], param_a)
            elif sub_purpose == TensorSubPurpose.RollingBufferXY:
                assert len(shp) == 4
                assert param_a is not None
                assert param_b is not None
                shp[0] = 1
                shp[2] = min(shp[2], param_a)
                shp[1] = min(shp[1], param_b)
            elif sub_purpose == TensorSubPurpose.Standard:
                pass
            else:
                assert 0, "did not expect new sub purpose %s" % (sub_purpose,)

        return shp

    def set_new_sub_purpose(self, sub_purpose: TensorSubPurpose, param_a=None, param_b=None):
        self.storage_shape = self.storage_shape_for_sub_purpose(sub_purpose, param_a, param_b)
        self.sub_purpose = sub_purpose
        if sub_purpose == TensorSubPurpose.DoubleBuffer:
            self.storage_compression_scale = self.compression_scale_for_worst_weight_stream

    def bandwidth(self) -> float:
        elems = shape_num_elements(self.bandwidth_shape)
        if elems is None:
            return 0
        return elems * self.element_size() * self.bandwidth_compression_scale

    def consumers(self) -> List[Operation]:
        return self.consumer_list

    def get_4D_storage_shape_for_shape(self, op_shape4D: Shape4D) -> Shape4D:
        rounding_quantum = full_shape(4, list(self.storage_rounding_quantum), 1)
        return Shape4D(shape_round_to_quantum(op_shape4D.as_list(), rounding_quantum))

    def addresses_for_rolling_buffer(
        self, start_coord: Shape, end_coord: Shape, strides: List[int], op_shape4D: Shape4D
    ) -> Tuple:
        # returns ( box_height0, box_height1, box_width, [address_tl, address_tr, address_bl, address_br] )

        if self.storage_shape == []:
            return (
                1,
                1,
                1,
                [self.address_for_coordinate(start_coord, strides, op_shape4D), 0, 0, 0],
            )

        if self.is_standard_fm:
            storage_shape_4D = self.get_4D_storage_shape_for_shape(op_shape4D)
        else:
            storage_shape_4D = Shape4D(self.storage_shape)

        crossing_y = numeric_util.round_up(start_coord[1] + 1, storage_shape_4D.height)
        crossing_x = numeric_util.round_up(start_coord[2] + 1, storage_shape_4D.width)

        crossing_y = min(crossing_y, end_coord[1])
        crossing_x = min(crossing_x, end_coord[2])

        box_height0 = crossing_y - start_coord[1]
        box_width = crossing_x - start_coord[2]

        addresses: List = [0] * 4
        addresses[0] = self.address_for_coordinate(start_coord, strides, op_shape4D)

        if end_coord[2] > crossing_x:
            addresses[1] = self.address_for_coordinate(
                [start_coord[0], start_coord[1], crossing_x, start_coord[3]], strides, op_shape4D
            )
            raise UnsupportedFeatureError("Striping in vertical direction is not supported")
        if end_coord[1] > crossing_y:
            addresses[2] = self.address_for_coordinate(
                [start_coord[0], crossing_y, start_coord[2], start_coord[3]], strides, op_shape4D
            )
        if end_coord[1] > crossing_y and end_coord[2] > crossing_x:
            addresses[3] = self.address_for_coordinate(
                [start_coord[0], crossing_y, crossing_x, start_coord[3]], strides, op_shape4D
            )

        return box_height0, box_height0, box_width, addresses

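    # Illustrative note: strides are computed over the 5-element augmented
    # shape from get_augmented_shape(); e.g. in NHCWB16 format a step of one
    # in W advances 16 elements (one brick) in memory.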
    def get_strides(self, shape4D: Optional[Shape4D]) -> List[int]:

        augmented_shape = self.get_augmented_shape(shape4D)
        assert len(augmented_shape) == 5
        strides: List = [0] * len(augmented_shape)
        stride = self.element_size() * self.storage_compression_scale

        if self.format != TensorFormat.NHCWB16:
            stride_order = [4, 1, 3, 2, 0]
            for i in stride_order:
                strides[i] = stride
                stride *= augmented_shape[i]
        else:
            strides[4] = stride
            strides[3] = 16 * stride  # STRIDE_X
            strides[1] = strides[3] * augmented_shape[2]  # STRIDE_C
            strides[2] = augmented_shape[2] * augmented_shape[3] * stride  # STRIDE_Y
            strides[0] = strides[2] * augmented_shape[1]  # STRIDE_N

        return strides

    def get_augmented_shape(self, shape4D: Optional[Shape4D] = None) -> Optional[Shape]:

        if shape4D and self.is_standard_fm:
            augmented_shape = self.get_4D_storage_shape_for_shape(shape4D).as_list()
        else:
            augmented_shape = full_shape(4, self.storage_shape, 1)

        if self.format == TensorFormat.NHWC:
            augmented_shape = [augmented_shape[0], augmented_shape[3]] + augmented_shape[1:3] + [1]

        elif self.format == TensorFormat.NHCWB16:
            augmented_shape = augmented_shape[0:4] + [1]

            if augmented_shape[1] == 0:
                augmented_shape[1] = 1

        else:
            assert self.format in (TensorFormat.Unknown, TensorFormat.WeightsCompressed)
            return None

        return augmented_shape

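    # Example (illustrative): in NHCWB16 format the NHWC coordinate
    # [0, 2, 3, 21] maps to the augmented coordinate [0, 1, 2, 3, 5],
    # since 21 == 1 * 16 + 5.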
    def get_augmented_coord(self, coord: Optional[Shape] = None) -> Optional[Shape]:
        if coord is None:
            coord = [0] * min(len(self.storage_shape), 4)

        missing_len = 4 - len(coord)
        augmented_coord = ([0] * missing_len) + coord

        if self.format == TensorFormat.NHWC:
            augmented_coord = [augmented_coord[0], augmented_coord[3]] + augmented_coord[1:3] + [0]

        elif self.format == TensorFormat.NHCWB16:
            channel_divisor = 16
            augmented_coord = (
                [augmented_coord[0], augmented_coord[3] // channel_divisor]
                + augmented_coord[1:3]
                + [augmented_coord[3] % channel_divisor]
            )
        else:
            assert self.format in (TensorFormat.Unknown, TensorFormat.WeightsCompressed)
            return None

        return augmented_coord

    def find_npu_op(self) -> Optional[Operation]:
        # Returns the NPU operator that uses this tensor
        for op in self.consumers():
            if op.run_on_npu:
                return op
        return None

    def compressed_stream_index_from_coord(self, coord: Shape) -> int:
        assert self.format == TensorFormat.WeightsCompressed
        assert self.compressed_values is not None
        assert len(self.compressed_values) > 0
        assert len(self.compressed_values) + 1 == len(self.weight_compressed_offsets)

        depth = coord[-1]
        brick_depth = self.brick_size[-1]
        # Clamp position at final element index
        if depth > self.shape[-1]:
            depth = self.shape[-1]

        # Always round up to next boundary
        index = numeric_util.round_up_divide(depth, brick_depth)

        # Check boundaries on all but last weight set (which may be shorter
        # than the brick we divided it up into)
        if index < len(self.weight_compressed_offsets) - 1:
            # There are no half-way points in the weights
            if (depth % brick_depth) != 0:
                raise UnsupportedFeatureError("Offset into weights must be aligned to a brick")

        return index

    def size_of_compressed_stream(self, index: int) -> int:
        assert self.compressed_values is not None
        assert 0 <= index < len(self.compressed_values)
        return len(self.compressed_values[index])

    def is_last_index_in_compressed_stream(self, index: int) -> bool:
        assert self.compressed_values is not None
        assert 0 <= index < len(self.compressed_values)
        return index == len(self.compressed_values) - 1

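    # Returns the absolute address of the element at the given coordinate.
    # With is_top_box=True the coordinate is treated as an exclusive end
    # coordinate: the address of the last element inside the box is computed,
    # then one element stride is added.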
    def address_for_coordinate(
        self,
        orig_coord: Shape,
        strides: Optional[List[int]] = None,
        op_shape4D: Optional[Shape4D] = None,
        is_top_box: bool = False,
    ) -> Optional[int]:

        address_offset = 0
        assert self.purpose != TensorPurpose.Weights

        # Strides may be passed as an argument, for example when creating feature maps as the strides may be modified
        # by the "ofm_stride_multiplier" operation attribute. If not, they are calculated here.
        if not strides:
            strides = self.get_strides(op_shape4D)

        coord = orig_coord
        if is_top_box:
            coord = [c - 1 for c in orig_coord]
            address_offset += 1 * strides[-1]  # one element

        if self.sub_purpose == TensorSubPurpose.Standard:
            shape = op_shape4D.as_list() if op_shape4D else self.shape
            for _coord, _shape in zip(coord, shape):
                assert _coord >= 0 and _coord < _shape

        if op_shape4D and self.is_standard_fm:
            storage_shape = self.get_4D_storage_shape_for_shape(op_shape4D).as_list()
            storage_size = self.storage_size_for_shape(storage_shape)
        else:
            storage_shape = self.storage_shape
            coord = coord[-len(storage_shape) :]
            storage_size = self.storage_size()

        # Handle wraparound for partial buffers. Make sure to do this after subtracting top box
        coord = [_coord % _shape for _coord, _shape in zip(coord, storage_shape)]

        augmented_coord = self.get_augmented_coord(coord)
        assert augmented_coord is not None

        address_offset += np.dot(augmented_coord, strides)

        assert address_offset >= 0 and address_offset <= storage_size
        return self.address + address_offset

    def is_allocated_in_tensor_arena(self, scratch_tensor_mem_area: MemArea) -> bool:
        return (self.mem_area == scratch_tensor_mem_area) and (self.mem_type in (MemType.Scratch, MemType.Scratch_fast))

    def equivalent(self, tens: "Tensor") -> bool:
        return self.equivalence_id == tens.equivalence_id

    def set_all_shapes(self, shape: Shape):
        self.shape = shape
        self.storage_shape = shape
        self.bandwidth_shape = shape

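    # Examples (illustrative): [10] -> [1, 1, 1, 10], [2, 3] -> [2, 1, 1, 3]
    # and [2, 3, 4] -> [1, 2, 3, 4]; 4D shapes are returned unchanged.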
    def get_full_shape(self) -> Shape:
        d = len(self.shape)
        if d in (1, 3):
            return full_shape(4, self.shape, 1)
        elif d == 2:
            return [self.shape[0], 1, 1, self.shape[1]]
        else:
            return self.shape.copy()

    def is_quantized(self) -> bool:
        # a tensor is quantized if it has an integral type and it contains valid quantization params

        if not isinstance(self.quantization, QuantizationParameters):
            return False

        return (self.dtype.type & BaseType.Int) != 0 and self.quantization.is_valid()

    def get_scalar(self):
        """
        return: Unquantized or dequantized scalar value
        rtype: self.dtype (if unquantized) or float (if dequantized)
        """
        assert self.values.size == 1, "get_scalar called on non-scalar tensor"
        if self.is_quantized():
            return self.quantization.dequantize(self.values).item(0)
        else:
            return self.values.item(0)

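    # Example (illustrative): a tensor holding 12 elements with
    # dimension_2_size=4 yields Shape4D([3, 1, 1, 4]); None is returned for 1D
    # shapes or when the element count is not divisible by dimension_2_size.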
    def get_shape_as_2d(self, dimension_2_size: int) -> Optional[Shape4D]:

        elms = self.elements()
        dimension_1_size = elms // dimension_2_size
        # Checks if the reduction works and shape is not 1D
        is_reducible = dimension_1_size * dimension_2_size == elms and not (len(self.shape) == 1)

        new_shape = None
        if is_reducible:
            new_shape = Shape4D([dimension_1_size, 1, 1, dimension_2_size])

        return new_shape

    def __lt__(self, other: "Tensor") -> bool:
        return self.equivalence_id < other.equivalence_id

    def __str__(self):
        return "<nng.Tensor '%s' shape=%s dtype=%s>" % (self.name, self.shape, self.dtype)

    __repr__ = __str__

    def error(self, msg):
        """
        Raises a VelaError exception for errors encountered when parsing a Tensor

        :param self: Tensor object that resulted in the error
        :param msg: str object that contains a description of the specific error encountered
        """

        def _print_operators(ops):
            lines = []
            for idx, op in enumerate(ops):
                op_type = getattr(op, "type", "Not an Operation")
                op_id = getattr(op, "op_index", "-")
                lines.append(f"        {idx} = {op_type} ({op_id})")
            return lines

        lines = [f"Invalid {self.name} tensor. {msg}"]

        lines += ["    Driving operators:"]
        lines += _print_operators(self.ops)

        lines += ["    Consuming operators:"]
        lines += _print_operators(self.consumer_list)

        raise VelaError("\n".join(lines))


def check_quantized_tens_scaling_equal(tens_a: Tensor, tens_b: Tensor) -> bool:
    # checks that the scaling of two quantized tensors are equal

    return tens_a.is_quantized() and tens_b.is_quantized() and tens_a.quantization.is_scaling_equal(tens_b.quantization)
Tim Hall89567612020-10-27 11:57:57 +0000914 return tens_a.is_quantized() and tens_b.is_quantized() and tens_a.quantization.is_scaling_equal(tens_b.quantization)