# Copyright (C) 2020-2021 Arm Limited or its affiliates. All rights reserved.
#
# SPDX-License-Identifier: Apache-2.0
#
# Licensed under the Apache License, Version 2.0 (the License); you may
# not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an AS IS BASIS, WITHOUT
# WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
# Description:
# Internal representation of a Neural Network Tensor.
import copy
import enum
import uuid
from collections import defaultdict
from enum import auto
from functools import lru_cache
from functools import total_ordering
from typing import Dict
from typing import List
from typing import Optional
from typing import Tuple
from typing import Union
from uuid import UUID

import numpy as np

from . import numeric_util
from .data_type import BaseType
from .data_type import DataType
from .errors import UnsupportedFeatureError
from .errors import VelaError
from .numeric_util import full_shape
from .operation import Op
from .operation import Operation
from .shape4d import Shape4D

Shape = List

class MemType(enum.IntFlag):
    Unknown = 0
    Permanent_NPU = 1
    Permanent_CPU = 2
    Scratch = 3
    Scratch_fast = 4
    Size = Scratch_fast + 1

    def display_name(self) -> str:
        return ("Unknown", "Permanent_NPU", "Permanent_CPU", "Scratch", "Scratch_fast", "Size")[self.value]

    def identifier_name(self) -> str:
        return ("unknown", "permanent_npu", "permanent_cpu", "scratch", "scratch_fast", "size")[self.value]

    @staticmethod
    def all():
        return (MemType.Permanent_NPU, MemType.Permanent_CPU, MemType.Scratch, MemType.Scratch_fast)

    def __str__(self):
        return self.name


class BandwidthDirection(enum.IntEnum):
    Read = 0
    Write = auto()
    Size = auto()

    def display_name(self):
        return self.name

    def identifier_name(self):
        return self.name.lower()

    @staticmethod
    def all():
        return (BandwidthDirection.Read, BandwidthDirection.Write)


class MemArea(enum.IntFlag):
    Unknown = 0
    Sram = 1
    Dram = 2
    OnChipFlash = 3
    OffChipFlash = 4
    Shram = 5  # for LUT
    Size = Shram + 1

    def display_name(self) -> str:
        return ("Unknown", "SRAM", "DRAM", "On-chip Flash", "Off-chip Flash", "SHRAM", "Size")[self.value]

    def identifier_name(self) -> str:
        return ("unknown", "sram", "dram", "on_chip_flash", "off_chip_flash", "shram", "size")[self.value]

    @staticmethod
    def all():
        return (MemArea.Sram, MemArea.Dram, MemArea.OnChipFlash, MemArea.OffChipFlash, MemArea.Shram)

    def __str__(self):
        return self.name


class TensorPurpose(enum.IntFlag):
    Unknown = 0
    Weights = 1
    FeatureMap = 2
    Scratch = 3
    ScratchFast = 4
    LUT = 5
    FSBias = 6
    Size = 7

    def display_name(self) -> str:
        return ("Unknown", "Weights", "FeatureMap", "Scratch", "ScratchFast", "LUT", "FastStorageBias", "Size")[
            self.value
        ]

    def identifier_name(self) -> str:
        return ("unknown", "weights", "feature_map", "scratch", "scratch_fast", "lut", "fast_storage_bias", "size")[
            self.value
        ]

    @staticmethod
    def all():
        return (TensorPurpose.Weights, TensorPurpose.FeatureMap, TensorPurpose.FSBias)


class TensorSubPurpose(enum.Enum):
    Standard = 0
    DoubleBuffer = 1
    RollingBufferX = 2
    RollingBufferY = 3
    RollingBufferXY = 4

    def display_name(self) -> str:
        return ("Standard", "Double Buffer", "Rolling Buffer X", "Rolling Buffer Y", "Rolling Buffer XY")[self.value]

    def identifier_name(self) -> str:
        return ("standard", "double_buffer", "rolling_buffer_x", "rolling_buffer_y", "rolling_buffer_xy")[self.value]

    @staticmethod
    def all():
        return (
            TensorSubPurpose.Standard,
            TensorSubPurpose.DoubleBuffer,
            TensorSubPurpose.RollingBufferX,
            TensorSubPurpose.RollingBufferY,
            TensorSubPurpose.RollingBufferXY,
        )


class TensorFormat(enum.Flag):
    Unknown = 0
    WeightsCompressed = 1
    NHWC = 2
    NHCWB16 = 3

    def __str__(self):
        return self.name


class TensorBlockTraversal(enum.Enum):
    Default = 0
    DepthWise = 1
    DepthFirst = 2
    PartKernelFirst = 3

def shape_num_elements(shp: Shape) -> Optional[int]:
    elems = 1
    if shp is None:
        return None
    for d in shp:
        if d is None:
            return None
        elems *= d
    return elems


def shape_fully_defined(shp: Shape) -> bool:
    if shp is None:
        return False
    for d in shp:
        if d is None:
            return False
    return True


def shape_round_to_quantum(shp: Shape, quantum: Tuple) -> Shape:
    new_shp = list(shp)

    # Traverse backwards using length of shape since there may be more rounding quantums than shape elements
    for i in range(-1, -len(shp) - 1, -1):
        if new_shp[i] is not None:
            new_shp[i] = numeric_util.round_up(new_shp[i], quantum[i])
    return new_shp

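# Illustrative sketch for shape_round_to_quantum (comment only, not executed):
# with a depth-16 rounding quantum such as (1, 1, 1, 16), only the axes that
# need padding change, and quanta longer than the shape are handled by the
# backwards traversal:
#
#   shape_round_to_quantum([1, 7, 9, 20], (1, 1, 1, 16))  # -> [1, 7, 9, 32]
#   shape_round_to_quantum([20], (1, 1, 1, 16))           # -> [32]
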
@lru_cache(maxsize=None)
def create_equivalence_id(key) -> UUID:
    # Generates equivalence_id based on the given key.
    return uuid.uuid4()

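# Usage sketch for create_equivalence_id: the lru_cache means an equal
# (hashable) key always yields the one cached UUID, while distinct keys each
# draw a fresh random UUID (the key below is hypothetical):
#
#   id_a = create_equivalence_id(("weights", 0.5))
#   id_b = create_equivalence_id(("weights", 0.5))
#   assert id_a == id_b  # same key -> same equivalence id
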
class QuantizationParameters:
    __slots__ = (
        "min",
        "max",
        "num_bits",
        "narrow_range",
        "scale_f32",
        "zero_point",
        "quant_min",
        "quant_max",
        "quant_dim",
    )

    def __init__(
        self,
        min: Union[float, np.ndarray, None] = None,
        max: Union[float, np.ndarray, None] = None,
        num_bits=None,
        narrow_range=None,
    ):
        self.min = min
        self.max = max

        self.num_bits = num_bits
        self.narrow_range = narrow_range

        self.scale_f32: Union[float, np.ndarray, None] = None
        self.zero_point: Union[int, np.ndarray, None] = None
        self.quant_min: Optional[float] = None
        self.quant_max: Optional[float] = None
        self.quant_dim: Optional[int] = None

    def __str__(self):
        return "<nng.QuantizationParameters min=%s max=%s, num_bits=%s, scale=%s, zero_point=%s>" % (
            self.min,
            self.max,
            self.num_bits,
            self.scale_f32,
            self.zero_point,
        )

    __repr__ = __str__

    def clone(self) -> "QuantizationParameters":
        res = QuantizationParameters()
        res.min = self.min
        res.max = self.max

        res.num_bits = self.num_bits
        res.narrow_range = self.narrow_range

        res.scale_f32 = self.scale_f32
        res.zero_point = self.zero_point
        res.quant_min = self.quant_min
        res.quant_max = self.quant_max
        res.quant_dim = self.quant_dim
        return res

    def dequantize(self, values) -> np.ndarray:
        return np.subtract(values, self.zero_point) * self.scale_f32

    def is_scaling_equal(self, other: Optional["QuantizationParameters"]) -> bool:
        # quantisation parameter scaling is not equal if 'other' is None because
        # it implies that the tensor it belongs to is not quantised. otherwise,
        # it depends upon whether the scale and zero point are equal

        if not isinstance(other, QuantizationParameters):
            return False

        return self.scale_f32 == other.scale_f32 and self.zero_point == other.zero_point

    def is_valid(self) -> bool:
        # quantisation parameters are considered valid if they have a scale and zero point

        return self.scale_f32 is not None and self.zero_point is not None

    def is_per_axis(self) -> bool:
        """Returns True if any of the scale, zero point, minimum or maximum values have more than one value"""
        for attr in ("scale_f32", "zero_point", "min", "max"):
            if np.size(getattr(self, attr)) > 1:
                return True
        return False

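# Worked example for QuantizationParameters.dequantize (hypothetical values):
# with scale_f32 = 0.5 and zero_point = 2, the quantized values [0, 4] map to
# (v - 2) * 0.5 = [-1.0, 1.0]:
#
#   q = QuantizationParameters()
#   q.scale_f32 = 0.5
#   q.zero_point = 2
#   q.dequantize(np.array([0, 4]))  # -> array([-1., 1.])
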
def create_const_tensor(
    name: str,
    shape: Shape,
    dtype: DataType,
    values: np.ndarray,
    value_dtype: np.dtype = None,
    purpose: TensorPurpose = TensorPurpose.Unknown,
    quantization: QuantizationParameters = None,
):
    # Tensor
    const_tensor = Tensor(shape, dtype, name + "_0")
    const_tensor.purpose = purpose
    const_tensor.quantization = quantization
    const_tensor.values = np.array(values, dtype=value_dtype)
    # Operator
    const_op = Operation(Op.Const, name)
    const_op.set_output_tensor(const_tensor)
    const_op.set_ifm_ofm_shapes()
    return const_tensor

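# Usage sketch for create_const_tensor (hypothetical name and values; assumes
# Operation.set_output_tensor registers the driving op on the tensor, as the
# call above relies on): constant data is wrapped in a Tensor driven by a
# Const operation so the graph can treat constants uniformly:
#
#   bias = create_const_tensor("conv1_bias", [1, 1, 1, 8], DataType.int32, np.zeros(8, dtype=np.int32))
#   assert bias.ops[0].type == Op.Const
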
# class that keeps track of all tensor addresses in the different memory types
class TensorAddressMap:
    address_map: Dict = defaultdict(dict)  # dict (tens.equivalence_id -> dict (mem_type -> address))

    @classmethod
    def get_address_for_tens(cls, tens_id: UUID, mem_type: MemType) -> int:
        return cls.address_map[tens_id].get(mem_type)

    @classmethod
    def set_address_for_tens(cls, tens_id: UUID, mem_type: MemType, address: int):
        # Check previous address if there is one
        previous_address = cls.address_map[tens_id].get(mem_type)
        if address is not None and previous_address is not None:
            assert previous_address == address, "Two different addresses cannot be assigned to the same tensor."

        # Set tensor's address for memory type
        cls.address_map[tens_id][mem_type] = address

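# Usage sketch for TensorAddressMap: addresses are keyed on equivalence_id, so
# a tensor and its (non-unique) clones resolve to one address per memory type.
# The tensor below is hypothetical:
#
#   t = Tensor([1, 8, 8, 16], DataType.uint8, "ifm")
#   t.mem_type = MemType.Scratch
#   t.address = 0x100                  # stored via TensorAddressMap
#   assert t.clone().address == 0x100  # clone shares the equivalence_id
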
@total_ordering
class Tensor:
    __slots__ = (
        "shape",
        "storage_shape",
        "bandwidth_shape",
        "dtype",
        "name",
        "is_variable",
        "pre_buffer",
        "ops",
        "consumer_list",
        "values",
        "compressed_values",
        "compressed_values_substream_offsets",
        "mem_area",
        "mem_type",
        "format",
        "purpose",
        "sub_purpose",
        "alignment",
        "weight_transpose_depthwise",
        "storage_compression_scale",
        "bandwidth_compression_scale",
        "compression_scale_for_worst_weight_stream",
        "weight_compression_scales",
        "weight_compression_config",
        "value_id",
        "storage_rounding_quantum",
        "brick_size",
        "quantization",
        "weight_compressed_offsets",
        "element_size_bytes",
        "block_traversal",
        "equivalence_id",
        "src_tensor",
        "needs_linear_format",
        "ifm_write_protected",
    )
    AllocationQuantum = 16

    def __init__(self, shape: Shape, dtype: DataType, name: str):
        self.shape = shape
        self.storage_shape = shape
        self.bandwidth_shape = shape
        self.dtype = dtype
        self.name = name
        self.is_variable = False
        self.pre_buffer = False
        self.equivalence_id: UUID = uuid.uuid4()

        self.ops: List[Operation] = []
        self.consumer_list: List[Operation] = []

        self.values: Optional[np.ndarray] = None  # elements are of type self.dtype
        self.compressed_values: Optional[np.ndarray] = None
        self.compressed_values_substream_offsets: Optional[List] = None
        self.mem_area: MemArea = MemArea.Unknown
        self.mem_type: MemType = MemType.Unknown
        self.format: TensorFormat = TensorFormat.Unknown
        self.purpose: TensorPurpose = TensorPurpose.Unknown
        self.sub_purpose: TensorSubPurpose = TensorSubPurpose.Standard
        self.alignment: int = Tensor.AllocationQuantum
        self.weight_transpose_depthwise: bool = False

        self.storage_compression_scale: float = 1.0
        self.bandwidth_compression_scale: float = 1.0
        self.compression_scale_for_worst_weight_stream: float = 1.0
        self.weight_compression_scales: Optional[np.ndarray] = None
        # if two tensors have the same weight_compression_config, then they have the same compressed values
        self.weight_compression_config = None
        # if two tensors have the same value_id, then they have the same values
        self.value_id: UUID = uuid.uuid4()
        self.weight_compressed_offsets: List = []
        self.storage_rounding_quantum: Tuple = (1, 1, 1, 1)
        self.brick_size: Tuple = (1, 1, 1, 1)
        self.element_size_bytes: int = 0

        # quantization parameters
        self.quantization: Optional[QuantizationParameters] = None
        self.block_traversal: TensorBlockTraversal = TensorBlockTraversal.Default

        self.needs_linear_format = True
        self.ifm_write_protected = False

        # Reference to parent-tensor if this tensor is a clone
        self.src_tensor: Optional[Tensor] = None

    @property
    def address(self) -> int:
        return TensorAddressMap.get_address_for_tens(self.equivalence_id, self.mem_type)

    @address.setter
    def address(self, address: int):
        TensorAddressMap.set_address_for_tens(self.equivalence_id, self.mem_type, address)

    @property
    def is_standard_fm(self) -> bool:
        return self.sub_purpose == TensorSubPurpose.Standard and self.purpose == TensorPurpose.FeatureMap

    def element_size(self) -> int:
        if self.element_size_bytes == 0:
            return self.dtype.size_in_bits() // 8
        return self.element_size_bytes

    # Returns a copy, renamed to self.name + suffix
    # The references to Operators will be empty when returned
    # Depending on set_unique, the copy is shallow or deep
    # For set_unique==True, a new equivalence_id will be set
    def clone(self, suffix="_clone", set_unique: bool = False) -> "Tensor":
        res = copy.copy(self)
        if set_unique:
            res.equivalence_id = uuid.uuid4()
        res.storage_shape = list(self.storage_shape)
        res.bandwidth_shape = list(self.bandwidth_shape)
        if self.quantization is not None:
            res.quantization = self.quantization.clone()

        res.name = res.name + suffix
        res.ops = []
        res.consumer_list = []

        return res

    def clone_into_fast_storage(self, arch) -> "Tensor":
        res = self.clone(suffix="_fast_storage")
        res.mem_area = arch.fast_storage_mem_area
        res.mem_type = MemType.Scratch_fast
        res.src_tensor = self
        return res

    def copy_compressed_weight_info(self, src_tens: "Tensor"):
        # Copies compressed values + all related weight compression info from the given tensor
        self.equivalence_id = src_tens.equivalence_id
        self.compressed_values = src_tens.compressed_values
        self.compressed_values_substream_offsets = src_tens.compressed_values_substream_offsets
        self.storage_shape = src_tens.storage_shape
        self.brick_size = src_tens.brick_size
        self.weight_compression_scales = src_tens.weight_compression_scales
        self.weight_compressed_offsets = src_tens.weight_compressed_offsets
        self.weight_transpose_depthwise = src_tens.weight_transpose_depthwise
        self.compression_scale_for_worst_weight_stream = src_tens.compression_scale_for_worst_weight_stream
        self.storage_compression_scale = src_tens.storage_compression_scale
        self.bandwidth_compression_scale = src_tens.bandwidth_compression_scale
        self.block_traversal = src_tens.block_traversal
        self.weight_compression_config = src_tens.weight_compression_config
        self.value_id = src_tens.value_id

    def set_format(self, fmt: TensorFormat, arch):
        self.format = fmt
        shape_len = 0
        try:
            shape_len = len(self.shape)
        except TypeError:
            pass

        if shape_len > 4:
            return
        assert not (self.needs_linear_format and fmt == TensorFormat.NHCWB16)
        self.storage_rounding_quantum = arch.storage_rounding_quantums[self.format]
        self.storage_rounding_quantum = tuple(self.storage_rounding_quantum[-shape_len:])
        self.brick_size = arch.brick_sizes[self.format]
        self.brick_size = tuple(self.brick_size[-shape_len:])
        if self.shape is None:
            return

        self.bandwidth_shape = shape_round_to_quantum(self.shape, self.brick_size)
        self.storage_shape = shape_round_to_quantum(self.shape, self.storage_rounding_quantum)

        if fmt == TensorFormat.WeightsCompressed:
            compression_ratio = 5 / 8
            self.storage_compression_scale = compression_ratio
            self.bandwidth_compression_scale = compression_ratio
            self.compression_scale_for_worst_weight_stream = compression_ratio

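    # Illustrative effect of set_format (assuming an arch whose NHCWB16 storage
    # rounding quantum is (1, 1, 1, 16)): a tensor with shape [1, 7, 9, 20]
    # keeps shape == [1, 7, 9, 20] but gets storage_shape == [1, 7, 9, 32],
    # i.e. storage is padded out to whole 16-channel bricks.
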
    def storage_elements(self) -> int:
        elems = shape_num_elements(self.storage_shape)
        if elems is None:
            return 0
        return elems

    def elements(self) -> int:
        elems = shape_num_elements(self.shape)
        if elems is None:
            return 0
        return elems

    def has_fully_defined_shape(self) -> bool:
        return shape_fully_defined(self.shape)

    def storage_size(self, scale: float = 1.0) -> int:
        raw_size = self.storage_elements() * self.element_size() * scale
        if raw_size == 0:
            raw_size = 1  # force it to take up space
        rounded_size = numeric_util.round_up(numeric_util.round_up_to_int(raw_size), self.alignment)
        return rounded_size

    def storage_size_for_shape(self, op_storage_shape: Shape) -> int:
        elems = shape_num_elements(op_storage_shape)
        elems = elems if elems else 0
        raw_size = elems * self.element_size()
        if raw_size == 0:
            raw_size = 1  # force it to take up space
        rounded_size = numeric_util.round_up(numeric_util.round_up_to_int(raw_size), self.alignment)
        return rounded_size

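    # Worked example for storage_size: an int8 tensor with storage_shape
    # [1, 5, 5, 3] has 75 raw bytes; rounded up to the default 16-byte
    # AllocationQuantum alignment, storage_size() returns 80.
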
    def storage_shape_for_sub_purpose(
        self, sub_purpose: TensorSubPurpose, param_a: Optional[int], param_b: Optional[int]
    ) -> Shape:
        if sub_purpose == TensorSubPurpose.DoubleBuffer:
            shp = list(self.shape)
            assert len(shp) >= 2
            assert param_a is not None
            shp[-1] = min(shp[-1], param_a * 2)
        else:
            shp = full_shape(4, self.storage_shape, 1)
            if sub_purpose == TensorSubPurpose.RollingBufferX:
                assert len(shp) == 4
                assert param_a is not None
                shp[0] = 1
                shp[2] = min(shp[2], param_a)
            elif sub_purpose == TensorSubPurpose.RollingBufferY:
                assert len(shp) == 4
                assert param_a is not None
                shp[0] = 1
                shp[1] = min(shp[1], param_a)
            elif sub_purpose == TensorSubPurpose.RollingBufferXY:
                assert len(shp) == 4
                assert param_a is not None
                assert param_b is not None
                shp[0] = 1
                shp[2] = min(shp[2], param_a)
                shp[1] = min(shp[1], param_b)
            elif sub_purpose == TensorSubPurpose.Standard:
                pass
            else:
                assert 0, "did not expect new sub purpose %s" % (sub_purpose,)

        return shp

    def set_new_sub_purpose(self, sub_purpose: TensorSubPurpose, param_a=None, param_b=None):
        self.storage_shape = self.storage_shape_for_sub_purpose(sub_purpose, param_a, param_b)
        self.sub_purpose = sub_purpose
        if sub_purpose == TensorSubPurpose.DoubleBuffer:
            self.storage_compression_scale = self.compression_scale_for_worst_weight_stream

    def bandwidth(self) -> float:
        elems = shape_num_elements(self.bandwidth_shape)
        if elems is None:
            return 0
        return elems * self.element_size() * self.bandwidth_compression_scale

    def consumers(self) -> List[Operation]:
        return self.consumer_list

    def get_4D_storage_shape_for_shape(self, op_shape4D: Shape4D) -> Shape4D:
        rounding_quantum = full_shape(4, list(self.storage_rounding_quantum), 1)
        return Shape4D(shape_round_to_quantum(op_shape4D.as_list(), rounding_quantum))

    def addresses_for_rolling_buffer(self, start_coord: Shape, end_coord: Shape, op_shape4D: Shape4D) -> Tuple:
        # returns ( box_height0, box_height1, box_width, [address_tl, address_tr, address_bl, address_br] )

        if self.storage_shape == []:
            return (
                1,
                1,
                1,
                [self.address_for_coordinate(start_coord, op_shape4D=op_shape4D), None, None, None],
            )

        if self.is_standard_fm:
            storage_shape_4D = self.get_4D_storage_shape_for_shape(op_shape4D)
        else:
            storage_shape_4D = Shape4D(self.storage_shape)

        crossing_y = numeric_util.round_up(start_coord[1] + 1, storage_shape_4D.height)
        crossing_x = numeric_util.round_up(start_coord[2] + 1, storage_shape_4D.width)

        crossing_y = min(crossing_y, end_coord[1])
        crossing_x = min(crossing_x, end_coord[2])

        box_height0 = crossing_y - start_coord[1]
        box_width = crossing_x - start_coord[2]

        addresses: List = [None] * 4
        addresses[0] = self.address_for_coordinate(start_coord, op_shape4D=op_shape4D)

        if end_coord[2] > crossing_x:
            addresses[1] = self.address_for_coordinate(
                [start_coord[0], start_coord[1], crossing_x, start_coord[3]], op_shape4D=op_shape4D
            )
            raise UnsupportedFeatureError("Striping in vertical direction is not supported")
        if end_coord[1] > crossing_y:
            addresses[2] = self.address_for_coordinate(
                [start_coord[0], crossing_y, start_coord[2], start_coord[3]], op_shape4D=op_shape4D
            )
        if end_coord[1] > crossing_y and end_coord[2] > crossing_x:
            addresses[3] = self.address_for_coordinate(
                [start_coord[0], crossing_y, crossing_x, start_coord[3]], op_shape4D=op_shape4D
            )

        return box_height0, box_height0, box_width, addresses

    def address_for_coordinate(self, coord: Shape, is_top_box: bool = False, op_shape4D: Shape4D = None) -> int:
        offset = self.address_offset_for_coordinate(coord, op_shape4D=op_shape4D, is_top_box=is_top_box)
        assert offset is not None
        return self.address + offset

    def get_strides_and_coord(
        self, coord: Optional[Shape] = None, shape4D: Optional[Shape4D] = None
    ) -> Tuple[Optional[Shape], Optional[Shape]]:
        if coord is None:
            coord = [0] * min(len(self.storage_shape), 4)

        if shape4D and self.is_standard_fm:
            augmented_shape = self.get_4D_storage_shape_for_shape(shape4D).as_list()
        else:
            augmented_shape = full_shape(4, self.storage_shape, 1)

        augmented_coord = coord

        while len(augmented_coord) < 4:
            augmented_coord = [0] + augmented_coord

        assert len(augmented_coord) == len(augmented_shape)

        if self.format == TensorFormat.NHWC:
            augmented_shape = [augmented_shape[0], augmented_shape[3]] + augmented_shape[1:3] + [1]
            augmented_coord = [augmented_coord[0], augmented_coord[3]] + augmented_coord[1:3] + [0]

        elif self.format == TensorFormat.NHCWB16:
            channel_divisor = 16
            augmented_shape = augmented_shape[0:4] + [1]
            augmented_coord = (
                [augmented_coord[0], augmented_coord[3] // channel_divisor]
                + augmented_coord[1:3]
                + [augmented_coord[3] % channel_divisor]
            )

            if augmented_shape[1] == 0:
                augmented_shape[1] = 1

        else:
            assert self.format in (TensorFormat.Unknown, TensorFormat.WeightsCompressed)
            return None, None

        strides: List = [0] * len(augmented_shape)
        stride = self.element_size() * self.storage_compression_scale

        if self.format != TensorFormat.NHCWB16:
            stride_order = [4, 1, 3, 2, 0]
            for i in stride_order:
                strides[i] = stride
                stride *= augmented_shape[i]
        else:
            assert len(strides) == 5
            strides[4] = stride
            strides[3] = 16 * stride  # STRIDE_X
            strides[1] = strides[3] * augmented_shape[2]  # STRIDE_C
            strides[2] = augmented_shape[2] * augmented_shape[3] * stride  # STRIDE_Y
            strides[0] = strides[2] * augmented_shape[1]  # STRIDE_N

        return strides, augmented_coord

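    # Worked example for get_strides_and_coord (int8, NHCWB16, storage_shape
    # [1, 4, 8, 32], already brick-aligned): the augmented coordinate order is
    # [N, C//16, H, W, C%16] and the byte strides come out as
    #   element = 1, STRIDE_X = 16, STRIDE_C = 16 * W = 128,
    #   STRIDE_Y = W * C = 256, STRIDE_N = H * W * C = 1024
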
    def get_strides(self, shape4D: Optional[Shape4D] = None) -> Shape:
        strides, _ = self.get_strides_and_coord(shape4D=shape4D)
        assert strides is not None
        return strides

    def find_npu_op(self) -> Optional[Operation]:
        # Returns the NPU operator that uses this tensor
        for op in self.consumers():
            if op.run_on_npu:
                return op
        return None

    def compressed_stream_index_from_coord(self, coord: Shape) -> int:
        assert self.format == TensorFormat.WeightsCompressed
        assert self.compressed_values is not None
        assert len(self.compressed_values) > 0
        assert len(self.compressed_values) + 1 == len(self.weight_compressed_offsets)

        depth = coord[-1]
        brick_depth = self.brick_size[-1]
        # Clamp position at final element index
        if depth > self.shape[-1]:
            depth = self.shape[-1]

        # Always round up to next boundary
        index = numeric_util.round_up_divide(depth, brick_depth)

        # Check boundaries on all but last weight set (which may be shorter
        # than the brick we divided it up into)
        if index < len(self.weight_compressed_offsets) - 1:
            # There are no half-way points in the weights
            if (depth % brick_depth) != 0:
                raise UnsupportedFeatureError("Offset into weights must be aligned to a brick")

        return index

    def size_of_compressed_stream(self, index: int) -> int:
        assert self.compressed_values is not None
        assert 0 <= index < len(self.compressed_values)
        return len(self.compressed_values[index])

    def is_last_index_in_compressed_stream(self, index: int) -> bool:
        assert self.compressed_values is not None
        assert 0 <= index < len(self.compressed_values)
        return index == len(self.compressed_values) - 1

    def address_offset_for_coordinate(
        self, orig_coord: Shape, op_shape4D: Optional[Shape4D] = None, is_top_box: bool = False
    ) -> Optional[int]:
        address_offset = 0
        assert self.purpose != TensorPurpose.Weights

        if self.sub_purpose == TensorSubPurpose.Standard:
            shape = op_shape4D.as_list() if op_shape4D else self.shape
            for idx, c in enumerate(orig_coord):
                if is_top_box:
                    assert c > 0 and c <= shape[idx]
                else:
                    assert c >= 0 and c < shape[idx]
        coord = orig_coord
        if op_shape4D and self.is_standard_fm:
            storage_shape = self.get_4D_storage_shape_for_shape(op_shape4D).as_list()
            storage_size = self.storage_size_for_shape(storage_shape)
        else:
            storage_shape = self.storage_shape
            coord = coord[-len(storage_shape) :]
            storage_size = self.storage_size()

        if is_top_box:
            coord = [c - 1 for c in coord]

        # handle wraparound for partial buffers. make sure to do this after subtracting top box:
        coord = [c % storage_shape[idx] for idx, c in enumerate(coord)]

        strides, augmented_coord = self.get_strides_and_coord(coord, op_shape4D)
        if strides is None:
            return None

        if is_top_box:
            address_offset += 1 * strides[-1]  # one element

        address_offset += np.dot(augmented_coord, strides)

        assert address_offset >= 0
        assert address_offset <= storage_size
        return address_offset

    def is_allocated_in_tensor_arena(self, scratch_tensor_mem_area: MemArea) -> bool:
        return (self.mem_area == scratch_tensor_mem_area) and (self.mem_type in (MemType.Scratch, MemType.Scratch_fast))

    def equivalent(self, tens: "Tensor") -> bool:
        return self.equivalence_id == tens.equivalence_id

    def set_all_shapes(self, shape: Shape):
        self.shape = shape
        self.storage_shape = shape
        self.bandwidth_shape = shape

    def get_full_shape(self) -> Shape:
        d = len(self.shape)
        if d in (1, 3):
            return full_shape(4, self.shape, 1)
        elif d == 2:
            return [self.shape[0], 1, 1, self.shape[1]]
        else:
            return self.shape.copy()

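    # Illustrative mapping of get_full_shape to 4D:
    #   [10]        -> [1, 1, 1, 10]   (1D padded with leading ones)
    #   [2, 3]      -> [2, 1, 1, 3]    (2D keeps batch and depth)
    #   [7, 9, 20]  -> [1, 7, 9, 20]   (3D padded with a leading one)
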
    def is_quantized(self) -> bool:
        # a tensor is quantized if it has an integral type and it contains valid quantization params

        if not isinstance(self.quantization, QuantizationParameters):
            return False

        return (self.dtype.type & BaseType.Int) != 0 and self.quantization.is_valid()

    def get_scalar(self):
        """
        return: Unquantized or dequantized scalar value
        rtype: self.dtype (if unquantized) or float (if dequantized)
        """
        assert self.values.size == 1, "get_scalar called on non-scalar tensor"
        if self.is_quantized():
            return self.quantization.dequantize(self.values).item(0)
        else:
            return self.values.item(0)

    def __lt__(self, other: "Tensor") -> bool:
        return self.equivalence_id < other.equivalence_id

    def __str__(self):
        return "<nng.Tensor '%s' shape=%s dtype=%s>" % (self.name, self.shape, self.dtype)

    __repr__ = __str__

    def error(self, msg):
        """
        Raises a VelaError exception for errors encountered when parsing a Tensor

        :param self: Tensor object that resulted in the error
        :param msg: str object that contains a description of the specific error encountered
        """

        def _print_operators(ops):
            lines = []
            for idx, op in enumerate(ops):
                op_type = getattr(op, "type", "Not an Operation")
                op_id = getattr(op, "op_index", "-")
                lines.append(f"        {idx} = {op_type} ({op_id})")
            return lines

        lines = [f"Invalid {self.name} tensor. {msg}"]

        lines += ["    Driving operators:"]
        lines += _print_operators(self.ops)

        lines += ["    Consuming operators:"]
        lines += _print_operators(self.consumer_list)

        raise VelaError("\n".join(lines))

def check_quantized_tens_scaling_equal(tens_a: Tensor, tens_b: Tensor) -> bool:
    # checks that the scaling of two quantized tensors is equal

    return tens_a.is_quantized() and tens_b.is_quantized() and tens_a.quantization.is_scaling_equal(tens_b.quantization)
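

# Usage sketch for check_quantized_tens_scaling_equal: both tensors must be
# quantized for the comparison to hold, so pairing a float tensor with a
# quantized one (hypothetical tensors) returns False rather than raising:
#
#   check_quantized_tens_scaling_equal(float_tens, int8_tens)  # -> False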