# Copyright (C) 2020-2021 Arm Limited or its affiliates. All rights reserved.
#
# SPDX-License-Identifier: Apache-2.0
#
# Licensed under the Apache License, Version 2.0 (the License); you may
# not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an AS IS BASIS, WITHOUT
# WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
# Description:
# Internal representation of a Neural Network Tensor.
import copy
import enum
import uuid
from collections import defaultdict
from enum import auto
from functools import lru_cache
from functools import total_ordering
from typing import Dict
from typing import List
from typing import Optional
from typing import Tuple
from typing import Union
from uuid import UUID

import numpy as np

from . import numeric_util
from .data_type import BaseType
from .data_type import DataType
from .errors import UnsupportedFeatureError
from .errors import VelaError
from .ethos_u55_regs.ethos_u55_regs import resampling_mode
from .numeric_util import full_shape
from .operation import Op
from .operation import Operation
from .shape4d import Shape4D

Shape = List

class MemType(enum.IntFlag):
    Unknown = 0
    Permanent_NPU = 1
    Permanent_CPU = 2
    Scratch = 3
    Scratch_fast = 4
    Size = Scratch_fast + 1

    def display_name(self) -> str:
        return ("Unknown", "Permanent_NPU", "Permanent_CPU", "Scratch", "Scratch_fast", "Size")[self.value]

    def identifier_name(self) -> str:
        return ("unknown", "permanent_npu", "permanent_cpu", "scratch", "scratch_fast", "size")[self.value]

    @staticmethod
    def all():
        return (MemType.Permanent_NPU, MemType.Permanent_CPU, MemType.Scratch, MemType.Scratch_fast)

    def __str__(self):
        return self.name


class BandwidthDirection(enum.IntEnum):
    Read = 0
    Write = auto()
    Size = auto()

    def display_name(self):
        return self.name

    def identifier_name(self):
        return self.name.lower()

    @staticmethod
    def all():
        return (BandwidthDirection.Read, BandwidthDirection.Write)


class MemArea(enum.IntFlag):
    Unknown = 0
    Sram = 1
    Dram = 2
    OnChipFlash = 3
    OffChipFlash = 4
    Shram = 5  # for LUT
    Size = Shram + 1

    def display_name(self) -> str:
        return ("Unknown", "SRAM", "DRAM", "On-chip Flash", "Off-chip Flash", "SHRAM", "Size")[self.value]

    def identifier_name(self) -> str:
        return ("unknown", "sram", "dram", "on_chip_flash", "off_chip_flash", "shram", "size")[self.value]

    @staticmethod
    def all():
        return (MemArea.Sram, MemArea.Dram, MemArea.OnChipFlash, MemArea.OffChipFlash, MemArea.Shram)

    def __str__(self):
        return self.name


class TensorPurpose(enum.IntFlag):
    Unknown = 0
    Weights = 1
    FeatureMap = 2
    Scratch = 3
    ScratchFast = 4
    LUT = 5
    FSBias = 6
    Size = 7

    def display_name(self) -> str:
        return ("Unknown", "Weights", "FeatureMap", "Scratch", "ScratchFast", "LUT", "FastStorageBias", "Size")[
            self.value
        ]

    def identifier_name(self) -> str:
        return ("unknown", "weights", "feature_map", "scratch", "scratch_fast", "lut", "fast_storage_bias", "size")[
            self.value
        ]

    @staticmethod
    def all():
        return (TensorPurpose.Weights, TensorPurpose.FeatureMap, TensorPurpose.FSBias)


class TensorSubPurpose(enum.Enum):
    Standard = 0
    DoubleBuffer = 1
    RollingBufferX = 2
    RollingBufferY = 3
    RollingBufferXY = 4

    def display_name(self) -> str:
        return ("Standard", "Double Buffer", "Rolling Buffer X", "Rolling Buffer Y", "Rolling Buffer XY")[self.value]

    def identifier_name(self) -> str:
        return ("standard", "double_buffer", "rolling_buffer_x", "rolling_buffer_y", "rolling_buffer_xy")[self.value]

    @staticmethod
    def all():
        return (
            TensorSubPurpose.Standard,
            TensorSubPurpose.DoubleBuffer,
            TensorSubPurpose.RollingBufferX,
            TensorSubPurpose.RollingBufferY,
            TensorSubPurpose.RollingBufferXY,
        )


class TensorFormat(enum.Flag):
    Unknown = 0
    WeightsCompressed = 1
    NHWC = 2
    NHCWB16 = 3

    def __str__(self):
        return self.name


class TensorBlockTraversal(enum.Enum):
    Default = 0
    DepthWise = 1
    DepthFirst = 2
    PartKernelFirst = 3

def shape_num_elements(shp: Shape) -> Optional[int]:
    elems = 1
    if shp is None:
        return None
    for d in shp:
        if d is None:
            return None
        elems *= d
    return elems


def shape_fully_defined(shp: Shape) -> bool:
    if shp is None:
        return False
    for d in shp:
        if d is None:
            return False
    return True


def shape_round_to_quantum(shp: Shape, quantum: Tuple) -> Shape:
    new_shp = list(shp)

    # Traverse backwards using length of shape since there may be more rounding quantums than shape elements
    for i in range(-1, -len(shp) - 1, -1):
        if new_shp[i] is not None:
            new_shp[i] = numeric_util.round_up(new_shp[i], quantum[i])
    return new_shp

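# Example (illustrative): quanta are applied from the innermost dimension
# backwards, so a quantum tuple longer than the shape is handled naturally:
#
#   shape_round_to_quantum([1, 71, 55, 17], (1, 1, 1, 16))  # -> [1, 71, 55, 32]
#   shape_round_to_quantum([10], (1, 1, 1, 16))             # -> [16]
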
@lru_cache(maxsize=None)
def create_equivalence_id(key) -> UUID:
    # Generates an equivalence_id based on the given key; the lru_cache ensures
    # that the same key always maps to the same id.
    return uuid.uuid4()

class QuantizationParameters:
    __slots__ = "min", "max", "num_bits", "narrow_range", "scale_f32", "zero_point", "quant_min", "quant_max"

    def __init__(
        self,
        min: Union[float, np.ndarray, None] = None,
        max: Union[float, np.ndarray, None] = None,
        num_bits=None,
        narrow_range=None,
    ):
        self.min = min
        self.max = max

        self.num_bits = num_bits
        self.narrow_range = narrow_range

        self.scale_f32: Union[float, np.ndarray, None] = None
        self.zero_point: Union[int, np.ndarray, None] = None
        self.quant_min: Optional[float] = None
        self.quant_max: Optional[float] = None

    def __str__(self):
        return "<nng.QuantizationParameters min=%s max=%s, num_bits=%s, scale=%s, zero_point=%s>" % (
            self.min,
            self.max,
            self.num_bits,
            self.scale_f32,
            self.zero_point,
        )

    __repr__ = __str__

    def clone(self) -> "QuantizationParameters":
        res = QuantizationParameters()
        res.min = self.min
        res.max = self.max

        res.num_bits = self.num_bits
        res.narrow_range = self.narrow_range

        res.scale_f32 = self.scale_f32
        res.zero_point = self.zero_point
        res.quant_min = self.quant_min
        res.quant_max = self.quant_max
        return res

    def dequantize(self, values):
        if self.zero_point.size == 1 and self.scale_f32.size == 1:
            # same scale is used for all values
            res = (values.astype(np.float64) - self.zero_point) * self.scale_f32
        else:
            # a different scale is used for different sets of values
            values_as_float = values.astype(np.float64)

            # per-axis dequantization is not implemented here; broadcasting the
            # scales is not compatible with the format of depthwise weights,
            # where the input channel is at index 3 (Output, Kh, Kw, Input).
            # Return an uninitialized array of the right shape as a placeholder.
            return np.ndarray(values_as_float.shape)

        return res

    def is_scaling_equal(self, other: Optional["QuantizationParameters"]) -> bool:
        # Quantisation parameter scaling is not equal if 'other' is None, because
        # that implies the tensor it belongs to is not quantised. Otherwise,
        # equality depends on whether the scale and zero point are equal.

        if not isinstance(other, QuantizationParameters):
            return False

        return self.scale_f32 == other.scale_f32 and self.zero_point == other.zero_point

    def is_valid(self) -> bool:
        # quantisation parameters are considered valid if they have both a scale and a zero point

        return None not in (self.scale_f32, self.zero_point)

    def is_per_axis(self) -> bool:
        """Returns True if any of the scale, zero point, minimum or maximum values are arrays"""
        for attr in ("scale_f32", "zero_point", "min", "max"):
            if isinstance(getattr(self, attr), np.ndarray):
                return True
        return False

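# Example (illustrative): with a single scale of 0.5 and a zero point of 128,
# the uint8 value 130 dequantizes to (130 - 128) * 0.5 == 1.0:
#
#   qp = QuantizationParameters()
#   qp.scale_f32 = np.array(0.5)
#   qp.zero_point = np.array(128)
#   qp.dequantize(np.array([130], dtype=np.uint8))  # -> array([1.0])
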
def create_const_tensor(
    name: str,
    shape: Shape,
    dtype: DataType,
    values: np.ndarray,
    value_dtype: np.dtype = None,
    purpose: TensorPurpose = TensorPurpose.Unknown,
    quantization: QuantizationParameters = None,
):
    # Tensor
    const_tensor = Tensor(shape, dtype, name + "_0")
    const_tensor.purpose = purpose
    const_tensor.quantization = quantization
    const_tensor.values = np.array(values, dtype=value_dtype)
    const_tensor.quant_values = np.frombuffer(const_tensor.values.tobytes(), dtype=np.uint8)
    # Operator
    const_op = Operation(Op.Const, name)
    const_op.set_output_tensor(const_tensor)
    const_op.set_ifm_ofm_shapes()
    return const_tensor

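# Example (illustrative; the tensor name and values are hypothetical): create a
# bias tensor that is driven by a single Const operation:
#
#   bias = create_const_tensor("conv1_bias", [64], DataType.int32, np.zeros(64, np.int32))
#   assert bias.ops[0].type == Op.Const
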
# class that keeps track of all tensor addresses in the different memory types
class TensorAddressMap:
    address_map: Dict = defaultdict(dict)  # dict (tens.equivalence_id -> dict (mem_type -> address))

    @classmethod
    def get_address_for_tens(cls, tens_id: UUID, mem_type: MemType) -> int:
        return cls.address_map[tens_id].get(mem_type)

    @classmethod
    def set_address_for_tens(cls, tens_id: UUID, mem_type: MemType, address: int):
        # Check previous address if there is one
        previous_address = cls.address_map[tens_id].get(mem_type)
        if address is not None and previous_address is not None:
            assert previous_address == address, "Two different addresses cannot be assigned to the same tensor."

        # Set tensor's address for memory type
        cls.address_map[tens_id][mem_type] = address

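# Example (illustrative): tensors that share an equivalence_id (e.g. clones made
# with set_unique=False) resolve to the same address for a given memory type:
#
#   tens.address = 0x100      # stored under (tens.equivalence_id, tens.mem_type)
#   tens.clone().address      # -> 0x100, since the clone keeps the equivalence_id
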
@total_ordering
class Tensor:
    __slots__ = (
        "shape",
        "storage_shape",
        "bandwidth_shape",
        "dtype",
        "name",
        "is_variable",
        "ops",
        "consumer_list",
        "values",
        "quant_values",
        "compressed_values",
        "compressed_values_substream_offsets",
        "mem_area",
        "mem_type",
        "format",
        "purpose",
        "sub_purpose",
        "alignment",
        "weight_transpose_depthwise",
        "storage_compression_scale",
        "bandwidth_compression_scale",
        "compression_scale_for_worst_weight_stream",
        "weight_compression_scales",
        "weight_compression_config",
        "value_id",
        "storage_rounding_quantum",
        "brick_size",
        "quantization",
        "weight_compressed_offsets",
        "element_size_bytes",
        "block_traversal",
        "equivalence_id",
        "resampling_mode",
        "avoid_NHCWB16",
    )
    AllocationQuantum = 16

    def __init__(self, shape: Shape, dtype: DataType, name: str):
        self.shape = shape
        self.storage_shape = shape
        self.bandwidth_shape = shape
        self.dtype = dtype
        self.name = name
        self.is_variable = False
        self.equivalence_id: UUID = uuid.uuid4()

        self.ops: List[Operation] = []
        self.consumer_list: List[Operation] = []

        self.values: Optional[np.ndarray] = None
        self.quant_values: Optional[np.ndarray] = None
        self.compressed_values: Optional[np.ndarray] = None
        self.compressed_values_substream_offsets: Optional[List] = None
        self.mem_area: MemArea = MemArea.Unknown
        self.mem_type: MemType = MemType.Unknown
        self.format: TensorFormat = TensorFormat.Unknown
        self.purpose: TensorPurpose = TensorPurpose.Unknown
        self.sub_purpose: TensorSubPurpose = TensorSubPurpose.Standard
        self.alignment: int = Tensor.AllocationQuantum
        self.weight_transpose_depthwise: bool = False

        self.storage_compression_scale: float = 1.0
        self.bandwidth_compression_scale: float = 1.0
        self.compression_scale_for_worst_weight_stream: float = 1.0
        self.weight_compression_scales: Optional[np.ndarray] = None
        # if two tensors have the same weight_compression_config, then they have the same compressed values
        self.weight_compression_config = None
        # if two tensors have the same value_id, then they have the same values
        self.value_id: UUID = uuid.uuid4()
        self.weight_compressed_offsets: List = []
        self.storage_rounding_quantum: Tuple = (1, 1, 1, 1)
        self.brick_size: Tuple = (1, 1, 1, 1)
        self.element_size_bytes: int = 0

        # quantization parameters
        self.quantization: Optional[QuantizationParameters] = None
        self.block_traversal: TensorBlockTraversal = TensorBlockTraversal.Default
        self.resampling_mode: resampling_mode = resampling_mode.NONE

        self.avoid_NHCWB16: bool = False

    @property
    def address(self) -> int:
        return TensorAddressMap.get_address_for_tens(self.equivalence_id, self.mem_type)

    @address.setter
    def address(self, address: int):
        TensorAddressMap.set_address_for_tens(self.equivalence_id, self.mem_type, address)

    @property
    def is_standard_fm(self) -> bool:
        return self.sub_purpose == TensorSubPurpose.Standard and self.purpose == TensorPurpose.FeatureMap

    def element_size(self) -> int:
        if self.element_size_bytes == 0:
            return self.dtype.size_in_bits() / 8
        return self.element_size_bytes

    # Returns a copy, renamed to self.name + suffix.
    # The copy's references to Operations are cleared and its quantization is cloned.
    # If set_unique is True, the copy is given a new equivalence_id.
    def clone(self, suffix="_clone", set_unique: bool = False) -> "Tensor":
        res = copy.copy(self)
        if set_unique:
            res.equivalence_id = uuid.uuid4()
        res.storage_shape = list(self.storage_shape)
        res.bandwidth_shape = list(self.bandwidth_shape)
        if self.quantization is not None:
            res.quantization = self.quantization.clone()

        res.name = res.name + suffix
        res.ops = []
        res.consumer_list = []

        return res

    def clone_into_fast_storage(self, arch) -> "Tensor":
        res = self.clone(suffix="_fast_storage")
        res.mem_area = arch.fast_storage_mem_area
        res.mem_type = MemType.Scratch_fast
        return res

    def copy_compressed_weight_info(self, src_tens: "Tensor"):
        # Copies compressed values + all related weight compression info from the given tensor
        self.equivalence_id = src_tens.equivalence_id
        self.compressed_values = src_tens.compressed_values
        self.compressed_values_substream_offsets = src_tens.compressed_values_substream_offsets
        self.storage_shape = src_tens.storage_shape
        self.brick_size = src_tens.brick_size
        self.weight_compression_scales = src_tens.weight_compression_scales
        self.weight_compressed_offsets = src_tens.weight_compressed_offsets
        self.weight_transpose_depthwise = src_tens.weight_transpose_depthwise
        self.compression_scale_for_worst_weight_stream = src_tens.compression_scale_for_worst_weight_stream
        self.storage_compression_scale = src_tens.storage_compression_scale
        self.bandwidth_compression_scale = src_tens.bandwidth_compression_scale
        self.block_traversal = src_tens.block_traversal
        self.weight_compression_config = src_tens.weight_compression_config
        self.value_id = src_tens.value_id

    def set_format(self, fmt: TensorFormat, arch):
        self.format = fmt
        shape_len = 0
        try:
            shape_len = len(self.shape)
        except TypeError:
            pass

        if shape_len > 4:
            return
        self.storage_rounding_quantum = arch.storage_rounding_quantums[self.format]
        self.storage_rounding_quantum = tuple(self.storage_rounding_quantum[-shape_len:])
        self.brick_size = arch.brick_sizes[self.format]
        self.brick_size = tuple(self.brick_size[-shape_len:])
        if self.shape is None:
            return

        self.bandwidth_shape = shape_round_to_quantum(self.shape, self.brick_size)
        self.storage_shape = shape_round_to_quantum(self.shape, self.storage_rounding_quantum)

        if fmt == TensorFormat.WeightsCompressed:
            compression_ratio = 5 / 8
            self.storage_compression_scale = compression_ratio
            self.bandwidth_compression_scale = compression_ratio
            self.compression_scale_for_worst_weight_stream = compression_ratio

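    # Example (illustrative, assuming the architecture configures an NHCWB16
    # storage rounding quantum of (1, 1, 1, 16)): set_format rounds the channel
    # dimension up, so a tensor of shape [1, 8, 8, 17] gets storage_shape
    # [1, 8, 8, 32].
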
    def storage_elements(self) -> int:
        elems = shape_num_elements(self.storage_shape)
        if elems is None:
            return 0
        return elems

    def elements(self) -> int:
        elems = shape_num_elements(self.shape)
        if elems is None:
            return 0
        return elems

    def has_fully_defined_shape(self) -> bool:
        return shape_fully_defined(self.shape)

    def storage_size(self, scale: float = 1.0) -> int:
        raw_size = self.storage_elements() * self.element_size() * scale
        if raw_size == 0:
            raw_size = 1  # force it to take up space
        rounded_size = numeric_util.round_up(numeric_util.round_up_to_int(raw_size), self.alignment)
        return rounded_size

    def storage_size_for_shape(self, op_storage_shape: Shape) -> int:
        elems = shape_num_elements(op_storage_shape)
        elems = elems if elems else 0
        raw_size = elems * self.element_size()
        if raw_size == 0:
            raw_size = 1  # force it to take up space
        rounded_size = numeric_util.round_up(numeric_util.round_up_to_int(raw_size), self.alignment)
        return rounded_size

    def storage_size_for_sub_purpose(
        self, arch, sub_purpose: TensorSubPurpose, param_a: Optional[int] = None, param_b: Optional[int] = None
    ) -> int:
        alt_shape = self.storage_shape_for_sub_purpose(sub_purpose, param_a, param_b)
        elems = shape_num_elements(alt_shape)
        if elems is None:
            return 0
        if sub_purpose == TensorSubPurpose.DoubleBuffer:
            raw_size = (
                elems
                * self.element_size()
                * self.compression_scale_for_worst_weight_stream
                * arch.weight_estimation_scaling
            )
        else:
            # Rolling buffers are used for intermediate data in ifm streaming
            # These will all use the NHCWB16 format, and need to be aligned to 16 in the C-dimension
            if alt_shape[-1] % 16 != 0:
                nhcwb16_shape = alt_shape[0:-1] + [numeric_util.round_up(alt_shape[-1], 16)]
                elems = shape_num_elements(nhcwb16_shape)

            raw_size = elems * self.element_size() * self.storage_compression_scale
        rounded_size = numeric_util.round_up(numeric_util.round_up_to_int(raw_size), self.alignment)
        return rounded_size

    def storage_shape_for_sub_purpose(
        self, sub_purpose: TensorSubPurpose, param_a: Optional[int], param_b: Optional[int]
    ) -> Shape:
        if sub_purpose == TensorSubPurpose.DoubleBuffer:
            shp = list(self.shape)
            assert len(shp) >= 2
            assert param_a is not None
            shp[-1] = min(shp[-1], param_a * 2)
        else:
            shp = list(self.storage_shape)
            if sub_purpose == TensorSubPurpose.RollingBufferX:
                assert len(shp) == 4
                assert param_a is not None
                shp[0] = 1
                shp[2] = min(shp[2], param_a)
            elif sub_purpose == TensorSubPurpose.RollingBufferY:
                assert len(shp) == 4
                assert param_a is not None
                shp[0] = 1
                shp[1] = min(shp[1], param_a)
            elif sub_purpose == TensorSubPurpose.RollingBufferXY:
                assert len(shp) == 4
                assert param_a is not None
                assert param_b is not None
                shp[0] = 1
                shp[2] = min(shp[2], param_a)
                shp[1] = min(shp[1], param_b)
            elif sub_purpose == TensorSubPurpose.Standard:
                pass
            else:
                assert 0, "did not expect new sub purpose %s" % (sub_purpose,)

        return shp

    def set_new_sub_purpose(self, sub_purpose: TensorSubPurpose, param_a=None, param_b=None):
        self.storage_shape = self.storage_shape_for_sub_purpose(sub_purpose, param_a, param_b)
        self.sub_purpose = sub_purpose
        if sub_purpose == TensorSubPurpose.DoubleBuffer:
            self.storage_compression_scale = self.compression_scale_for_worst_weight_stream

    def bandwidth(self) -> float:
        elems = shape_num_elements(self.bandwidth_shape)
        if elems is None:
            return 0
        return elems * self.element_size() * self.bandwidth_compression_scale

    def consumers(self) -> List[Operation]:
        return self.consumer_list

    def get_4D_storage_shape_for_shape(self, op_shape4D: Shape4D) -> Shape4D:
        rounding_quantum = full_shape(4, list(self.storage_rounding_quantum), 1)
        return Shape4D(shape_round_to_quantum(op_shape4D.as_list(), rounding_quantum))

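    # Example (illustrative, assuming a standard NHCWB16 feature map whose
    # storage rounding quantum is (1, 1, 1, 16)): an operator shape of
    # Shape4D(1, 8, 8, 17) maps to a storage shape of Shape4D(1, 8, 8, 32).
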
    def addresses_for_rolling_buffer(self, start_coord: Shape, end_coord: Shape, op_shape4D: Shape4D) -> Tuple:
        # returns ( box_height0, box_height1, box_width, [address_tl, address_tr, address_bl, address_br] )

        if self.storage_shape == []:
            return (
                1,
                1,
                1,
                [self.address_for_coordinate(start_coord, op_shape4D=op_shape4D), None, None, None],
            )

        if self.is_standard_fm:
            storage_shape_4D = self.get_4D_storage_shape_for_shape(op_shape4D)
        else:
            storage_shape_4D = Shape4D(self.storage_shape)

        crossing_y = numeric_util.round_up(start_coord[1] + 1, storage_shape_4D.height)
        crossing_x = numeric_util.round_up(start_coord[2] + 1, storage_shape_4D.width)

        crossing_y = min(crossing_y, end_coord[1])
        crossing_x = min(crossing_x, end_coord[2])

        box_height0 = crossing_y - start_coord[1]
        box_width = crossing_x - start_coord[2]

        addresses: List = [None] * 4
        addresses[0] = self.address_for_coordinate(start_coord, op_shape4D=op_shape4D)

        if end_coord[2] > crossing_x:
            addresses[1] = self.address_for_coordinate(
                [start_coord[0], start_coord[1], crossing_x, start_coord[3]], op_shape4D=op_shape4D
            )
            raise UnsupportedFeatureError("Striping in vertical direction is not supported")
        if end_coord[1] > crossing_y:
            addresses[2] = self.address_for_coordinate(
                [start_coord[0], crossing_y, start_coord[2], start_coord[3]], op_shape4D=op_shape4D
            )
        if end_coord[1] > crossing_y and end_coord[2] > crossing_x:
            addresses[3] = self.address_for_coordinate(
                [start_coord[0], crossing_y, crossing_x, start_coord[3]], op_shape4D=op_shape4D
            )

        return box_height0, box_height0, box_width, addresses

    def address_for_coordinate(self, coord: Shape, is_top_box: bool = False, op_shape4D: Shape4D = None) -> int:
        offset = self.address_offset_for_coordinate(coord, op_shape4D=op_shape4D, is_top_box=is_top_box)
        assert offset is not None
        return self.address + offset

    def get_strides_and_coord(
        self, coord: Optional[Shape] = None, shape4D: Optional[Shape4D] = None
    ) -> Tuple[Optional[Shape], Optional[Shape]]:
        if coord is None:
            coord = [0] * len(self.storage_shape)

        if shape4D and self.is_standard_fm:
            augmented_shape = self.get_4D_storage_shape_for_shape(shape4D).as_list()
        else:
            augmented_shape = full_shape(4, self.storage_shape, 1)

        augmented_coord = coord

        while len(augmented_coord) < 4:
            augmented_coord = [0] + augmented_coord

        assert len(augmented_coord) == len(augmented_shape)

        if self.format == TensorFormat.NHWC:
            augmented_shape = [augmented_shape[0], augmented_shape[3]] + augmented_shape[1:3] + [1]
            augmented_coord = [augmented_coord[0], augmented_coord[3]] + augmented_coord[1:3] + [0]

        elif self.format == TensorFormat.NHCWB16:
            channel_divisor = 16
            augmented_shape = augmented_shape[0:4] + [1]
            augmented_coord = (
                [augmented_coord[0], augmented_coord[3] // channel_divisor]
                + augmented_coord[1:3]
                + [augmented_coord[3] % channel_divisor]
            )

            if augmented_shape[1] == 0:
                augmented_shape[1] = 1

        else:
            assert self.format in (TensorFormat.Unknown, TensorFormat.WeightsCompressed)
            return None, None

        strides: List = [0] * len(augmented_shape)
        stride = self.element_size() * self.storage_compression_scale

        if self.format != TensorFormat.NHCWB16:
            stride_order = [4, 1, 3, 2, 0]
            for i in stride_order:
                strides[i] = stride
                stride *= augmented_shape[i]
        else:
            assert len(strides) == 5
            strides[4] = stride
            strides[3] = 16 * stride  # STRIDE_X
            strides[1] = strides[3] * augmented_shape[2]  # STRIDE_C
            strides[2] = augmented_shape[2] * augmented_shape[3] * stride  # STRIDE_Y
            strides[0] = strides[2] * augmented_shape[1]  # STRIDE_N

        return strides, augmented_coord

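    # Example (illustrative, assuming 1-byte elements and the default
    # storage_compression_scale of 1.0): for an NHCWB16 tensor with
    # storage_shape [1, 8, 8, 32], get_strides() returns [2048, 128, 256, 16, 1]:
    # a 16-channel brick advances 16 bytes in X (STRIDE_X), consecutive brick
    # slices are W * 16 == 128 bytes apart (STRIDE_C), one row is
    # W * C == 256 bytes (STRIDE_Y) and the whole map is 2048 bytes (STRIDE_N).
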
    def get_strides(self, shape4D: Optional[Shape4D] = None) -> Shape:
        strides, _ = self.get_strides_and_coord(shape4D=shape4D)
        assert strides is not None
        return strides

    def needs_dma(self) -> bool:
        return len(self.ops) == 1 and self.ops[0].type == Op.DMA

    def get_dma_src_tensor(self) -> "Optional[Tensor]":
        # For weight tensors that need DMA: returns the source tensor in Flash, else None
        # Note: for DMA ops, Pass.weight_tensor is referring to the SRAM weight tensor
        return self.ops[0].inputs[0] if self.needs_dma() else None

    def find_npu_op(self) -> Optional[Operation]:
        # Returns the NPU operator that uses this tensor, excluding DMA operators.
        for op in self.consumers():
            if op.type == Op.DMA:
                return op.outputs[0].find_npu_op()
            if op.run_on_npu:
                return op
        return None

    def compressed_stream_index_from_coord(self, coord: Shape) -> int:
        assert self.format == TensorFormat.WeightsCompressed
        assert self.compressed_values is not None
        assert len(self.compressed_values) > 0
        assert len(self.compressed_values) + 1 == len(self.weight_compressed_offsets)

        depth = coord[-1]
        brick_depth = self.brick_size[-1]
        # Clamp position at final element index
        if depth > self.shape[-1]:
            depth = self.shape[-1]

        # Always round up to next boundary
        index = numeric_util.round_up_divide(depth, brick_depth)

        # Check boundaries on all but last weight set (which may be shorter
        # than the brick we divided it up into)
        if index < len(self.weight_compressed_offsets) - 1:
            # There are no half-way points in the weights
            if (depth % brick_depth) != 0:
                raise UnsupportedFeatureError("Offset into weights must be aligned to a brick")

        return index

    def size_of_compressed_stream(self, index: int) -> int:
        assert self.compressed_values is not None
        assert 0 <= index < len(self.compressed_values)
        return len(self.compressed_values[index])

    def is_last_index_in_compressed_stream(self, index: int) -> bool:
        assert self.compressed_values is not None
        assert 0 <= index < len(self.compressed_values)
        return index == len(self.compressed_values) - 1

    def address_offset_for_coordinate(
        self, orig_coord: Shape, op_shape4D: Optional[Shape4D] = None, is_top_box: bool = False
    ) -> Optional[int]:
        address_offset = 0

        if self.sub_purpose == TensorSubPurpose.Standard:
            shape = op_shape4D.as_list() if op_shape4D else self.shape
            for idx, c in enumerate(orig_coord):
                if is_top_box:
                    assert c > 0 and c <= shape[idx]
                else:
                    assert c >= 0 and c < shape[idx]

        if self.format == TensorFormat.WeightsCompressed:
            storage_size = self.storage_size()
            if len(self.weight_compressed_offsets) == 0:
                return 0

            if self.needs_dma() and self.sub_purpose == TensorSubPurpose.DoubleBuffer:
                depth = orig_coord[-1]
                brick_depth = self.brick_size[-1]
                # Clamp position at final element index
                if depth > self.shape[-1]:
                    depth = self.shape[-1]

                # Always round up to next boundary
                index = numeric_util.round_up_divide(depth, brick_depth)
                index = index % 2
                assert self.compressed_values is not None

                if len(self.compressed_values) <= 2:
                    if is_top_box and index == 0:
                        for cv in self.compressed_values:
                            address_offset += len(cv)
                    else:
                        address_offset = index * len(self.compressed_values[0])
                else:
                    if is_top_box and index == 0:
                        address_offset = self.storage_shape[-1]
                    else:
                        address_offset = index * (self.storage_shape[-1] // 2)
            else:
                index = self.compressed_stream_index_from_coord(orig_coord)
                assert index < len(self.weight_compressed_offsets)
                address_offset = self.weight_compressed_offsets[index]
        else:
            coord = orig_coord
            if op_shape4D and self.is_standard_fm:
                storage_shape = self.get_4D_storage_shape_for_shape(op_shape4D).as_list()
                storage_size = self.storage_size_for_shape(storage_shape)
            else:
                storage_shape = self.storage_shape
                coord = coord[-len(storage_shape) :]
                storage_size = self.storage_size()

            if is_top_box:
                coord = [c - 1 for c in coord]

            # handle wraparound for partial buffers. make sure to do this after subtracting top box:
            coord = [c % storage_shape[idx] for idx, c in enumerate(coord)]

            strides, augmented_coord = self.get_strides_and_coord(coord, op_shape4D)
            if strides is None:
                return None

            if is_top_box:
                address_offset += 1 * strides[-1]  # one element

            address_offset += np.dot(augmented_coord, strides)

        assert address_offset >= 0
        assert address_offset <= storage_size
        return address_offset

    def is_allocated_in_tensor_arena(self, scratch_tensor_mem_area: MemArea) -> bool:
        return (self.mem_area == scratch_tensor_mem_area) and (self.mem_type in (MemType.Scratch, MemType.Scratch_fast))

    def equivalent(self, tens: "Tensor") -> bool:
        return self.equivalence_id == tens.equivalence_id

    def set_all_shapes(self, shape: Shape):
        self.shape = shape
        self.storage_shape = shape
        self.bandwidth_shape = shape

    def get_full_shape(self) -> Shape:
        d = len(self.shape)
        if d in (1, 3):
            return full_shape(4, self.shape, 1)
        elif d == 2:
            return [self.shape[0], 1, 1, self.shape[1]]
        else:
            return self.shape.copy()

    def is_quantized(self) -> bool:
        # a tensor is quantized if it has an integral type and it contains valid quantization params

        if not isinstance(self.quantization, QuantizationParameters):
            return False

        return (self.dtype.type & BaseType.Int) != 0 and self.quantization.is_valid()

    def __lt__(self, other: "Tensor") -> bool:
        return self.equivalence_id < other.equivalence_id

    def __str__(self):
        return "<nng.Tensor '%s' shape=%s dtype=%s>" % (self.name, self.shape, self.dtype)

    __repr__ = __str__

    def error(self, msg):
        """
        Raises a VelaError exception for errors encountered when parsing a Tensor

        :param self: Tensor object that resulted in the error
        :param msg: str object that contains a description of the specific error encountered
        """

        def _print_operators(ops):
            lines = []
            for idx, op in enumerate(ops):
                op_type = getattr(op, "type", "Not an Operation")
                op_id = getattr(op, "op_index", "-")
                lines.append(f"        {idx} = {op_type} ({op_id})")
            return lines

        lines = [f"Invalid {self.name} tensor. {msg}"]

        lines += ["    Driving operators:"]
        lines += _print_operators(self.ops)

        lines += ["    Consuming operators:"]
        lines += _print_operators(self.consumer_list)

        raise VelaError("\n".join(lines))

def check_quantized_tens_scaling_equal(tens_a: Tensor, tens_b: Tensor) -> bool:
    # checks that the scaling of two quantized tensors is equal

    return tens_a.is_quantized() and tens_b.is_quantized() and tens_a.quantization.is_scaling_equal(tens_b.quantization)
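

# Example (illustrative; 'ifm' and 'ofm' are hypothetical tensors): two tensors
# compare equal here only when both are quantized and agree on scale and zero
# point:
#
#   if check_quantized_tens_scaling_equal(ifm, ofm):
#       pass  # no rescale is needed between the two tensors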