Blame - ethosu/vela/tensor.py - ml/ethos-u/ethos-u-vela

2020-04-27 18:20:16 +0100

[diff] [blame]

2

#

3

# SPDX-License-Identifier: Apache-2.0

4

#

5

# Licensed under the Apache License, Version 2.0 (the License); you may

6

# not use this file except in compliance with the License.

7

# You may obtain a copy of the License at

8

#

9

# www.apache.org/licenses/LICENSE-2.0

10

#

11

# Unless required by applicable law or agreed to in writing, software

12

# distributed under the License is distributed on an AS IS BASIS, WITHOUT

13

# WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.

14

# See the License for the specific language governing permissions and

15

# limitations under the License.

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

16

# Description:

17

# Internal representation of a Neural Network Tensor.

Patrik Gustavsson

2020-11-04 12:43:50 +0100

[diff] [blame]

18

import copy

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

19

import enum

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

20

import uuid

Jacob Bohlin

2020-09-11 10:04:15 +0200

[diff] [blame]

21

from collections import defaultdict

Diqing Zhong

f842b69

2020-12-11 13:07:37 +0100

[diff] [blame]

22

from enum import auto

Louis Verhaard

2020-09-23 10:27:11 +0200

[diff] [blame]

23

from functools import lru_cache

Louis Verhaard

6c74c3b

2020-12-17 13:54:09 +0100

[diff] [blame]

24

from functools import total_ordering

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

25

from typing import Dict

26

from typing import List

27

from typing import Optional

28

from typing import Tuple

29

from typing import Union

30

from uuid import UUID

Diego Russo

ea6111a

2020-04-14 18:41:58 +0100

[diff] [blame]

import numpy as np

from . import numeric_util

Tim Hall

2020-09-09 21:58:15 +0100

[diff] [blame]

35

from .data_type import BaseType

Michael McGeagh

2020-08-06 17:31:02 +0100

[diff] [blame]

36

from .data_type import DataType

Michael McGeagh

2020-12-16 11:33:21 +0000

[diff] [blame]

37

from .errors import UnsupportedFeatureError

38

from .errors import VelaError

Dwight Lidman

a9390f7

2020-05-13 12:00:08 +0200

[diff] [blame]

39

from .ethos_u55_regs.ethos_u55_regs import resampling_mode

Patrik Gustavsson

2020-12-01 16:02:29 +0100

[diff] [blame]

40

from .numeric_util import full_shape

Louis Verhaard

2020-09-30 09:01:52 +0200

[diff] [blame]

41

from .operation import Op

Michael McGeagh

2020-08-06 17:31:02 +0100

[diff] [blame]

42

from .operation import Operation

patrik.gustavsson

eeb8515

2020-12-21 17:10:40 +0000

[diff] [blame]

43

from .shape4d import Shape4D

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

44

45

Shape = List

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

46

47

Patrik Gustavsson

2020-05-27 09:15:11 +0200

[diff] [blame]

48

class MemType(enum.IntFlag):
    """Kinds of memory a tensor can be assigned to.

    ``Size`` is one more than ``Scratch_fast`` and is not included in ``all()``.
    """

    Unknown = 0
    Permanent_NPU = 1
    Permanent_CPU = 2
    Scratch = 3
    Scratch_fast = 4
    Size = Scratch_fast + 1

    def display_name(self) -> str:
        """Return the display label for this member, looked up by its integer value."""
        labels = ("Unknown", "Permanent_NPU", "Permanent_CPU", "Scratch", "Scratch_fast", "Size")
        return labels[self.value]

    def identifier_name(self) -> str:
        """Return the lower-case identifier for this member, looked up by its integer value."""
        identifiers = ("unknown", "permanent_npu", "permanent_cpu", "scratch", "scratch_fast", "size")
        return identifiers[self.value]

    @staticmethod
    def all():
        """Return a tuple of every member except ``Unknown`` and ``Size``."""
        return (
            MemType.Permanent_NPU,
            MemType.Permanent_CPU,
            MemType.Scratch,
            MemType.Scratch_fast,
        )

    def __str__(self):
        """Return the member name."""
        return self.name

Diqing Zhong

2020-12-11 13:07:37 +0100

[diff] [blame]

70

class BandwidthDirection(enum.IntEnum):
    """Direction of a memory transfer; ``Size`` is the member following ``Write``."""

    Read = 0
    Write = enum.auto()
    Size = enum.auto()

    def display_name(self):
        """Return the member name unchanged."""
        return self.name

    def identifier_name(self):
        """Return the member name in lower case."""
        member_name = self.name
        return member_name.lower()

    @staticmethod
    def all():
        """Return a tuple holding ``Read`` and ``Write`` (``Size`` is left out)."""
        return (
            BandwidthDirection.Read,
            BandwidthDirection.Write,
        )

84

85

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

86

class MemArea(enum.IntFlag):
    """Memory areas a tensor can be placed in.

    ``Size`` is one more than ``Shram`` and is not included in ``all()``.
    """

    Unknown = 0
    Sram = 1
    Dram = 2
    OnChipFlash = 3
    OffChipFlash = 4
    Shram = 5  # for LUT
    Size = Shram + 1

    def display_name(self) -> str:
        """Return the display label for this member, looked up by its integer value."""
        labels = ("Unknown", "SRAM", "DRAM", "On-chip Flash", "Off-chip Flash", "SHRAM", "Size")
        return labels[self.value]

    def identifier_name(self) -> str:
        """Return the lower-case identifier for this member, looked up by its integer value."""
        identifiers = ("unknown", "sram", "dram", "on_chip_flash", "off_chip_flash", "shram", "size")
        return identifiers[self.value]

    @staticmethod
    def all():
        """Return a tuple of every member except ``Unknown`` and ``Size``."""
        return (
            MemArea.Sram,
            MemArea.Dram,
            MemArea.OnChipFlash,
            MemArea.OffChipFlash,
            MemArea.Shram,
        )

    def __str__(self):
        """Return the member name."""
        return self.name

class TensorPurpose(enum.IntFlag):
    """What a tensor is used for; ``Size`` is the value after the last purpose."""

    Unknown = 0
    Weights = 1
    FeatureMap = 2
    Scratch = 3
    ScratchFast = 4
    LUT = 5
    FSBias = 6
    Size = 7

    def display_name(self) -> str:
        """Return the display label for this member, looked up by its integer value."""
        labels = (
            "Unknown",
            "Weights",
            "FeatureMap",
            "Scratch",
            "ScratchFast",
            "LUT",
            "FastStorageBias",
            "Size",
        )
        return labels[self.value]

    def identifier_name(self) -> str:
        """Return the lower-case identifier for this member, looked up by its integer value."""
        identifiers = (
            "unknown",
            "weights",
            "feature_map",
            "scratch",
            "scratch_fast",
            "lut",
            "fast_storage_bias",
            "size",
        )
        return identifiers[self.value]

    @staticmethod
    def all():
        """Return a tuple holding ``Weights``, ``FeatureMap`` and ``FSBias`` only."""
        return (
            TensorPurpose.Weights,
            TensorPurpose.FeatureMap,
            TensorPurpose.FSBias,
        )

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

132

133

134

class TensorSubPurpose(enum.Enum):
    """Buffering scheme applied to a tensor."""

    Standard = 0
    DoubleBuffer = 1
    RollingBufferX = 2
    RollingBufferY = 3
    RollingBufferXY = 4

    def display_name(self) -> str:
        """Return the display label for this member, looked up by its integer value."""
        labels = ("Standard", "Double Buffer", "Rolling Buffer X", "Rolling Buffer Y", "Rolling Buffer XY")
        return labels[self.value]

    def identifier_name(self) -> str:
        """Return the lower-case identifier for this member, looked up by its integer value."""
        identifiers = ("standard", "double_buffer", "rolling_buffer_x", "rolling_buffer_y", "rolling_buffer_xy")
        return identifiers[self.value]

    @staticmethod
    def all():
        """Return a tuple of all five members in definition order."""
        # Iterating an Enum class yields its members in definition order
        return tuple(TensorSubPurpose)

class TensorFormat(enum.Flag):
    """Storage format of a tensor."""

    Unknown = 0
    WeightsCompressed = 1
    NHWC = 2
    NHCWB16 = 3

    def __str__(self):
        """Return the member name."""
        member_name = self.name
        return member_name

class TensorBlockTraversal(enum.Enum):
    """Block traversal order options for a tensor."""

    Default = 0
    DepthWise = 1
    DepthFirst = 2
    PartKernelFirst = 3

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

175

def shape_num_elements(shp: Shape) -> Optional[int]:
    """Return the product of all dimensions in ``shp``.

    Returns None when ``shp`` itself is None or when any dimension is None.
    An empty shape yields 1.
    """
    if shp is None:
        return None

    total = 1
    for dim in shp:
        if dim is None:
            # An undefined dimension makes the element count undefined
            return None
        total = total * dim
    return total

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

186

def shape_fully_defined(shp: Shape) -> bool:
    """Return True when ``shp`` is not None and none of its dimensions is None."""
    return shp is not None and all(dim is not None for dim in shp)

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

195

def shape_round_to_quantum(shp: Shape, quantum: Tuple) -> Shape:
    """Return a copy of ``shp`` with each defined dimension rounded via ``numeric_util.round_up``.

    Dimensions and quantums are paired from the end, so ``quantum`` may hold
    more entries than ``shp``. Dimensions that are None are left as None.
    """
    rounded = list(shp)

    # Walk from the last dimension backwards using negative indices, since
    # there may be more rounding quantums than shape elements
    for offset in range(1, len(shp) + 1):
        idx = -offset
        dim = rounded[idx]
        if dim is not None:
            rounded[idx] = numeric_util.round_up(dim, quantum[idx])
    return rounded

Louis Verhaard

2020-09-23 10:27:11 +0200

[diff] [blame]

205

@lru_cache(maxsize=None)
def create_equivalence_id(key) -> UUID:
    """Return a random UUID for ``key``.

    The result is memoised by ``lru_cache``, so repeated calls with an equal
    key return the same UUID. ``key`` is only used as the cache key.
    """
    new_id = uuid.uuid4()
    return new_id

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

211

class QuantizationParameters:
    """Quantisation parameters: value range, bit width, scale and zero point.

    ``scale_f32``, ``zero_point``, ``min`` and ``max`` may each be a scalar or a
    numpy array (see ``is_per_axis``).
    """

    __slots__ = "min", "max", "num_bits", "narrow_range", "scale_f32", "zero_point", "quant_min", "quant_max"

    def __init__(
        self,
        min: Union[float, np.ndarray, None] = None,
        max: Union[float, np.ndarray, None] = None,
        num_bits=None,
        narrow_range=None,
    ):
        self.min = min
        self.max = max

        self.num_bits = num_bits
        self.narrow_range = narrow_range

        # Not constructor arguments; callers assign these after construction
        self.scale_f32: Union[float, np.ndarray, None] = None
        self.zero_point: Union[int, np.ndarray, None] = None
        self.quant_min: Optional[float] = None
        self.quant_max: Optional[float] = None

    def __str__(self):
        return "<nng.QuantizationParameters min=%s max=%s, num_bits=%s, scale=%s, zero_point=%s>" % (
            self.min,
            self.max,
            self.num_bits,
            self.scale_f32,
            self.zero_point,
        )

    __repr__ = __str__

    def clone(self) -> "QuantizationParameters":
        """Return a new instance with every field copied by reference from this one."""
        res = QuantizationParameters()
        for attr in QuantizationParameters.__slots__:
            setattr(res, attr, getattr(self, attr))
        return res

    def dequantize(self, values):
        """Convert quantised ``values`` to float64.

        With a single scale and zero point the result is
        ``(values - zero_point) * scale_f32``. With per-axis parameters no
        scaling is applied and the quantised values are returned as float64.

        ``values`` must provide ``astype`` (e.g. an ``np.ndarray``).
        """
        # np.size also accepts plain Python scalars, which have no .size attribute
        if np.size(self.zero_point) == 1 and np.size(self.scale_f32) == 1:
            # same scale is used for all values
            return (values.astype(np.float64) - self.zero_point) * self.scale_f32

        # a different scale is used for different sets of values
        # this is not compatible with the format of depthwise weights,
        # where input is at index 3 (Output, Kh, Kw, Input)
        # return the quantized values (previously an uninitialised array of
        # the same shape was returned here)
        return values.astype(np.float64)

    def is_scaling_equal(self, other: Optional["QuantizationParameters"]) -> bool:
        """Return True when ``other`` has the same scale and zero point as this object."""
        # quantisation parameter scaling is not equal if 'other' is None because
        # it implies that the tensor it belongs to is not quantised. otherwise,
        # it depends upon whether the scale and zero point are equal
        if not isinstance(other, QuantizationParameters):
            return False

        # np.all collapses element-wise array comparisons to a single truth
        # value, so per-axis (array) parameters no longer raise ValueError
        same_scale = np.all(self.scale_f32 == other.scale_f32)
        same_zero_point = np.all(self.zero_point == other.zero_point)
        return bool(same_scale and same_zero_point)

    def is_valid(self) -> bool:
        """Return True when both a scale and a zero point have been set."""
        # quantisation parameters are considered valid if they have a scale and zero point
        # Identity tests are used because "None in (array, ...)" compares
        # element-wise and raises ValueError for multi-element arrays
        return self.scale_f32 is not None and self.zero_point is not None

    def is_per_axis(self) -> bool:
        """Returns True if either the scale, zero point, minimum or maximum values are arrays"""
        return any(isinstance(getattr(self, attr), np.ndarray) for attr in ("scale_f32", "zero_point", "min", "max"))

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

294

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

295

def create_const_tensor(
    name: str,
    shape: Shape,
    dtype: DataType,
    values: np.ndarray,
    value_dtype: np.dtype = None,
    purpose: TensorPurpose = TensorPurpose.Unknown,
    quantization: QuantizationParameters = None,
    quant_value_dtype: np.dtype = None,
):
    """Create a constant tensor together with the ``Op.Const`` operation that outputs it.

    The tensor is named ``name + "_0"`` and the operation is named ``name``.
    ``values`` is converted with ``np.array(values, dtype=value_dtype)``.
    ``quant_values`` is a view of the raw bytes of those values, interpreted
    as ``quant_value_dtype`` (``np.uint8`` when that argument is None).

    Returns the new tensor.
    """
    # Tensor
    const_tensor = Tensor(shape, dtype, name + "_0")
    const_tensor.purpose = purpose
    const_tensor.quantization = quantization
    const_tensor.values = np.array(values, dtype=value_dtype)

    # Test against None explicitly: np.dtype instances of unstructured types
    # can evaluate as falsy (their len() is 0), so a truthiness test would
    # silently replace a supplied dtype with uint8
    raw_dtype = np.uint8 if quant_value_dtype is None else quant_value_dtype
    const_tensor.quant_values = np.frombuffer(const_tensor.values.tobytes(), dtype=raw_dtype)

    # Operator
    const_op = Operation(Op.Const, name)
    const_op.set_output_tensor(const_tensor)
    const_op.set_ifm_ofm_shapes()
    return const_tensor

Jacob Bohlin

2020-09-11 10:04:15 +0200

[diff] [blame]

320

# class that keeps track of all tensor addresses in the different memory types

321

class TensorAddressMap:
    """Class-level registry of tensor addresses, keyed by equivalence id and memory type."""

    address_map: Dict = defaultdict(dict)  # dict (tens.equivalence_id -> dict (mem_type -> address))

    @classmethod
    def get_address_for_tens(cls, tens_id: UUID, mem_type: MemType) -> int:
        """Return the address stored for ``tens_id`` in ``mem_type``, or None if none is stored."""
        per_mem_type = cls.address_map[tens_id]
        return per_mem_type.get(mem_type)

    @classmethod
    def set_address_for_tens(cls, tens_id: UUID, mem_type: MemType, address: int):
        """Store ``address`` for ``tens_id`` in ``mem_type``.

        Asserts that a previously stored, non-None address is not replaced by a
        different non-None address.
        """
        per_mem_type = cls.address_map[tens_id]

        # Check previous address if there is one
        existing = per_mem_type.get(mem_type)
        if not (address is None or existing is None):
            assert existing == address, "Two different addresses cannot be assigned to the same tensor."

        # Set tensor's address for memory type
        per_mem_type[mem_type] = address

337

338

Louis Verhaard

6c74c3b

2020-12-17 13:54:09 +0100

[diff] [blame]

339

@total_ordering

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

class Tensor:

__slots__ = (

"shape",

"storage_shape",

"bandwidth_shape",

"dtype",

"name",

Fredrik Svedberg

8d0f489

2021-02-16 21:59:50 +0100

[diff] [blame]

347

"is_variable",

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

"ops",

"consumer_list",

"values",

"quant_values",

"compressed_values",

Tim Hall

f7e810a

2020-06-25 15:04:31 +0100

[diff] [blame]

353

"compressed_values_substream_offsets",

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

354

"mem_area",

Patrik Gustavsson

2020-05-27 09:15:11 +0200

[diff] [blame]

355

"mem_type",

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

"format",

"purpose",

"sub_purpose",

"alignment",

"weight_transpose_depthwise",

361

"storage_compression_scale",

362

"bandwidth_compression_scale",

363

"compression_scale_for_worst_weight_stream",

364

"weight_compression_scales",

365

"weight_compression_config",

Louis Verhaard

2020-09-23 10:27:11 +0200

[diff] [blame]

366

"value_id",

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

367

"storage_rounding_quantum",

368

"brick_size",

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

369

"quantization",

370

"weight_compressed_offsets",

371

"element_size_bytes",

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

372

"block_traversal",

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

373

"equivalence_id",

Dwight Lidman

a9390f7

2020-05-13 12:00:08 +0200

[diff] [blame]

374

"resampling_mode",

Patrik Gustavsson

ee99bb1

2021-04-08 09:04:00 +0200

[diff] [blame^]

375

"needs_linear_format",

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

376

)

377

AllocationQuantum = 16

378

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

379

def __init__(self, shape: Shape, dtype: DataType, name: str):
    """Initialise a tensor with the given shape, data type and name.

    ``storage_shape`` and ``bandwidth_shape`` start out as the same object as
    ``shape``. All other attributes receive the defaults assigned below.
    """
    # Basic description
    self.shape = self.storage_shape = self.bandwidth_shape = shape
    self.dtype = dtype
    self.name = name
    self.is_variable = False
    self.equivalence_id: UUID = uuid.uuid4()

    # Producing and consuming operations
    self.ops: List[Operation] = []
    self.consumer_list: List[Operation] = []

    # Values in their various representations
    self.values: Optional[np.ndarray] = None
    self.quant_values: Optional[np.ndarray] = None
    self.compressed_values: Optional[np.ndarray] = None
    self.compressed_values_substream_offsets: Optional[List] = None

    # Placement and classification
    self.mem_area: MemArea = MemArea.Unknown
    self.mem_type: MemType = MemType.Unknown
    self.format: TensorFormat = TensorFormat.Unknown
    self.purpose: TensorPurpose = TensorPurpose.Unknown
    self.sub_purpose: TensorSubPurpose = TensorSubPurpose.Standard
    self.alignment: int = Tensor.AllocationQuantum
    self.weight_transpose_depthwise: bool = False

    # Compression scales
    self.storage_compression_scale: float = 1.0
    self.bandwidth_compression_scale: float = 1.0
    self.compression_scale_for_worst_weight_stream: float = 1.0
    self.weight_compression_scales: Optional[np.ndarray] = None
    # if two tensors have the same weight_compression_config, then they have the same compressed values
    self.weight_compression_config = None
    # if two tensors have the same value_id, then they have the same values
    self.value_id: UUID = uuid.uuid4()
    self.weight_compressed_offsets: List = []

    # Rounding and element size
    self.storage_rounding_quantum: Tuple = (1, 1, 1, 1)
    self.brick_size: Tuple = (1, 1, 1, 1)
    self.element_size_bytes: int = 0

    # quantization parameters
    self.quantization: Optional[QuantizationParameters] = None
    self.block_traversal: TensorBlockTraversal = TensorBlockTraversal.Default
    self.resampling_mode: resampling_mode = resampling_mode.NONE

    self.needs_linear_format = True

Patrik Gustavsson

458a208

2020-08-13 13:41:05 +0200

[diff] [blame]

422

Jacob Bohlin

2020-09-11 10:04:15 +0200

[diff] [blame]

423

@property
def address(self) -> int:
    """Address held in ``TensorAddressMap`` for this tensor's equivalence id and current memory type."""
    tens_id = self.equivalence_id
    return TensorAddressMap.get_address_for_tens(tens_id, self.mem_type)

@address.setter
def address(self, address: int):
    """Record ``address`` in ``TensorAddressMap`` for this tensor's equivalence id and current memory type."""
    tens_id = self.equivalence_id
    TensorAddressMap.set_address_for_tens(tens_id, self.mem_type, address)

430

Patrik Gustavsson

2021-01-21 08:28:55 +0100

[diff] [blame]

431

@property
def is_standard_fm(self) -> bool:
    """True when the sub purpose is ``Standard`` and the purpose is ``FeatureMap``."""
    if not self.sub_purpose == TensorSubPurpose.Standard:
        return False
    return self.purpose == TensorPurpose.FeatureMap

434

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

435

def element_size(self) -> int:
    """Return the size of one element in bytes.

    An explicit non-zero ``element_size_bytes`` takes precedence. Otherwise the
    size is derived from the data type as ``size_in_bits() / 8``; this is a
    true division, so the derived value is not truncated to a whole number.
    """
    explicit_size = self.element_size_bytes
    if explicit_size != 0:
        return explicit_size
    return self.dtype.size_in_bits() / 8

439

Patrik Gustavsson

2020-11-04 12:43:50 +0100

[diff] [blame]

440

# Returns a copy, renamed to self.name + suffix

441

# The references to Operators will be empty when returned

442

# The copy is shallow, except that storage_shape, bandwidth_shape and quantization are duplicated

443

# For set_unique==True, a new equivalence_id will be set

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

444

def clone(self, suffix="_clone", set_unique: bool = False) -> "Tensor":
    """Return a shallow copy of this tensor named ``self.name + suffix``.

    The copy gets its own ``storage_shape`` and ``bandwidth_shape`` lists, a
    cloned ``quantization`` (when one is set) and empty ``ops`` and
    ``consumer_list``. When ``set_unique`` is true the copy also receives a
    fresh ``equivalence_id``.
    """
    duplicate = copy.copy(self)

    # Detach the copy from the operators of the original
    duplicate.ops = []
    duplicate.consumer_list = []
    duplicate.name += suffix

    # Give the copy its own mutable state
    duplicate.storage_shape = list(self.storage_shape)
    duplicate.bandwidth_shape = list(self.bandwidth_shape)
    source_quantization = self.quantization
    if source_quantization is not None:
        duplicate.quantization = source_quantization.clone()

    if set_unique:
        duplicate.equivalence_id = uuid.uuid4()

    return duplicate

458

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

459

def clone_into_fast_storage(self, arch) -> "Tensor":
    """Return a clone (suffix ``_fast_storage``) placed in ``arch.fast_storage_mem_area``.

    The clone's memory type is set to ``MemType.Scratch_fast``.
    """
    fast_copy = self.clone(suffix="_fast_storage")
    fast_copy.mem_type = MemType.Scratch_fast
    fast_copy.mem_area = arch.fast_storage_mem_area
    return fast_copy

464

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

465

def copy_compressed_weight_info(self, src_tens: "Tensor"):
    """Copy the compressed values and all related weight compression info from ``src_tens``.

    Each listed attribute is assigned by reference, including
    ``equivalence_id`` and ``value_id``.
    """
    copied_attributes = (
        "equivalence_id",
        "compressed_values",
        "compressed_values_substream_offsets",
        "storage_shape",
        "brick_size",
        "weight_compression_scales",
        "weight_compressed_offsets",
        "weight_transpose_depthwise",
        "compression_scale_for_worst_weight_stream",
        "storage_compression_scale",
        "bandwidth_compression_scale",
        "block_traversal",
        "weight_compression_config",
        "value_id",
    )
    for attr in copied_attributes:
        setattr(self, attr, getattr(src_tens, attr))

Louis Verhaard

2020-05-07 08:12:58 +0200

[diff] [blame]

481

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

482

def set_format(self, fmt: TensorFormat, arch):
    """Set the tensor format and derive the rounding quantum, brick size and shapes from it.

    The format is always recorded. For shapes with more than four dimensions
    nothing else is changed. Otherwise the rounding quantum and brick size are
    taken from ``arch`` for this format and trimmed to the last ``len(shape)``
    entries. If the shape is not None, the bandwidth and storage shapes are
    recomputed. For ``WeightsCompressed`` the three compression scales are
    set to 5/8.
    """
    self.format = fmt

    # A shape without a length (e.g. None) counts as zero dimensions
    try:
        rank = len(self.shape)
    except TypeError:
        rank = 0

    if rank > 4:
        return

    # Note that a rank of 0 makes the [-rank:] slice keep every entry
    self.storage_rounding_quantum = tuple(arch.storage_rounding_quantums[fmt][-rank:])
    self.brick_size = tuple(arch.brick_sizes[fmt][-rank:])

    if self.shape is None:
        return

    self.bandwidth_shape = shape_round_to_quantum(self.shape, self.brick_size)
    self.storage_shape = shape_round_to_quantum(self.shape, self.storage_rounding_quantum)

    if fmt == TensorFormat.WeightsCompressed:
        ratio = 5 / 8
        self.storage_compression_scale = ratio
        self.bandwidth_compression_scale = ratio
        self.compression_scale_for_worst_weight_stream = ratio

507

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

508

def storage_elements(self) -> int:
    """Return the number of elements in ``storage_shape``, or 0 when that count is undefined."""
    count = shape_num_elements(self.storage_shape)
    return 0 if count is None else count

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

514

def elements(self) -> int:
    """Return the number of elements in ``shape``, or 0 when that count is undefined."""
    count = shape_num_elements(self.shape)
    return 0 if count is None else count

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

520

def has_fully_defined_shape(self) -> bool:
    """Return the result of ``shape_fully_defined`` for this tensor's ``shape``."""
    fully_defined = shape_fully_defined(self.shape)
    return fully_defined

522

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

523

def storage_size(self, scale: float = 1.0) -> int:
    """Return the storage size in bytes, scaled by ``scale`` and rounded up to ``alignment``.

    A raw size of zero is replaced by 1 before rounding.
    """
    byte_count = self.storage_elements() * self.element_size() * scale
    if byte_count == 0:
        byte_count = 1  # force it to take up space
    whole_bytes = numeric_util.round_up_to_int(byte_count)
    return numeric_util.round_up(whole_bytes, self.alignment)

529

Patrik Gustavsson

2021-01-21 08:28:55 +0100

[diff] [blame]

530

def storage_size_for_shape(self, op_storage_shape: Shape) -> int:
    """Return the storage size in bytes for ``op_storage_shape``, rounded up to ``alignment``.

    An undefined or zero element count results in a raw size of 1 before rounding.
    """
    count = shape_num_elements(op_storage_shape) or 0
    byte_count = count * self.element_size()
    if byte_count == 0:
        byte_count = 1  # force it to take up space
    whole_bytes = numeric_util.round_up_to_int(byte_count)
    return numeric_util.round_up(whole_bytes, self.alignment)

538

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

539

def storage_size_for_sub_purpose(
    self, arch, sub_purpose: TensorSubPurpose, param_a: Optional[int] = None, param_b: Optional[int] = None
) -> int:
    """Return the storage size in bytes this tensor would need under ``sub_purpose``.

    The shape is obtained from ``storage_shape_for_sub_purpose``. Returns 0 when
    its element count is undefined; otherwise the size is rounded up to
    ``alignment``.
    """
    alt_shape = self.storage_shape_for_sub_purpose(sub_purpose, param_a, param_b)
    count = shape_num_elements(alt_shape)
    if count is None:
        return 0

    if sub_purpose == TensorSubPurpose.DoubleBuffer:
        byte_count = (
            count
            * self.element_size()
            * self.compression_scale_for_worst_weight_stream
            * arch.weight_estimation_scaling
        )
    else:
        # Rolling buffers are used for intermediate data in ifm streaming
        # These will all use the NHCWB16 format, and need to be aligned to 16 in the C-dimension
        last_dim = alt_shape[-1]
        if last_dim % 16 != 0:
            padded_shape = alt_shape[:-1] + [numeric_util.round_up(last_dim, 16)]
            count = shape_num_elements(padded_shape)

        byte_count = count * self.element_size() * self.storage_compression_scale

    whole_bytes = numeric_util.round_up_to_int(byte_count)
    return numeric_util.round_up(whole_bytes, self.alignment)

563

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

564

def storage_shape_for_sub_purpose(
    self, sub_purpose: TensorSubPurpose, param_a: Optional[int], param_b: Optional[int]
) -> Shape:
    """Return a new shape list describing the storage needed under ``sub_purpose``.

    DoubleBuffer starts from ``shape`` and caps the last dimension at
    ``param_a * 2``. All other sub purposes start from ``storage_shape``.
    The rolling buffer variants set dimension 0 to 1 and cap dimension 2
    and/or 1 with ``param_a`` / ``param_b``. Standard returns the copy unchanged.
    """
    if sub_purpose == TensorSubPurpose.DoubleBuffer:
        buffered = list(self.shape)
        assert len(buffered) >= 2
        assert param_a is not None
        buffered[-1] = min(buffered[-1], param_a * 2)
        return buffered

    result = list(self.storage_shape)
    if sub_purpose == TensorSubPurpose.Standard:
        return result

    if sub_purpose == TensorSubPurpose.RollingBufferX:
        assert len(result) == 4
        assert param_a is not None
        result[0] = 1
        result[2] = min(result[2], param_a)
    elif sub_purpose == TensorSubPurpose.RollingBufferY:
        assert len(result) == 4
        assert param_a is not None
        result[0] = 1
        result[1] = min(result[1], param_a)
    elif sub_purpose == TensorSubPurpose.RollingBufferXY:
        assert len(result) == 4
        assert param_a is not None
        assert param_b is not None
        result[0] = 1
        result[2] = min(result[2], param_a)
        result[1] = min(result[1], param_b)
    else:
        assert 0, "did not expect new sub purpose %s" % (sub_purpose,)

    return result

597

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

598

def set_new_sub_purpose(self, sub_purpose: TensorSubPurpose, param_a=None, param_b=None):
    """Switch the tensor to ``sub_purpose`` and update its storage shape.

    The storage shape is recomputed with ``storage_shape_for_sub_purpose``.
    For DoubleBuffer the storage compression scale is additionally replaced
    by ``compression_scale_for_worst_weight_stream``.

    :param sub_purpose: the new sub purpose
    :param param_a: forwarded to ``storage_shape_for_sub_purpose``
    :param param_b: forwarded to ``storage_shape_for_sub_purpose``
    """
    new_storage_shape = self.storage_shape_for_sub_purpose(sub_purpose, param_a, param_b)
    self.storage_shape = new_storage_shape
    self.sub_purpose = sub_purpose
    if sub_purpose != TensorSubPurpose.DoubleBuffer:
        return
    self.storage_compression_scale = self.compression_scale_for_worst_weight_stream

603

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

604

def bandwidth(self) -> float:
    """Return element count of ``bandwidth_shape`` times element size times
    ``bandwidth_compression_scale``, or 0 when the element count is None."""
    num_elems = shape_num_elements(self.bandwidth_shape)
    return 0 if num_elems is None else num_elems * self.element_size() * self.bandwidth_compression_scale

609

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

610

def consumers(self) -> List[Operation]:
    """Return ``consumer_list`` (the list object itself, not a copy)."""
    consuming_ops = self.consumer_list
    return consuming_ops

612

Patrik Gustavsson

2021-01-21 08:28:55 +0100

[diff] [blame]

613

def get_4D_storage_shape_for_shape(self, op_shape4D: Shape4D) -> Shape4D:
    """Round ``op_shape4D`` to this tensor's storage rounding quantum.

    :param op_shape4D: the 4D shape to round
    :return: a new Shape4D built from the rounded dimensions
    """
    # The rounding quantum is passed through full_shape(4, ..., 1) before use
    # (presumably to extend it to four entries - confirm against full_shape).
    quantum_4d = full_shape(4, list(self.storage_rounding_quantum), 1)
    rounded_dims = shape_round_to_quantum(op_shape4D.as_list(), quantum_4d)
    return Shape4D(rounded_dims)

616

617

def addresses_for_rolling_buffer(self, start_coord: Shape, end_coord: Shape, op_shape4D: Shape4D) -> Tuple:
    """Compute box sizes and corner addresses for the region start_coord..end_coord.

    :param start_coord: first coordinate of the region (indices 1 and 2 are
        used as the y and x positions)
    :param end_coord: end coordinate of the region
    :param op_shape4D: shape forwarded to the address calculation
    :return: ( box_height0, box_height1, box_width,
        [address_tl, address_tr, address_bl, address_br] ); addresses that are
        not needed are None
    :raises UnsupportedFeatureError: if the region extends past the x crossing
    """
    top_left = self.address_for_coordinate(start_coord, op_shape4D=op_shape4D) if self.storage_shape == [] else None
    if self.storage_shape == []:
        # Tensor without dimensions: a single 1x1 box at the start address.
        return (1, 1, 1, [top_left, None, None, None])

    if self.is_standard_fm:
        buffer_shape = self.get_4D_storage_shape_for_shape(op_shape4D)
    else:
        buffer_shape = Shape4D(self.storage_shape)

    start_y, start_x = start_coord[1], start_coord[2]

    # Next multiple of the buffer height/width after the start position,
    # limited to the end of the requested region.
    crossing_y = min(numeric_util.round_up(start_y + 1, buffer_shape.height), end_coord[1])
    crossing_x = min(numeric_util.round_up(start_x + 1, buffer_shape.width), end_coord[2])

    box_height0 = crossing_y - start_y
    box_width = crossing_x - start_x

    corners: List = [None, None, None, None]
    corners[0] = self.address_for_coordinate(start_coord, op_shape4D=op_shape4D)

    if end_coord[2] > crossing_x:
        corners[1] = self.address_for_coordinate(
            [start_coord[0], start_coord[1], crossing_x, start_coord[3]], op_shape4D=op_shape4D
        )
        raise UnsupportedFeatureError("Striping in vertical direction is not supported")

    passes_crossing_y = end_coord[1] > crossing_y
    if passes_crossing_y:
        corners[2] = self.address_for_coordinate(
            [start_coord[0], crossing_y, start_coord[2], start_coord[3]], op_shape4D=op_shape4D
        )
    if passes_crossing_y and end_coord[2] > crossing_x:
        corners[3] = self.address_for_coordinate(
            [start_coord[0], crossing_y, crossing_x, start_coord[3]], op_shape4D=op_shape4D
        )

    # box_height0 is reported for both height entries.
    return box_height0, box_height0, box_width, corners

660

Patrik Gustavsson

2021-01-21 08:28:55 +0100

[diff] [blame]

661

def address_for_coordinate(self, coord: Shape, is_top_box: bool = False, op_shape4D: Shape4D = None) -> int:
    """Return the tensor's address plus the offset of ``coord``.

    :param coord: coordinate to locate
    :param is_top_box: forwarded to ``address_offset_for_coordinate``
    :param op_shape4D: forwarded to ``address_offset_for_coordinate``
    :return: ``self.address`` plus the computed offset
    """
    relative_offset = self.address_offset_for_coordinate(coord, is_top_box=is_top_box, op_shape4D=op_shape4D)
    # An offset of None is not acceptable here.
    assert relative_offset is not None
    return self.address + relative_offset

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

665

Patrik Gustavsson

2021-01-21 08:28:55 +0100

[diff] [blame]

666

def get_strides_and_coord(
    self, coord: Optional[Shape] = None, shape4D: Optional[Shape4D] = None
) -> Tuple[Optional[Shape], Optional[Shape]]:
    """Compute 5-entry strides and the matching 5-entry coordinate.

    :param coord: coordinate to convert; defaults to all zeros with one entry
        per storage dimension. Shorter coordinates are padded in front with
        zeros up to four entries.
    :param shape4D: when given and the tensor is a standard feature map, the
        strides are based on this shape rounded to the storage quantum
        instead of on ``storage_shape``
    :return: ``(strides, coordinate)``, or ``(None, None)`` for tensor formats
        other than NHWC and NHCWB16
    """
    if coord is None:
        coord = [0] * len(self.storage_shape)

    if shape4D and self.is_standard_fm:
        dims = self.get_4D_storage_shape_for_shape(shape4D).as_list()
    else:
        dims = full_shape(4, self.storage_shape, 1)

    missing = 4 - len(coord)
    if missing > 0:
        coord = [0] * missing + coord

    assert len(coord) == len(dims)

    fmt = self.format
    if fmt == TensorFormat.NHWC:
        # Move the last entry to position 1 and append a trailing unit entry.
        dims = [dims[0], dims[3]] + dims[1:3] + [1]
        coord = [coord[0], coord[3]] + coord[1:3] + [0]
    elif fmt == TensorFormat.NHCWB16:
        # The shape keeps its order; the coordinate's last entry is split
        # into (entry // 16) at position 1 and (entry % 16) at the end.
        dims = dims[0:4] + [1]
        block_index, index_in_block = divmod(coord[3], 16)
        coord = [coord[0], block_index] + coord[1:3] + [index_in_block]
        if dims[1] == 0:
            dims[1] = 1
    else:
        assert fmt in (TensorFormat.Unknown, TensorFormat.WeightsCompressed)
        return None, None

    strides: List = [0] * len(dims)
    unit = self.element_size() * self.storage_compression_scale

    if fmt != TensorFormat.NHCWB16:
        # Accumulate strides from the fastest-varying entry outwards.
        for axis in (4, 1, 3, 2, 0):
            strides[axis] = unit
            unit *= dims[axis]
    else:
        assert len(strides) == 5
        stride_x = 16 * unit  # STRIDE_X
        stride_c = stride_x * dims[2]  # STRIDE_C
        stride_y = dims[2] * dims[3] * unit  # STRIDE_Y
        stride_n = stride_y * dims[1]  # STRIDE_N
        strides = [stride_n, stride_c, stride_y, stride_x, unit]

    return strides, coord

721

Patrik Gustavsson

2021-01-21 08:28:55 +0100

[diff] [blame]

722

def get_strides(self, shape4D: Optional[Shape4D] = None) -> Shape:
    """Return only the strides from ``get_strides_and_coord``.

    :param shape4D: forwarded to ``get_strides_and_coord``
    :return: the strides; asserts that they are not None
    """
    byte_strides, _unused_coord = self.get_strides_and_coord(shape4D=shape4D)
    assert byte_strides is not None
    return byte_strides

726

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

727

def needs_dma(self) -> bool:
    """Return True when the tensor has exactly one entry in ``ops`` and that
    operation is of type ``Op.DMA``."""
    producers = self.ops
    if len(producers) != 1:
        return False
    return producers[0].type == Op.DMA

Louis Verhaard

2020-05-07 08:12:58 +0200

[diff] [blame]

729

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

730

def get_dma_src_tensor(self) -> "Optional[Tensor]":
    """Return the first input of the producing DMA operation, or None.

    For weight tensors that need DMA: returns the source tensor in Flash, else None.
    Note: for DMA ops, Pass.weight_tensor is referring to the SRAM weight tensor.
    """
    if not self.needs_dma():
        return None
    dma_op = self.ops[0]
    return dma_op.inputs[0]

734

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

735

def find_npu_op(self) -> Optional[Operation]:
    """Return the NPU operator that uses this tensor, excluding DMA operators.

    Consumers are checked in order. A DMA consumer delegates the search to
    its first output tensor, and that result is returned as is. Otherwise the
    first consumer with ``run_on_npu`` set is returned.

    :return: the operation found, or None
    """
    for consumer in self.consumers():
        if consumer.type == Op.DMA:
            # Look through the DMA at whatever consumes the copied tensor.
            copied_tensor = consumer.outputs[0]
            return copied_tensor.find_npu_op()
        if consumer.run_on_npu:
            return consumer
    return None

Louis Verhaard

2020-06-04 15:51:24 +0200

[diff] [blame]

743

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

744

def compressed_stream_index_from_coord(self, coord: Shape) -> int:
    """Map the last entry of ``coord`` to an index into the compressed streams.

    :param coord: coordinate whose last entry is the depth position
    :return: the depth divided by the brick depth, rounded up
    :raises UnsupportedFeatureError: if the depth is not a multiple of the
        brick depth and the index is not the final offset entry
    """
    assert self.format == TensorFormat.WeightsCompressed
    assert self.compressed_values is not None
    assert len(self.compressed_values) > 0
    assert len(self.compressed_values) + 1 == len(self.weight_compressed_offsets)

    depth = coord[-1]
    brick_depth = self.brick_size[-1]
    # Clamp position at final element index
    depth = min(depth, self.shape[-1])

    # Always round up to next boundary
    stream_index = numeric_util.round_up_divide(depth, brick_depth)

    # Check boundaries on all but last weight set (which may be shorter
    # than the brick we divided it up into).
    # There are no half-way points in the weights.
    is_final_offset = not (stream_index < len(self.weight_compressed_offsets) - 1)
    if not is_final_offset and (depth % brick_depth) != 0:
        raise UnsupportedFeatureError("Offset into weights must be aligned to a brick")

    return stream_index

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

768

def size_of_compressed_stream(self, index: int) -> int:
    """Return the length of the compressed stream at ``index``.

    :param index: position in ``compressed_values``; asserted to be in range
    """
    assert self.compressed_values is not None
    streams = self.compressed_values
    assert 0 <= index < len(streams)
    return len(streams[index])

772

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

773

def is_last_index_in_compressed_stream(self, index: int) -> bool:
    """Return True when ``index`` is the last position in ``compressed_values``.

    :param index: position in ``compressed_values``; asserted to be in range
    """
    assert self.compressed_values is not None
    stream_count = len(self.compressed_values)
    assert 0 <= index < stream_count
    return index == stream_count - 1

777

Patrik Gustavsson

2021-01-21 08:28:55 +0100

[diff] [blame]

778

def address_offset_for_coordinate(
    self, orig_coord: Shape, op_shape4D: Optional[Shape4D] = None, is_top_box: bool = False
) -> Optional[int]:
    """Compute the offset of ``orig_coord`` relative to the tensor's address.

    :param orig_coord: coordinate to locate
    :param op_shape4D: optional shape used for bounds checking and, for
        standard feature maps, for the storage shape and strides
    :param is_top_box: when True the coordinate is treated as an exclusive
        end: bounds become (0, dim] and, for uncompressed tensors, one is
        subtracted from every entry and one innermost stride is added back
    :return: the offset, 0 for a compressed tensor without offsets, or None
        when no strides are available for the tensor's format
    """
    offset = 0

    if self.sub_purpose == TensorSubPurpose.Standard:
        bounds = op_shape4D.as_list() if op_shape4D else self.shape
        for axis, value in enumerate(orig_coord):
            if is_top_box:
                assert 0 < value <= bounds[axis]
            else:
                assert 0 <= value < bounds[axis]

    if self.format == TensorFormat.WeightsCompressed:
        size_limit = self.storage_size()
        if len(self.weight_compressed_offsets) == 0:
            return 0

        if self.needs_dma() and self.sub_purpose == TensorSubPurpose.DoubleBuffer:
            depth = orig_coord[-1]
            brick_depth = self.brick_size[-1]
            # Clamp position at final element index
            depth = min(depth, self.shape[-1])

            # Always round up to next boundary; only the parity of the
            # resulting index is used.
            half = numeric_util.round_up_divide(depth, brick_depth) % 2
            assert self.compressed_values is not None

            streams = self.compressed_values
            end_of_buffer = is_top_box and half == 0
            if len(streams) <= 2:
                if end_of_buffer:
                    offset = sum(len(stream) for stream in streams)
                else:
                    offset = half * len(streams[0])
            else:
                if end_of_buffer:
                    offset = self.storage_shape[-1]
                else:
                    offset = half * (self.storage_shape[-1] // 2)
        else:
            stream_index = self.compressed_stream_index_from_coord(orig_coord)
            assert stream_index < len(self.weight_compressed_offsets)
            offset = self.weight_compressed_offsets[stream_index]
    else:
        coord = orig_coord
        if op_shape4D and self.is_standard_fm:
            wrap_shape = self.get_4D_storage_shape_for_shape(op_shape4D).as_list()
            size_limit = self.storage_size_for_shape(wrap_shape)
        else:
            wrap_shape = self.storage_shape
            # Keep only as many trailing entries as the storage shape has.
            coord = coord[-len(wrap_shape) :]
            size_limit = self.storage_size()

        if is_top_box:
            coord = [entry - 1 for entry in coord]

        # handle wraparound for partial buffers. make sure to do this after subtracting top box:
        coord = [entry % wrap_shape[axis] for axis, entry in enumerate(coord)]

        strides, strided_coord = self.get_strides_and_coord(coord, op_shape4D)
        if strides is None:
            return None

        if is_top_box:
            offset += 1 * strides[-1]  # one element

        offset += np.dot(strided_coord, strides)

    assert offset >= 0
    assert offset <= size_limit
    return offset

851

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

852

def is_allocated_in_tensor_arena(self, scratch_tensor_mem_area: MemArea) -> bool:
    """Return whether the tensor is in ``scratch_tensor_mem_area`` and its
    memory type is ``MemType.Scratch`` or ``MemType.Scratch_fast``.

    :param scratch_tensor_mem_area: memory area to compare ``mem_area`` against
    """
    in_scratch_area = self.mem_area == scratch_tensor_mem_area
    return in_scratch_area and (self.mem_type in (MemType.Scratch, MemType.Scratch_fast))

Patrik Gustavsson

2020-05-27 09:15:11 +0200

[diff] [blame]

854

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

855

def equivalent(self, tens: "Tensor") -> bool:
    """Return True when ``tens`` has the same ``equivalence_id`` as this tensor."""
    own_id = self.equivalence_id
    other_id = tens.equivalence_id
    return own_id == other_id

857

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

858

def set_all_shapes(self, shape: Shape):
    """Set ``shape``, ``storage_shape`` and ``bandwidth_shape`` to ``shape``.

    All three attributes refer to the same object afterwards; no copy is made.
    """
    # Chained assignment binds the targets left to right.
    self.shape = self.storage_shape = self.bandwidth_shape = shape

862

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

863

def get_full_shape(self) -> Shape:
    """Return the tensor shape expanded according to its number of dimensions.

    - 2 dimensions ``[a, b]`` become ``[a, 1, 1, b]``
    - 1 or 3 dimensions are passed through ``full_shape(4, shape, 1)``
    - any other shape is returned as a copy
    """
    rank = len(self.shape)
    if rank == 2:
        first, last = self.shape[0], self.shape[1]
        return [first, 1, 1, last]
    if rank in (1, 3):
        return full_shape(4, self.shape, 1)
    return self.shape.copy()

Michael McGeagh

2020-08-06 17:31:02 +0100

[diff] [blame]

871

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

872

def is_quantized(self) -> bool:
    """Return whether the tensor is quantized.

    A tensor is quantized if it has an integral type and it contains valid
    quantization params.
    """
    quant = self.quantization
    if isinstance(quant, QuantizationParameters):
        has_integral_type = (self.dtype.type & BaseType.Int) != 0
        return has_integral_type and self.quantization.is_valid()
    return False

Tim Hall

2020-09-09 21:58:15 +0100

[diff] [blame]

879

Louis Verhaard

6c74c3b

2020-12-17 13:54:09 +0100

[diff] [blame]

880

def __lt__(self, other: "Tensor") -> bool:
    """Order tensors by their ``equivalence_id``."""
    own_id, other_id = self.equivalence_id, other.equivalence_id
    return own_id < other_id

882

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

883

def __str__(self):
    """Return a short description with the tensor's name, shape and dtype."""
    template = "<nng.Tensor '%s' shape=%s dtype=%s>"
    fields = (self.name, self.shape, self.dtype)
    return template % fields

# repr() gives the same text as str().
__repr__ = __str__

Tim Hall

2020-09-09 21:58:15 +0100

[diff] [blame]

887

Michael McGeagh

2020-12-16 11:33:21 +0000

[diff] [blame]

888

def error(self, msg):
    """
    Raises a VelaError exception for errors encountered when parsing a Tensor

    The message names the tensor, then lists the operations in ``ops`` and in
    ``consumer_list`` with their index, type and ``op_index``.

    :param self: Tensor object that resulted in the error
    :param msg: str object that contains a description of the specific error encountered
    """

    def _describe(operators):
        # Entries without a "type" or "op_index" attribute get placeholder text.
        return [
            f" {position} = {getattr(entry, 'type', 'Not an Operation')} ({getattr(entry, 'op_index', '-')})"
            for position, entry in enumerate(operators)
        ]

    report = [
        f"Invalid {self.name} tensor. {msg}",
        " Driving operators:",
        *_describe(self.ops),
        " Consuming operators:",
        *_describe(self.consumer_list),
    ]

    raise VelaError("\n".join(report))

913

Tim Hall

2020-09-09 21:58:15 +0100

[diff] [blame]

914

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

915

def check_quantized_tens_scaling_equal(tens_a: Tensor, tens_b: Tensor) -> bool:

Tim Hall

2020-09-09 21:58:15 +0100

[diff] [blame]

916

# checks that the scaling of two quantized tensors are equal

917

Tim Hall