Blame - ethosu/vela/tensor.py - ml/ethos-u/ethos-u-vela

2020-04-27 18:20:16 +0100

[diff] [blame]

1

2

#

3

# SPDX-License-Identifier: Apache-2.0

4

#

5

# Licensed under the Apache License, Version 2.0 (the License); you may

6

# not use this file except in compliance with the License.

7

# You may obtain a copy of the License at

8

#

9

# www.apache.org/licenses/LICENSE-2.0

10

#

11

# Unless required by applicable law or agreed to in writing, software

12

# distributed under the License is distributed on an AS IS BASIS, WITHOUT

13

# WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.

14

# See the License for the specific language governing permissions and

15

# limitations under the License.

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

16

# Description:

17

# Internal representation of a Neural Network Tensor.

Patrik Gustavsson

2020-11-04 12:43:50 +0100

[diff] [blame]

18

import copy

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

19

import enum

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

20

import uuid

Jacob Bohlin

2020-09-11 10:04:15 +0200

[diff] [blame]

21

from collections import defaultdict

Diqing Zhong

f842b69

2020-12-11 13:07:37 +0100

[diff] [blame]

22

from enum import auto

Louis Verhaard

2020-09-23 10:27:11 +0200

[diff] [blame]

23

from functools import lru_cache

Louis Verhaard

6c74c3b

2020-12-17 13:54:09 +0100

[diff] [blame]

24

from functools import total_ordering

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

25

from typing import Dict

26

from typing import List

27

from typing import Optional

28

from typing import Tuple

29

from typing import Union

30

from uuid import UUID

Diego Russo

ea6111a

2020-04-14 18:41:58 +0100

[diff] [blame]

import numpy as np

from . import numeric_util

Tim Hall

2020-09-09 21:58:15 +0100

[diff] [blame]

35

from .data_type import BaseType

Michael McGeagh

2020-08-06 17:31:02 +0100

[diff] [blame]

36

from .data_type import DataType

Michael McGeagh

2020-12-16 11:33:21 +0000

[diff] [blame]

37

from .errors import UnsupportedFeatureError

38

from .errors import VelaError

Dwight Lidman

a9390f7

2020-05-13 12:00:08 +0200

[diff] [blame]

39

from .ethos_u55_regs.ethos_u55_regs import resampling_mode

Patrik Gustavsson

2020-12-01 16:02:29 +0100

[diff] [blame]

40

from .numeric_util import full_shape

Louis Verhaard

2020-09-30 09:01:52 +0200

[diff] [blame]

41

from .operation import Op

Michael McGeagh

2020-08-06 17:31:02 +0100

[diff] [blame]

42

from .operation import Operation

patrik.gustavsson

2020-12-21 17:10:40 +0000

[diff] [blame]

43

from .shape4d import Shape4D

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

44

45

Shape = List

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

46

47

Patrik Gustavsson

2020-05-27 09:15:11 +0200

[diff] [blame]

48

class MemType(enum.IntFlag):
    """Kind of memory a tensor is placed in."""

    Unknown = 0
    Permanent_NPU = 1
    Permanent_CPU = 2
    Scratch = 3
    Scratch_fast = 4
    Size = Scratch_fast + 1

    def display_name(self) -> str:
        """Return the human-readable name, looked up by the member's integer value."""
        labels = ("Unknown", "Permanent_NPU", "Permanent_CPU", "Scratch", "Scratch_fast", "Size")
        return labels[self.value]

    def identifier_name(self) -> str:
        """Return the lower-case identifier form of the name, looked up by the member's integer value."""
        idents = ("unknown", "permanent_npu", "permanent_cpu", "scratch", "scratch_fast", "size")
        return idents[self.value]

    @staticmethod
    def all():
        """Return the concrete memory types (excludes Unknown and Size)."""
        members = (MemType.Permanent_NPU, MemType.Permanent_CPU, MemType.Scratch, MemType.Scratch_fast)
        return members

    def __str__(self):
        return self.name

Diqing Zhong

2020-12-11 13:07:37 +0100

[diff] [blame]

70

class BandwidthDirection(enum.IntEnum):
    """Direction of a memory transfer."""

    Read = 0
    Write = auto()
    Size = auto()

    def display_name(self):
        """Return the member name unchanged."""
        label = self.name
        return label

    def identifier_name(self):
        """Return the member name in lower case."""
        label = self.name
        return label.lower()

    @staticmethod
    def all():
        """Return the real directions (excludes Size)."""
        directions = (BandwidthDirection.Read, BandwidthDirection.Write)
        return directions

84

85

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

86

class MemArea(enum.IntFlag):
    """Physical memory area a tensor can live in."""

    Unknown = 0
    Sram = 1
    Dram = 2
    OnChipFlash = 3
    OffChipFlash = 4
    Shram = 5  # for LUT
    Size = Shram + 1

    def display_name(self) -> str:
        """Return the human-readable name, looked up by the member's integer value."""
        labels = ("Unknown", "SRAM", "DRAM", "On-chip Flash", "Off-chip Flash", "SHRAM", "Size")
        return labels[self.value]

    def identifier_name(self) -> str:
        """Return the lower-case identifier form of the name, looked up by the member's integer value."""
        idents = ("unknown", "sram", "dram", "on_chip_flash", "off_chip_flash", "shram", "size")
        return idents[self.value]

    @staticmethod
    def all():
        """Return the concrete memory areas (excludes Unknown and Size)."""
        areas = (MemArea.Sram, MemArea.Dram, MemArea.OnChipFlash, MemArea.OffChipFlash, MemArea.Shram)
        return areas

    def __str__(self):
        return self.name

class TensorPurpose(enum.IntFlag):
    """What a tensor is used for."""

    Unknown = 0
    Weights = 1
    FeatureMap = 2
    Scratch = 3
    ScratchFast = 4
    LUT = 5
    FSBias = 6
    Size = 7

    def display_name(self) -> str:
        """Return the human-readable name, looked up by the member's integer value."""
        labels = ("Unknown", "Weights", "FeatureMap", "Scratch", "ScratchFast", "LUT", "FastStorageBias", "Size")
        return labels[self.value]

    def identifier_name(self) -> str:
        """Return the lower-case identifier form of the name, looked up by the member's integer value."""
        idents = ("unknown", "weights", "feature_map", "scratch", "scratch_fast", "lut", "fast_storage_bias", "size")
        return idents[self.value]

    @staticmethod
    def all():
        """Return the purposes Weights, FeatureMap and FSBias."""
        purposes = (TensorPurpose.Weights, TensorPurpose.FeatureMap, TensorPurpose.FSBias)
        return purposes

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

132

133

134

class TensorSubPurpose(enum.Enum):
    """Buffering scheme applied to a tensor."""

    Standard = 0
    DoubleBuffer = 1
    RollingBufferX = 2
    RollingBufferY = 3
    RollingBufferXY = 4

    def display_name(self) -> str:
        """Return the human-readable name, looked up by the member's integer value."""
        labels = ("Standard", "Double Buffer", "Rolling Buffer X", "Rolling Buffer Y", "Rolling Buffer XY")
        return labels[self.value]

    def identifier_name(self) -> str:
        """Return the lower-case identifier form of the name, looked up by the member's integer value."""
        idents = ("standard", "double_buffer", "rolling_buffer_x", "rolling_buffer_y", "rolling_buffer_xy")
        return idents[self.value]

    @staticmethod
    def all():
        """Return every sub purpose, in definition order."""
        # The enum has no aliases, so iterating it yields exactly the five members in declaration order
        return tuple(TensorSubPurpose)

class TensorFormat(enum.Flag):
    """Storage format of a tensor."""

    Unknown = 0
    WeightsCompressed = 1
    NHWC = 2
    NHCWB16 = 3

    def __str__(self):
        # Print just the member name rather than the default "TensorFormat.<name>"
        member_name = self.name
        return member_name

class TensorBlockTraversal(enum.Enum):
    """Block traversal order recorded on a tensor (see Tensor.block_traversal)."""

    # Value a new Tensor starts with
    Default = 0
    DepthWise = 1
    DepthFirst = 2
    PartKernelFirst = 3

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

175

def shape_num_elements(shp: Shape) -> Optional[int]:
    """Return the product of all dimensions in shp.

    Returns None when shp itself is None or when any dimension is None.
    An empty shape yields 1.
    """
    if shp is None:
        return None
    total = 1
    for dim in shp:
        if dim is None:
            return None
        total *= dim
    return total

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

186

def shape_fully_defined(shp: Shape) -> bool:
    """Return True when shp is not None and none of its dimensions is None."""
    return shp is not None and all(dim is not None for dim in shp)

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

195

def shape_round_to_quantum(shp: Shape, quantum: Tuple) -> Shape:
    """Return a copy of shp with every known dimension rounded up to its quantum.

    Dimensions and quantums are matched from the end, because quantum may hold
    more entries than shp has dimensions. Dimensions that are None are kept.
    """
    rounded = list(shp)

    # Walk from the last dimension towards the first so trailing entries line up
    for offset in range(1, len(shp) + 1):
        dim = rounded[-offset]
        if dim is not None:
            rounded[-offset] = numeric_util.round_up(dim, quantum[-offset])
    return rounded

Louis Verhaard

2020-09-23 10:27:11 +0200

[diff] [blame]

205

@lru_cache(maxsize=None)
def create_equivalence_id(key) -> UUID:
    """Return a random UUID for key.

    The result is memoised without bound, so repeated calls with an equal
    (hashable) key return the same UUID.
    """
    fresh_id = uuid.uuid4()
    return fresh_id

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

211

class QuantizationParameters:
    """Quantization settings of a tensor: value range, bit width, scale and zero point.

    scale_f32, zero_point, min and max may each be a scalar or a numpy array;
    is_per_axis() reports whether any of them is an array.
    """

    __slots__ = "min", "max", "num_bits", "narrow_range", "scale_f32", "zero_point", "quant_min", "quant_max"

    def __init__(
        self,
        min: Union[float, np.ndarray, None] = None,
        max: Union[float, np.ndarray, None] = None,
        num_bits=None,
        narrow_range=None,
    ):
        self.min = min
        self.max = max

        self.num_bits = num_bits
        self.narrow_range = narrow_range

        self.scale_f32: Union[float, np.ndarray, None] = None
        self.zero_point: Union[int, np.ndarray, None] = None
        self.quant_min: Optional[float] = None
        self.quant_max: Optional[float] = None

    def __str__(self):
        return "<nng.QuantizationParameters min=%s max=%s, num_bits=%s, scale=%s, zero_point=%s>" % (
            self.min,
            self.max,
            self.num_bits,
            self.scale_f32,
            self.zero_point,
        )

    __repr__ = __str__

    def clone(self) -> "QuantizationParameters":
        """Return a new object with every field copied by reference (arrays are shared, not duplicated)."""
        res = QuantizationParameters()
        res.min = self.min
        res.max = self.max

        res.num_bits = self.num_bits
        res.narrow_range = self.narrow_range

        res.scale_f32 = self.scale_f32
        res.zero_point = self.zero_point
        res.quant_min = self.quant_min
        res.quant_max = self.quant_max
        return res

    def dequantize(self, values):
        """Convert quantized values to float64.

        With a single scale and zero point the result is
        (values - zero_point) * scale_f32. With per-axis parameters no scaling
        is applied and the quantized values are returned as float64.
        """
        values_as_float = values.astype(np.float64)
        if np.size(self.zero_point) == 1 and np.size(self.scale_f32) == 1:
            # same scale is used for all values
            return (values_as_float - self.zero_point) * self.scale_f32

        # a different scale is used for different sets of values
        # this is not compatible with the format of depthwise weights,
        # where input is at index 3 (Output, Kh, Kw, Input)
        # return the quantized values (previously an uninitialised array was returned here)
        return values_as_float

    @staticmethod
    def _all_equal(lhs, rhs) -> bool:
        # Element-wise comparison reduced to one bool, so array operands do not raise an
        # "ambiguous truth value" error the way a bare `lhs == rhs` in a boolean context does
        return bool(np.all(lhs == rhs))

    def is_scaling_equal(self, other: Optional["QuantizationParameters"]) -> bool:
        """Return True when other has the same scale and zero point as self.

        Scaling is never equal when other is not a QuantizationParameters
        (e.g. None), because that implies the tensor it belongs to is not
        quantised.
        """
        if not isinstance(other, QuantizationParameters):
            return False

        return self._all_equal(self.scale_f32, other.scale_f32) and self._all_equal(
            self.zero_point, other.zero_point
        )

    def is_valid(self) -> bool:
        """Return True when both a scale and a zero point are set."""
        # Identity checks keep this safe for numpy arrays; `None in (array, ...)` raises for multi-element arrays
        return self.scale_f32 is not None and self.zero_point is not None

    def is_per_axis(self) -> bool:
        """Returns True if either the scale, zero point, minimum or maximum values are arrays"""
        return any(
            isinstance(getattr(self, attr), np.ndarray) for attr in ("scale_f32", "zero_point", "min", "max")
        )

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

294

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

295

def create_const_tensor(
    name: str,
    shape: Shape,
    dtype: DataType,
    values: np.ndarray,
    value_dtype: np.dtype = None,
    purpose: TensorPurpose = TensorPurpose.Unknown,
    quantization: QuantizationParameters = None,
):
    """Create a constant tensor and the Const operation that produces it.

    The tensor is named name + "_0" and the operation is named name.
    values is converted to a numpy array of value_dtype; quant_values holds
    the same data reinterpreted as a flat uint8 byte array.
    Returns the new tensor.
    """
    # Tensor
    tens = Tensor(shape, dtype, name + "_0")
    tens.purpose = purpose
    tens.quantization = quantization
    tens.values = np.array(values, dtype=value_dtype)
    raw_bytes = tens.values.tobytes()
    tens.quant_values = np.frombuffer(raw_bytes, dtype=np.uint8)

    # Operator
    op = Operation(Op.Const, name)
    op.set_output_tensor(tens)
    op.set_ifm_ofm_shapes()
    return tens

def create_reshape_tensor(tens, shape, ifm_reshape=True):
    """Return a reshaped clone of tens, connected to tens through a Reshape operation.

    When shape already equals tens.shape, tens itself is returned and nothing
    is created. With ifm_reshape=True the Reshape takes tens as input and
    outputs the clone; otherwise the clone is the input and tens the output.
    The clone is returned in both cases.
    """
    if shape == tens.shape:
        return tens

    # Tensors
    name = tens.name + "_reshape"
    reshaped = tens.clone("_reshaped")
    reshaped.set_all_shapes(shape)
    if ifm_reshape:
        op_input, op_output = tens, reshaped
    else:
        op_input, op_output = reshaped, tens

    # Operator
    reshape_op = Operation(Op.Reshape, name)
    reshape_op.attrs["new_shape"] = shape
    reshape_op.add_input_tensor(op_input)
    shape_tens = create_const_tensor(name + "_shape", [1], DataType.int32, shape)
    reshape_op.add_input_tensor(shape_tens)
    reshape_op.set_output_tensor(op_output)
    reshape_op.set_ifm_ofm_shapes()
    return reshaped

335

336

Jacob Bohlin

2020-09-11 10:04:15 +0200

[diff] [blame]

337

# class that keeps track of all tensor addresses in the different memory types

338

class TensorAddressMap:
    """Class-level registry of tensor addresses, keyed by equivalence id and memory type."""

    address_map: Dict = defaultdict(dict)  # dict (tens.equivalence_id -> dict (mem_type -> address))

    @classmethod
    def get_address_for_tens(cls, tens_id: UUID, mem_type: "MemType") -> Optional[int]:
        """Return the address stored for (tens_id, mem_type), or None when none has been set."""
        # Use .get() on the outer map: indexing the defaultdict would insert an
        # empty entry for every tensor that is merely queried
        per_tensor = cls.address_map.get(tens_id)
        if per_tensor is None:
            return None
        return per_tensor.get(mem_type)

    @classmethod
    def set_address_for_tens(cls, tens_id: UUID, mem_type: "MemType", address: int):
        """Store address for (tens_id, mem_type).

        Asserts that an address already stored for the same key is not replaced
        by a different one. Passing None as address skips that check.
        """
        # Check previous address if there is one
        previous_address = cls.address_map[tens_id].get(mem_type)
        if address is not None and previous_address is not None:
            assert previous_address == address, "Two different addresses cannot be assigned to the same tensor."

        # Set tensor's address for memory type
        cls.address_map[tens_id][mem_type] = address

354

355

Louis Verhaard

6c74c3b

2020-12-17 13:54:09 +0100

[diff] [blame]

356

@total_ordering

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

class Tensor:

__slots__ = (

"shape",

"storage_shape",

"bandwidth_shape",

"dtype",

"name",

"ops",

"consumer_list",

"values",

"quant_values",

"compressed_values",

Tim Hall

f7e810a

2020-06-25 15:04:31 +0100

[diff] [blame]

369

"compressed_values_substream_offsets",

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

370

"mem_area",

Patrik Gustavsson

2020-05-27 09:15:11 +0200

[diff] [blame]

371

"mem_type",

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

"format",

"purpose",

"sub_purpose",

"alignment",

"weight_transpose_depthwise",

377

"storage_compression_scale",

378

"bandwidth_compression_scale",

379

"compression_scale_for_worst_weight_stream",

380

"weight_compression_scales",

381

"weight_compression_config",

Louis Verhaard

2020-09-23 10:27:11 +0200

[diff] [blame]

382

"value_id",

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

383

"storage_rounding_quantum",

384

"brick_size",

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

385

"quantization",

386

"weight_compressed_offsets",

387

"element_size_bytes",

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

388

"block_traversal",

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

389

"equivalence_id",

Dwight Lidman

a9390f7

2020-05-13 12:00:08 +0200

[diff] [blame]

390

"resampling_mode",

Patrik Gustavsson

458a208

2020-08-13 13:41:05 +0200

[diff] [blame]

391

"avoid_NHCWB16",

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

392

)

393

AllocationQuantum = 16

394

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

395

def __init__(self, shape: Shape, dtype: DataType, name: str):
    """Create a tensor with the given shape, data type and name.

    All other attributes start at their defaults: no values, unknown memory
    area/type/format/purpose, no quantization, and compression scales of 1.0.
    """
    # shape, storage_shape and bandwidth_shape initially refer to the same object
    self.shape = shape
    self.storage_shape = shape
    self.bandwidth_shape = shape
    self.dtype = dtype
    self.name = name
    # Key used by TensorAddressMap (see the address property)
    self.equivalence_id: UUID = uuid.uuid4()

    self.ops: List[Operation] = []
    self.consumer_list: List[Operation] = []

    self.values: Optional[np.ndarray] = None
    self.quant_values: Optional[np.ndarray] = None
    self.compressed_values: Optional[np.ndarray] = None
    self.compressed_values_substream_offsets: Optional[List] = None
    self.mem_area: MemArea = MemArea.Unknown
    self.mem_type: MemType = MemType.Unknown
    self.format: TensorFormat = TensorFormat.Unknown
    self.purpose: TensorPurpose = TensorPurpose.Unknown
    self.sub_purpose: TensorSubPurpose = TensorSubPurpose.Standard
    self.alignment: int = Tensor.AllocationQuantum
    self.weight_transpose_depthwise: bool = False

    self.storage_compression_scale: float = 1.0
    self.bandwidth_compression_scale: float = 1.0
    self.compression_scale_for_worst_weight_stream: float = 1.0
    self.weight_compression_scales: Optional[np.ndarray] = None
    # if two tensors have the same weight_compression_config, then they have the same compressed values
    self.weight_compression_config = None
    # if two tensors have the same value_id, then they have the same values
    self.value_id: UUID = uuid.uuid4()
    self.weight_compressed_offsets: List = []
    self.storage_rounding_quantum: Tuple = (1, 1, 1, 1)
    self.brick_size: Tuple = (1, 1, 1, 1)
    # 0 means "not set"; element_size() then derives the size from dtype
    self.element_size_bytes: int = 0

    # quantization parameters
    self.quantization: Optional[QuantizationParameters] = None
    self.block_traversal: TensorBlockTraversal = TensorBlockTraversal.Default
    self.resampling_mode: resampling_mode = resampling_mode.NONE

    self.avoid_NHCWB16: bool = False

Patrik Gustavsson

458a208

2020-08-13 13:41:05 +0200

[diff] [blame]

437

Jacob Bohlin

2020-09-11 10:04:15 +0200

[diff] [blame]

438

@property
def address(self) -> int:
    """Address registered in TensorAddressMap for this tensor's equivalence id and memory type."""
    key, mem = self.equivalence_id, self.mem_type
    return TensorAddressMap.get_address_for_tens(key, mem)

@address.setter
def address(self, address: int):
    # Stored in the shared TensorAddressMap, keyed by equivalence id and memory type
    key, mem = self.equivalence_id, self.mem_type
    TensorAddressMap.set_address_for_tens(key, mem, address)

445

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

446

def element_size(self) -> int:
    """Return the size of one element in bytes.

    An explicitly set element_size_bytes wins; otherwise the size is the
    dtype's bit width divided by 8 (true division, so the result is a float).
    """
    explicit_size = self.element_size_bytes
    if explicit_size != 0:
        return explicit_size
    return self.dtype.size_in_bits() / 8

450

Patrik Gustavsson

2020-11-04 12:43:50 +0100

[diff] [blame]

451

# Returns a copy, renamed to self.name + suffix
# The references to Operators will be empty when returned
# Depending on set_unique, the copy is shallow, or deep
# For set_unique==True, a new equivalence_id will be set
def clone(self, suffix="_clone", set_unique: bool = False) -> "Tensor":
    """Return a copy of this tensor named self.name + suffix, with empty ops and consumer_list.

    set_unique=False: shallow copy, except that storage_shape and
    bandwidth_shape become new lists and quantization is cloned.
    set_unique=True: deep copy of the tensor's data with a fresh equivalence_id.
    """
    # Detach the graph links on a shallow copy first, so that the deep copy
    # below only duplicates the tensor's own data and never walks into the
    # producing/consuming operations (and through them the rest of the graph)
    res = copy.copy(self)
    res.ops = []
    res.consumer_list = []

    if set_unique:
        res = copy.deepcopy(res)
        res.equivalence_id = uuid.uuid4()
    else:
        res.storage_shape = list(self.storage_shape)
        res.bandwidth_shape = list(self.bandwidth_shape)
        if self.quantization is not None:
            res.quantization = self.quantization.clone()

    res.name = res.name + suffix
    return res

471

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

472

def clone_into_fast_storage(self, arch) -> "Tensor":
    """Return a clone (suffix "_fast_storage") placed in arch's fast storage area as Scratch_fast memory."""
    fast_copy = self.clone(suffix="_fast_storage")
    fast_copy.mem_type = MemType.Scratch_fast
    fast_copy.mem_area = arch.fast_storage_mem_area
    return fast_copy

477

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

478

def copy_compressed_weight_info(self, src_tens: "Tensor"):
    """Copy the compressed values and all related weight compression info from src_tens.

    Values are copied by reference, and equivalence_id and value_id are taken
    over as well.
    """
    copied_attrs = (
        "equivalence_id",
        "compressed_values",
        "compressed_values_substream_offsets",
        "storage_shape",
        "brick_size",
        "weight_compression_scales",
        "weight_compressed_offsets",
        "weight_transpose_depthwise",
        "compression_scale_for_worst_weight_stream",
        "storage_compression_scale",
        "bandwidth_compression_scale",
        "block_traversal",
        "weight_compression_config",
        "value_id",
    )
    for attr in copied_attrs:
        setattr(self, attr, getattr(src_tens, attr))

Louis Verhaard

2020-05-07 08:12:58 +0200

[diff] [blame]

494

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

495

def set_format(self, fmt: TensorFormat, arch):
    """Set the tensor format and derive rounding quantum, brick size and rounded shapes from arch.

    Only the format is updated when the shape has more than 4 dimensions.
    The shapes are left untouched when self.shape is None.
    """
    self.format = fmt

    # A shape without a length (e.g. None) counts as zero dimensions
    try:
        rank = len(self.shape)
    except TypeError:
        rank = 0

    if rank > 4:
        return

    # Keep only the trailing entries that correspond to this tensor's dimensions
    quantum = arch.storage_rounding_quantums[self.format]
    self.storage_rounding_quantum = tuple(quantum[-rank:])
    brick = arch.brick_sizes[self.format]
    self.brick_size = tuple(brick[-rank:])

    if self.shape is None:
        return

    self.bandwidth_shape = shape_round_to_quantum(self.shape, self.brick_size)
    self.storage_shape = shape_round_to_quantum(self.shape, self.storage_rounding_quantum)

    if fmt == TensorFormat.WeightsCompressed:
        # Fixed initial compression ratio applied to all three scales
        ratio = 5 / 8
        self.storage_compression_scale = ratio
        self.bandwidth_compression_scale = ratio
        self.compression_scale_for_worst_weight_stream = ratio

520

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

521

def storage_elements(self) -> int:
    """Return the number of elements in storage_shape, or 0 when it is not fully defined."""
    count = shape_num_elements(self.storage_shape)
    return 0 if count is None else count

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

527

def elements(self) -> int:
    """Return the number of elements in shape, or 0 when it is not fully defined."""
    count = shape_num_elements(self.shape)
    return 0 if count is None else count

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

533

def has_fully_defined_shape(self) -> bool:
    """Return True when shape is set and contains no None dimension."""
    fully_defined = shape_fully_defined(self.shape)
    return fully_defined

535

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

536

def storage_size(self, scale: float = 1.0) -> int:
    """Return the storage size in bytes, scaled by scale and rounded up to the tensor's alignment.

    A size of zero is bumped to 1 so the tensor always takes up space.
    """
    size = self.storage_elements() * self.element_size() * scale
    if size == 0:
        size = 1  # force it to take up space
    whole_bytes = numeric_util.round_up_to_int(size)
    return numeric_util.round_up(whole_bytes, self.alignment)

542

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

543

def storage_size_for_sub_purpose(
    self, arch, sub_purpose: TensorSubPurpose, param_a: Optional[int] = None, param_b: Optional[int] = None
) -> int:
    """Return the aligned storage size in bytes the tensor would need for sub_purpose.

    Returns 0 when the resulting shape is not fully defined.
    """
    alt_shape = self.storage_shape_for_sub_purpose(sub_purpose, param_a, param_b)
    num_elems = shape_num_elements(alt_shape)
    if num_elems is None:
        return 0

    if sub_purpose == TensorSubPurpose.DoubleBuffer:
        worst_case_scale = self.compression_scale_for_worst_weight_stream * arch.weight_estimation_scaling
        size = num_elems * self.element_size() * worst_case_scale
    else:
        # Rolling buffers are used for intermediate data in ifm streaming
        # These will all use the NHCWB16 format, and need to be aligned to 16 in the C-dimension
        depth = alt_shape[-1]
        if depth % 16 != 0:
            padded_shape = alt_shape[0:-1] + [numeric_util.round_up(depth, 16)]
            num_elems = shape_num_elements(padded_shape)

        size = num_elems * self.element_size() * self.storage_compression_scale

    whole_bytes = numeric_util.round_up_to_int(size)
    return numeric_util.round_up(whole_bytes, self.alignment)

567

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

568

def storage_shape_for_sub_purpose(
    self, sub_purpose: TensorSubPurpose, param_a: Optional[int], param_b: Optional[int]
) -> Shape:
    """Return the storage shape the tensor would have for sub_purpose.

    DoubleBuffer starts from shape and caps the last dimension at 2 * param_a.
    The rolling buffer variants start from storage_shape, set dimension 0 to 1
    and cap dimension 2 (X) and/or dimension 1 (Y) with param_a / param_b.
    Standard returns a copy of storage_shape.
    """
    if sub_purpose == TensorSubPurpose.DoubleBuffer:
        buf_shape = list(self.shape)
        assert len(buf_shape) >= 2
        assert param_a is not None
        buf_shape[-1] = min(buf_shape[-1], param_a * 2)
        return buf_shape

    buf_shape = list(self.storage_shape)
    if sub_purpose == TensorSubPurpose.RollingBufferX:
        assert len(buf_shape) == 4
        assert param_a is not None
        buf_shape[0] = 1
        buf_shape[2] = min(buf_shape[2], param_a)
    elif sub_purpose == TensorSubPurpose.RollingBufferY:
        assert len(buf_shape) == 4
        assert param_a is not None
        buf_shape[0] = 1
        buf_shape[1] = min(buf_shape[1], param_a)
    elif sub_purpose == TensorSubPurpose.RollingBufferXY:
        assert len(buf_shape) == 4
        assert param_a is not None
        assert param_b is not None
        buf_shape[0] = 1
        buf_shape[2] = min(buf_shape[2], param_a)
        buf_shape[1] = min(buf_shape[1], param_b)
    elif sub_purpose != TensorSubPurpose.Standard:
        # Standard needs no adjustment; anything else is unexpected
        assert 0, "did not expect new sub purpose %s" % (sub_purpose,)

    return buf_shape

601

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

602

def set_new_sub_purpose(self, sub_purpose: TensorSubPurpose, param_a=None, param_b=None):
    """
    Switches this tensor to the given sub purpose and updates its storage shape accordingly

    :param sub_purpose: TensorSubPurpose to switch to
    :param param_a: forwarded to storage_shape_for_sub_purpose
    :param param_b: forwarded to storage_shape_for_sub_purpose
    """
    # Compute the new shape first, so that nothing is modified if the computation fails
    updated_storage_shape = self.storage_shape_for_sub_purpose(sub_purpose, param_a, param_b)
    self.storage_shape = updated_storage_shape
    self.sub_purpose = sub_purpose

    double_buffered = sub_purpose == TensorSubPurpose.DoubleBuffer
    if double_buffered:
        # Double buffered tensors use the compression scale of the worst weight stream
        self.storage_compression_scale = self.compression_scale_for_worst_weight_stream

607

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

608

def bandwidth(self) -> float:
    """
    Returns the product of the number of elements in bandwidth_shape, the element size
    and bandwidth_compression_scale, or 0 if the number of elements is None
    """
    num_elements = shape_num_elements(self.bandwidth_shape)
    if num_elements is not None:
        return num_elements * self.element_size() * self.bandwidth_compression_scale
    return 0

613

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

614

def consumers(self) -> List[Operation]:
    """
    Returns the consumer list of this tensor (the list object itself, not a copy)
    """
    consuming_ops = self.consumer_list
    return consuming_ops

616

patrik.gustavsson

2020-12-21 17:10:40 +0000

[diff] [blame]

617

def addresses_for_rolling_buffer(self, start_coord: Shape, end_coord: Shape, fm_shape: Shape4D) -> Tuple:
    """
    Computes box sizes and corner addresses for the box between start_coord and end_coord

    Index 1 of the coordinates is treated as y and index 2 as x.

    :param start_coord: coordinate where the box starts
    :param end_coord: coordinate where the box ends
    :param fm_shape: shape, converted with as_list(), that is passed on to address_for_coordinate
    :return: ( box_height0, box_height1, box_width, [address_tl, address_tr, address_bl, address_br] )
        Note that box_height0 is returned in both of the first two positions
    """

    def address_of(coord):
        # A fresh list is requested from fm_shape for every address lookup
        return self.address_for_coordinate(coord, shape=fm_shape.as_list())

    if self.storage_shape == []:
        return (1, 1, 1, [address_of(start_coord), None, None, None])

    padded_storage_shape = full_shape(4, self.storage_shape, 1)
    wrap_y = numeric_util.round_up(start_coord[1] + 1, padded_storage_shape[1])
    wrap_x = numeric_util.round_up(start_coord[2] + 1, padded_storage_shape[2])

    # The crossing points never lie beyond the end of the box
    crossing_y = min(wrap_y, end_coord[1])
    crossing_x = min(wrap_x, end_coord[2])

    box_height0 = crossing_y - start_coord[1]
    box_width = crossing_x - start_coord[2]

    address_tl = address_of(start_coord)
    address_tr = None
    address_bl = None
    address_br = None

    if end_coord[2] > crossing_x:
        address_tr = address_of([start_coord[0], start_coord[1], crossing_x, start_coord[3]])
        raise UnsupportedFeatureError("Striping in vertical direction is not supported")

    crosses_y = end_coord[1] > crossing_y
    if crosses_y:
        address_bl = address_of([start_coord[0], crossing_y, start_coord[2], start_coord[3]])

    # NOTE: this condition cannot hold here, since the x crossing case raises above
    if crosses_y and end_coord[2] > crossing_x:
        address_br = address_of([start_coord[0], crossing_y, crossing_x, start_coord[3]])

    return box_height0, box_height0, box_width, [address_tl, address_tr, address_bl, address_br]

656

Patrik Gustavsson

2020-12-01 16:02:29 +0100

[diff] [blame]

657

def address_for_coordinate(self, coord: Shape, is_top_box: bool = False, shape: Shape = None) -> int:
    """
    Returns the address of the given coordinate: the tensor address plus the coordinate's offset

    :param coord: coordinate to compute the address for
    :param is_top_box: forwarded to address_offset_for_coordinate
    :param shape: shape forwarded to address_offset_for_coordinate; defaults to the tensor's shape
    :return: self.address plus the computed offset
    """
    effective_shape = self.shape if shape is None else shape
    coord_offset = self.address_offset_for_coordinate(coord, effective_shape, is_top_box)
    assert coord_offset is not None
    return self.address + coord_offset

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

663

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

664

def get_strides_and_coord(self, coord: Optional[Shape] = None) -> Tuple[Optional[Shape], Optional[Shape]]:
    """
    Computes the strides of the storage shape together with the coordinate rearranged to match them

    :param coord: coordinate to rearrange; defaults to all zeros, one per storage shape dimension
    :return: ( strides, augmented_coord ), or ( None, None ) if the tensor format is neither
        NHWC nor NHCWB16
    """
    augmented_coord = [0] * len(self.storage_shape) if coord is None else coord
    augmented_shape = self.storage_shape

    # Left-pad shape (with 1) and coordinate (with 0) up to four dimensions
    if len(augmented_shape) < 4:
        augmented_shape = [1] * (4 - len(augmented_shape)) + augmented_shape
    if len(augmented_coord) < 4:
        augmented_coord = [0] * (4 - len(augmented_coord)) + augmented_coord

    assert len(augmented_coord) == len(augmented_shape)

    if self.format == TensorFormat.NHWC:
        # Move index 3 to position 1 and append a trailing entry (1 for the shape, 0 for the coordinate)
        augmented_shape = [augmented_shape[0], augmented_shape[3]] + augmented_shape[1:3] + [1]
        augmented_coord = [augmented_coord[0], augmented_coord[3]] + augmented_coord[1:3] + [0]
    elif self.format == TensorFormat.NHCWB16:
        channel_divisor = 16
        augmented_shape = augmented_shape[0:4] + [1]
        # Index 3 of the coordinate is split into a quotient (position 1) and a remainder (position 4)
        quotient = augmented_coord[3] // channel_divisor
        remainder = augmented_coord[3] % channel_divisor
        augmented_coord = [augmented_coord[0], quotient] + augmented_coord[1:3] + [remainder]

        if augmented_shape[1] == 0:
            augmented_shape[1] = 1
    else:
        assert self.format in (TensorFormat.Unknown, TensorFormat.WeightsCompressed)
        return None, None

    strides: List = [0] * len(augmented_shape)
    element_stride = self.element_size() * self.storage_compression_scale

    if self.format == TensorFormat.NHCWB16:
        assert len(strides) == 5
        strides[4] = element_stride
        strides[3] = 16 * element_stride  # STRIDE_X
        strides[1] = strides[3] * augmented_shape[2]  # STRIDE_C
        strides[2] = augmented_shape[2] * augmented_shape[3] * element_stride  # STRIDE_Y
        strides[0] = strides[2] * augmented_shape[1]  # STRIDE_N
    else:
        # Accumulate the stride over the dimensions, visited in this order
        running_stride = element_stride
        for dim in (4, 1, 3, 2, 0):
            strides[dim] = running_stride
            running_stride *= augmented_shape[dim]

    return strides, augmented_coord

715

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

716

def get_strides(self) -> Shape:
    """
    Returns the strides computed by get_strides_and_coord for the default coordinate

    Asserts that strides are available.
    """
    layout_strides, _unused_coord = self.get_strides_and_coord()
    assert layout_strides is not None
    return layout_strides

720

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

721

def needs_dma(self) -> bool:
    """
    Returns True if this tensor has exactly one entry in ops and that entry is of type Op.DMA
    """
    if len(self.ops) != 1:
        return False
    return self.ops[0].type == Op.DMA

Louis Verhaard

2020-05-07 08:12:58 +0200

[diff] [blame]

723

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

724

def get_dma_src_tensor(self) -> "Optional[Tensor]":
    """
    For weight tensors that need DMA: returns the source tensor in Flash, else None

    Note: for DMA ops, Pass.weight_tensor is referring to the SRAM weight tensor
    """
    if not self.needs_dma():
        return None
    # The source is the first input of the first entry in ops
    dma_op = self.ops[0]
    return dma_op.inputs[0]

728

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

729

def find_npu_op(self) -> Optional[Operation]:
    """
    Returns the NPU operator that uses this tensor, excluding DMA operators

    A DMA consumer is followed through its first output; the search ends with the result
    found there. Returns None if no consumer qualifies.
    """
    for consumer in self.consumers():
        if consumer.type == Op.DMA:
            # Continue the search from the tensor the DMA writes to
            dma_output = consumer.outputs[0]
            return dma_output.find_npu_op()
        elif consumer.run_on_npu:
            return consumer
    return None

Louis Verhaard

2020-06-04 15:51:24 +0200

[diff] [blame]

737

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

738

def compressed_stream_index_from_coord(self, coord: Shape) -> int:
    """
    Returns the index of the compressed weight stream that the last element of coord maps to

    :param coord: coordinate of which only the last element (the depth) is used
    :return: the depth divided by the brick depth, rounded up
    :raises UnsupportedFeatureError: if the depth is not a multiple of the brick depth,
        unless the index refers to the last entry of weight_compressed_offsets or beyond
    """
    assert self.format == TensorFormat.WeightsCompressed
    assert self.compressed_values is not None
    assert len(self.compressed_values) > 0
    assert len(self.compressed_values) + 1 == len(self.weight_compressed_offsets)

    brick_depth = self.brick_size[-1]
    # Clamp position at final element index
    depth = min(coord[-1], self.shape[-1])

    # Always round up to next boundary
    stream_index = numeric_util.round_up_divide(depth, brick_depth)

    # Check boundaries on all but last weight set (which may be shorter
    # than the brick we divided it up into)
    before_last_set = stream_index < len(self.weight_compressed_offsets) - 1
    # There are no half-way points in the weights
    if before_last_set and (depth % brick_depth) != 0:
        raise UnsupportedFeatureError("Offset into weights must be aligned to a brick")

    return stream_index

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

762

def size_of_compressed_stream(self, index: int) -> int:
    """
    Returns the length of the compressed stream with the given index

    :param index: index into compressed_values; asserted to be within range
    """
    streams = self.compressed_values
    assert streams is not None
    assert 0 <= index < len(streams)
    selected_stream = streams[index]
    return len(selected_stream)

766

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

767

def is_last_index_in_compressed_stream(self, index: int) -> bool:
    """
    Returns True if index refers to the final entry of compressed_values

    :param index: index into compressed_values; asserted to be within range
    """
    streams = self.compressed_values
    assert streams is not None
    assert 0 <= index < len(streams)
    final_index = len(streams) - 1
    return index == final_index

771

Patrik Gustavsson

2020-12-01 16:02:29 +0100

[diff] [blame]

772

def address_offset_for_coordinate(self, orig_coord: Shape, shape: Shape, is_top_box: bool = False) -> Optional[int]:
    """
    Computes the offset of a coordinate relative to the start of the tensor's storage

    :param orig_coord: coordinate to compute the offset for
    :param shape: shape that orig_coord is validated against when the sub purpose is Standard
    :param is_top_box: if True the coordinate is validated against the range 1..shape (inclusive)
        instead of 0..shape-1, and the offset is computed accordingly
    :return: the offset; 0 for a compressed weight tensor without weight_compressed_offsets;
        None if get_strides_and_coord provides no strides
    """
    # Only the trailing entries, one per storage shape dimension, are used for stride addressing
    coord = orig_coord[-len(self.storage_shape) :]

    if self.sub_purpose == TensorSubPurpose.Standard:
        for axis, value in enumerate(orig_coord):
            if is_top_box:
                assert value > 0 and value <= shape[axis]
            else:
                assert value >= 0 and value < shape[axis]

    if self.format == TensorFormat.WeightsCompressed:
        if len(self.weight_compressed_offsets) == 0:
            return 0

        if not (self.needs_dma() and self.sub_purpose == TensorSubPurpose.DoubleBuffer):
            # Look up the offset of the stream that the coordinate belongs to
            stream_index = self.compressed_stream_index_from_coord(orig_coord)
            assert stream_index < len(self.weight_compressed_offsets)
            address_offset = self.weight_compressed_offsets[stream_index]
        else:
            brick_depth = self.brick_size[-1]
            # Clamp position at final element index
            depth = min(orig_coord[-1], self.shape[-1])

            # Always round up to next boundary, then reduce modulo 2
            slot = numeric_util.round_up_divide(depth, brick_depth) % 2
            assert self.compressed_values is not None

            top_of_slot_zero = is_top_box and slot == 0
            if len(self.compressed_values) <= 2:
                if top_of_slot_zero:
                    # Total length of all compressed streams
                    address_offset = sum(len(cv) for cv in self.compressed_values)
                else:
                    address_offset = slot * len(self.compressed_values[0])
            elif top_of_slot_zero:
                address_offset = self.storage_shape[-1]
            else:
                address_offset = slot * (self.storage_shape[-1] // 2)
    else:
        top_box_shift = 1 if is_top_box else 0

        # handle wraparound for partial buffers. make sure to do this after subtracting top box:
        coord = [(c - top_box_shift) % self.storage_shape[axis] for axis, c in enumerate(coord)]

        strides, augmented_coord = self.get_strides_and_coord(coord)
        if strides is None:
            return None

        # The top box adds one element (the last stride) to compensate for the subtraction above
        address_offset = strides[-1] if is_top_box else 0
        address_offset += np.dot(augmented_coord, strides)

    assert address_offset >= 0
    assert address_offset <= self.storage_size()
    return address_offset

835

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

836

def is_allocated_in_tensor_arena(self, scratch_tensor_mem_area: MemArea) -> bool:
    """
    Returns True if the tensor's memory area equals scratch_tensor_mem_area and its memory type
    is MemType.Scratch or MemType.Scratch_fast

    :param scratch_tensor_mem_area: memory area to compare the tensor's memory area with
    """
    scratch_mem_types = (MemType.Scratch, MemType.Scratch_fast)
    return (self.mem_area == scratch_tensor_mem_area) and (self.mem_type in scratch_mem_types)

Patrik Gustavsson

2020-05-27 09:15:11 +0200

[diff] [blame]

838

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

839

def equivalent(self, tens: "Tensor") -> bool:
    """
    Returns True if this tensor and tens have equal equivalence ids

    :param tens: Tensor object to compare with
    """
    own_id = self.equivalence_id
    return own_id == tens.equivalence_id

841

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

842

def set_all_shapes(self, shape: Shape):
    """
    Sets shape, storage_shape and bandwidth_shape to the given shape

    All three attributes refer to the same object afterwards; no copy is made.

    :param shape: the shape to assign
    """
    self.shape = self.storage_shape = self.bandwidth_shape = shape

846

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

847

def get_full_shape(self) -> Shape:
    """
    Returns a version of the tensor's shape, depending on its number of dimensions

    1 or 3 dimensions: the result of full_shape(4, self.shape, 1)
    2 dimensions: [first, 1, 1, second]
    otherwise: a copy of the shape
    """
    rank = len(self.shape)
    if rank == 2:
        return [self.shape[0], 1, 1, self.shape[1]]
    if rank in (1, 3):
        return full_shape(4, self.shape, 1)
    return self.shape.copy()

Michael McGeagh

2020-08-06 17:31:02 +0100

[diff] [blame]

855

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

856

def is_quantized(self) -> bool:
    """
    Returns whether the tensor is quantized

    A tensor is quantized if it has an integral type and it contains valid quantization params
    """
    quant = self.quantization
    has_quant_params = isinstance(quant, QuantizationParameters)
    if has_quant_params:
        is_integral = (self.dtype.type & BaseType.Int) != 0
        return is_integral and quant.is_valid()
    return False

Tim Hall

2020-09-09 21:58:15 +0100

[diff] [blame]

863

Louis Verhaard

6c74c3b

2020-12-17 13:54:09 +0100

[diff] [blame]

864

def __lt__(self, other: "Tensor") -> bool:
    """
    Orders tensors by their equivalence ids

    :param other: Tensor object to compare with
    """
    own_id = self.equivalence_id
    other_id = other.equivalence_id
    return own_id < other_id

866

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

867

def __str__(self):
    """
    Returns a short description containing the tensor's name, shape and dtype
    """
    described_fields = (self.name, self.shape, self.dtype)
    return "<nng.Tensor '%s' shape=%s dtype=%s>" % described_fields


# repr() yields the same text as str()
__repr__ = __str__

Tim Hall

2020-09-09 21:58:15 +0100

[diff] [blame]

871

Michael McGeagh

2020-12-16 11:33:21 +0000

[diff] [blame]

872

def error(self, msg):
    """
    Raises a VelaError exception for errors encountered when parsing a Tensor

    The message names the tensor and lists its driving operators (ops) and its
    consuming operators (consumer_list).

    :param self: Tensor object that resulted in the error
    :param msg: str object that contains a description of the specific error encountered
    """

    def _describe_operators(ops):
        # One line per entry; entries lacking the attributes get placeholder text
        return [
            f" {idx} = {getattr(op, 'type', 'Not an Operation')} ({getattr(op, 'op_index', '-')})"
            for idx, op in enumerate(ops)
        ]

    report = [
        f"Invalid {self.name} tensor. {msg}",
        " Driving operators:",
        *_describe_operators(self.ops),
        " Consuming operators:",
        *_describe_operators(self.consumer_list),
    ]

    raise VelaError("\n".join(report))

897

Tim Hall

2020-09-09 21:58:15 +0100

[diff] [blame]

898

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

899

def check_quantized_tens_scaling_equal(tens_a: Tensor, tens_b: Tensor) -> bool:

Tim Hall

2020-09-09 21:58:15 +0100

[diff] [blame]

900

# checks that the scaling of two quantized tensors are equal

901

Tim Hall