Blame - ethosu/vela/tensor.py - ml/ethos-u/ethos-u-vela

2020-04-27 18:20:16 +0100

[diff] [blame]

1

2

#

3

# SPDX-License-Identifier: Apache-2.0

4

#

5

# Licensed under the Apache License, Version 2.0 (the License); you may

6

# not use this file except in compliance with the License.

7

# You may obtain a copy of the License at

8

#

9

# www.apache.org/licenses/LICENSE-2.0

10

#

11

# Unless required by applicable law or agreed to in writing, software

12

# distributed under the License is distributed on an AS IS BASIS, WITHOUT

13

# WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.

14

# See the License for the specific language governing permissions and

15

# limitations under the License.

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

16

# Description:

17

# Internal representation of a Neural Network Tensor.

Patrik Gustavsson

2020-11-04 12:43:50 +0100

[diff] [blame]

18

import copy

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

19

import enum

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

20

import uuid

Jacob Bohlin

2020-09-11 10:04:15 +0200

[diff] [blame]

21

from collections import defaultdict

Diqing Zhong

f842b69

2020-12-11 13:07:37 +0100

[diff] [blame]

22

from enum import auto

Louis Verhaard

2020-09-23 10:27:11 +0200

[diff] [blame]

23

from functools import lru_cache

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

24

from typing import Dict

25

from typing import List

26

from typing import Optional

27

from typing import Tuple

28

from typing import Union

29

from uuid import UUID

Diego Russo

ea6111a

2020-04-14 18:41:58 +0100

[diff] [blame]

import numpy as np

Michael McGeagh

2020-12-02 15:29:22 +0000

[diff] [blame]

33

from . import errors # Import this way due to cyclic imports

Diego Russo

ea6111a

2020-04-14 18:41:58 +0100

[diff] [blame]

34

from . import numeric_util

Tim Hall

2020-09-09 21:58:15 +0100

[diff] [blame]

35

from .data_type import BaseType

Michael McGeagh

2020-08-06 17:31:02 +0100

[diff] [blame]

36

from .data_type import DataType

Dwight Lidman

a9390f7

2020-05-13 12:00:08 +0200

[diff] [blame]

37

from .ethos_u55_regs.ethos_u55_regs import resampling_mode

Louis Verhaard

2020-09-30 09:01:52 +0200

[diff] [blame]

38

from .operation import Op

Michael McGeagh

2020-08-06 17:31:02 +0100

[diff] [blame]

39

from .operation import Operation

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

40

41

Shape = List

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

42

43

Patrik Gustavsson

2020-05-27 09:15:11 +0200

[diff] [blame]

44

class MemType(enum.IntFlag):
    """Memory types a tensor can be assigned to.

    ``Size`` is one past the last real entry (``Scratch_fast + 1``).
    """

    Unknown = 0
    Permanent_NPU = 1
    Permanent_CPU = 2
    Scratch = 3
    Scratch_fast = 4
    Size = Scratch_fast + 1

    def display_name(self) -> str:
        """Return the human-readable label, looked up by the member's value."""
        labels = ("Unknown", "Permanent_NPU", "Permanent_CPU", "Scratch", "Scratch_fast", "Size")
        return labels[self.value]

    def identifier_name(self) -> str:
        """Return the lower-case identifier, looked up by the member's value."""
        identifiers = ("unknown", "permanent_npu", "permanent_cpu", "scratch", "scratch_fast", "size")
        return identifiers[self.value]

    @staticmethod
    def all():
        """Return every real memory type (``Unknown`` and ``Size`` are excluded)."""
        return (
            MemType.Permanent_NPU,
            MemType.Permanent_CPU,
            MemType.Scratch,
            MemType.Scratch_fast,
        )

    def __str__(self):
        # Print the bare member name rather than the default "MemType.<name>" form.
        return self.name

Diqing Zhong

2020-12-11 13:07:37 +0100

[diff] [blame]

66

class BandwidthDirection(enum.IntEnum):
    """Direction of a memory transfer; ``Size`` follows the last real entry."""

    Read = 0
    Write = auto()
    Size = auto()

    def display_name(self):
        """Return the member name as the display label."""
        label = self.name
        return label

    def identifier_name(self):
        """Return the member name in lower case."""
        label = self.name
        return label.lower()

    @staticmethod
    def all():
        """Return the real directions (``Size`` is excluded)."""
        return (
            BandwidthDirection.Read,
            BandwidthDirection.Write,
        )

80

81

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

82

class MemArea(enum.IntFlag):
    """Memory areas a tensor can live in.

    ``Size`` is one past the last real entry (``Shram + 1``).
    """

    Unknown = 0
    Sram = 1
    Dram = 2
    OnChipFlash = 3
    OffChipFlash = 4
    Shram = 5  # for LUT
    Size = Shram + 1

    def display_name(self) -> str:
        """Return the human-readable label, looked up by the member's value."""
        labels = ("Unknown", "SRAM", "DRAM", "On-chip Flash", "Off-chip Flash", "SHRAM", "Size")
        return labels[self.value]

    def identifier_name(self) -> str:
        """Return the lower-case identifier, looked up by the member's value."""
        identifiers = ("unknown", "sram", "dram", "on_chip_flash", "off_chip_flash", "shram", "size")
        return identifiers[self.value]

    @staticmethod
    def all():
        """Return every real memory area (``Unknown`` and ``Size`` are excluded)."""
        return (
            MemArea.Sram,
            MemArea.Dram,
            MemArea.OnChipFlash,
            MemArea.OffChipFlash,
            MemArea.Shram,
        )

    def __str__(self):
        # Print the bare member name rather than the default "MemArea.<name>" form.
        return self.name

class TensorPurpose(enum.IntFlag):
    """What a tensor is used for; ``Size`` follows the last real entry."""

    Unknown = 0
    Weights = 1
    FeatureMap = 2
    Scratch = 3
    LUT = 4
    FSBias = 5
    Size = 6

    def display_name(self) -> str:
        """Return the human-readable label, looked up by the member's value."""
        labels = ("Unknown", "Weights", "FeatureMap", "Scratch", "LUT", "FastStorageBias", "Size")
        return labels[self.value]

    def identifier_name(self) -> str:
        """Return the lower-case identifier, looked up by the member's value."""
        identifiers = ("unknown", "weights", "feature_map", "scratch", "lut", "fast_storage_bias", "size")
        return identifiers[self.value]

    @staticmethod
    def all():
        """Return the purposes this helper enumerates: weights, feature maps and FS bias."""
        return (
            TensorPurpose.Weights,
            TensorPurpose.FeatureMap,
            TensorPurpose.FSBias,
        )

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

123

124

125

class TensorSubPurpose(enum.Enum):
    """Buffering scheme applied to a tensor's storage."""

    Standard = 0
    DoubleBuffer = 1
    RollingBufferX = 2
    RollingBufferY = 3
    RollingBufferXY = 4

    def display_name(self) -> str:
        """Return the human-readable label, looked up by the member's value."""
        labels = ("Standard", "Double Buffer", "Rolling Buffer X", "Rolling Buffer Y", "Rolling Buffer XY")
        return labels[self.value]

    def identifier_name(self) -> str:
        """Return the lower-case identifier, looked up by the member's value."""
        identifiers = ("standard", "double_buffer", "rolling_buffer_x", "rolling_buffer_y", "rolling_buffer_xy")
        return identifiers[self.value]

    @staticmethod
    def all():
        """Return every sub-purpose in declaration order."""
        members = (
            TensorSubPurpose.Standard,
            TensorSubPurpose.DoubleBuffer,
            TensorSubPurpose.RollingBufferX,
            TensorSubPurpose.RollingBufferY,
            TensorSubPurpose.RollingBufferXY,
        )
        return members

class TensorFormat(enum.Flag):
    """Storage format of a tensor."""

    Unknown = 0
    WeightsCompressed = 1
    NHWC = 2
    NHCWB16 = 3

    def __str__(self):
        # Print the bare member name rather than the default "TensorFormat.<name>" form.
        member_name = self.name
        return member_name

class TensorBlockTraversal(enum.Enum):
    """Block traversal options for a tensor; a new Tensor starts out as ``Default``."""

    Default = 0
    DepthWise = 1
    DepthFirst = 2
    PartKernelFirst = 3

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

166

def shape_num_elements(shp: Shape) -> Optional[int]:
    """Return the product of all dimensions in ``shp``.

    Returns None when ``shp`` itself is None or when any dimension is None.
    An empty shape yields 1.
    """
    if shp is None:
        return None

    total = 1
    for dim in shp:
        if dim is None:
            # An undefined dimension makes the element count undefined.
            return None
        total *= dim
    return total

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

177

def shape_fully_defined(shp: Shape) -> bool:
    """Return True when ``shp`` is not None and none of its dimensions is None."""
    if shp is None:
        return False
    return all(dim is not None for dim in shp)

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

186

def shape_round_to_quantum(shp: Shape, quantum: Tuple) -> Shape:
    """Return a copy of ``shp`` with each defined dimension rounded up to its quantum.

    Dimensions and quantums are paired from the innermost (last) entry
    backwards, because ``quantum`` may hold more entries than ``shp``.
    Dimensions that are None are left as None.
    """
    rounded = list(shp)

    # Walk with negative indices so both sequences stay aligned at their tails.
    for offset in range(1, len(shp) + 1):
        idx = -offset
        dim = rounded[idx]
        if dim is not None:
            rounded[idx] = numeric_util.round_up(dim, quantum[idx])
    return rounded

Louis Verhaard

2020-09-23 10:27:11 +0200

[diff] [blame]

196

@lru_cache(maxsize=None)
def create_equivalence_id(key) -> UUID:
    """Return a random UUID for ``key``.

    The result is memoised with an unbounded cache, so calling again with an
    equal (hashable) key returns the same UUID.
    """
    # Generates equivalence_id based on the given key.
    new_id = uuid.uuid4()
    return new_id

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

202

class QuantizationParameters:
    """Quantisation parameters of a tensor.

    ``scale_f32``, ``zero_point``, ``min`` and ``max`` may each be a scalar or a
    numpy array; an array makes the parameters per-axis (see ``is_per_axis``).
    """

    __slots__ = "min", "max", "num_bits", "narrow_range", "scale_f32", "zero_point", "quant_min", "quant_max"

    def __init__(
        self,
        min: Union[float, np.ndarray, None] = None,
        max: Union[float, np.ndarray, None] = None,
        num_bits=None,
        narrow_range=None,
    ):
        """Store the given range information; scale, zero point and quant range start as None."""
        self.min = min
        self.max = max

        self.num_bits = num_bits
        self.narrow_range = narrow_range

        self.scale_f32: Union[float, np.ndarray, None] = None
        self.zero_point: Union[int, np.ndarray, None] = None
        self.quant_min: Optional[float] = None
        self.quant_max: Optional[float] = None

    def __str__(self):
        return "<nng.QuantizationParameters min=%s max=%s, num_bits=%s, scale=%s, zero_point=%s>" % (
            self.min,
            self.max,
            self.num_bits,
            self.scale_f32,
            self.zero_point,
        )

    __repr__ = __str__

    def clone(self) -> "QuantizationParameters":
        """Return a new instance with every field copied by reference (arrays are shared)."""
        res = QuantizationParameters()
        for field in self.__slots__:
            setattr(res, field, getattr(self, field))
        return res

    def dequantize(self, values):
        """Convert quantised ``values`` (a numpy array) to float64.

        With a single scale and zero point the result is
        ``(values - zero_point) * scale_f32``.

        Per-axis scaling is not applied, because it is not compatible with the
        layout of depthwise weights, where input is at index 3
        (Output, Kh, Kw, Input). In that case the quantised values are returned
        unchanged, cast to float64.
        """
        values_as_float = values.astype(np.float64)

        # np.size() also accepts plain Python scalars, which have no ``.size`` attribute.
        if np.size(self.zero_point) == 1 and np.size(self.scale_f32) == 1:
            # same scale is used for all values
            return (values_as_float - self.zero_point) * self.scale_f32

        # a different scale is used for different sets of values:
        # return the quantized values. np.ndarray(shape) must not be used here,
        # it allocates an uninitialised array.
        return values_as_float

    @staticmethod
    def _values_equal(lhs, rhs) -> bool:
        """Compare two scalar-or-array parameters and return a plain bool."""
        if lhs is None or rhs is None:
            return lhs is rhs
        try:
            return bool(np.all(np.equal(lhs, rhs)))
        except ValueError:
            # Shapes that cannot be broadcast together are never equal.
            return False

    def is_scaling_equal(self, other: Optional["QuantizationParameters"]) -> bool:
        """Return True if ``other`` has the same scale and zero point as ``self``.

        Quantisation parameter scaling is not equal if ``other`` is None (or not
        a QuantizationParameters), because it implies that the tensor it belongs
        to is not quantised. Array-valued parameters are compared element-wise.
        """
        if not isinstance(other, QuantizationParameters):
            return False

        return self._values_equal(self.scale_f32, other.scale_f32) and self._values_equal(
            self.zero_point, other.zero_point
        )

    def is_valid(self) -> bool:
        """Return True if the quantisation parameters have a scale and a zero point."""
        # Identity checks are required: ``None in (array, ...)`` compares element-wise
        # and raises ValueError for arrays with more than one element.
        return self.scale_f32 is not None and self.zero_point is not None

    def is_per_axis(self) -> bool:
        """Returns True if either the scale, zero point, minimum or maximum values are arrays"""
        return any(isinstance(getattr(self, attr), np.ndarray) for attr in ("scale_f32", "zero_point", "min", "max"))

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

285

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

286

def create_const_tensor(
    name: str,
    shape: Shape,
    dtype: DataType,
    values: np.ndarray,
    value_dtype: np.dtype = None,
    purpose: TensorPurpose = TensorPurpose.Unknown,
    quantization: QuantizationParameters = None,
):
    """Create a constant tensor together with the Const operation that produces it.

    The tensor is named ``name + "_0"`` and the operation ``name``. ``values``
    is converted with ``np.array(values, dtype=value_dtype)``; ``quant_values``
    holds the raw bytes of that array viewed as uint8.
    Returns the new tensor.
    """
    # Tensor
    tensor = Tensor(shape, dtype, name + "_0")
    tensor.purpose = purpose
    tensor.quantization = quantization

    value_array = np.array(values, dtype=value_dtype)
    tensor.values = value_array
    tensor.quant_values = np.frombuffer(value_array.tobytes(), dtype=np.uint8)

    # Operator
    producer = Operation(Op.Const, name)
    producer.set_output_tensor(tensor)
    return tensor

def create_reshape_tensor(tens, shape, ifm_reshape=True):
    """Insert a Reshape operation between ``tens`` and a clone of it with ``shape``.

    If ``shape`` already equals ``tens.shape``, ``tens`` is returned untouched.
    Otherwise a clone (suffix "_reshaped") is given the new shape. With
    ``ifm_reshape`` true the Reshape reads ``tens`` and writes the clone; with
    it false the roles are swapped. The clone is returned in both cases.
    """
    if shape == tens.shape:
        return tens

    # Tensors
    op_name = tens.name + "_reshape"
    reshaped = tens.clone("_reshaped")
    reshaped.set_all_shapes(shape)
    if ifm_reshape:
        op_input, op_output = tens, reshaped
    else:
        op_input, op_output = reshaped, tens

    # Operator
    reshape_op = Operation(Op.Reshape, op_name)
    reshape_op.attrs["new_shape"] = shape
    reshape_op.add_input_tensor(op_input)
    shape_tensor = create_const_tensor(op_name + "_shape", [1], DataType.int32, shape)
    reshape_op.add_input_tensor(shape_tensor)
    reshape_op.set_output_tensor(op_output)
    return reshaped

324

325

Jacob Bohlin

2020-09-11 10:04:15 +0200

[diff] [blame]

326

# class that keeps track of all tensor addresses in the different memory types

327

class TensorAddressMap:
    """Class-level registry of tensor addresses, shared by all users of the class."""

    # dict (tens.equivalence_id -> dict (mem_type -> address))
    address_map: Dict = defaultdict(dict)

    @classmethod
    def get_address_for_tens(cls, tens_id: UUID, mem_type: MemType) -> int:
        """Return the address stored for ``tens_id`` in ``mem_type``, or None if unset."""
        per_tensor = cls.address_map[tens_id]
        return per_tensor.get(mem_type)

    @classmethod
    def set_address_for_tens(cls, tens_id: UUID, mem_type: MemType, address: int):
        """Record ``address`` for ``tens_id`` in ``mem_type``.

        Asserts that an existing non-None address is not replaced by a
        different non-None address.
        """
        per_tensor = cls.address_map[tens_id]

        # Check previous address if there is one
        existing = per_tensor.get(mem_type)
        if not (address is None or existing is None):
            assert existing == address, "Two different addresses cannot be assigned to the same tensor."

        # Set tensor's address for memory type
        per_tensor[mem_type] = address

343

344

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

class Tensor:
    """Internal representation of a neural network tensor."""

    # Instances carry only the attributes listed here; no per-instance __dict__ is created.
    __slots__ = (
        "shape",
        "storage_shape",
        "bandwidth_shape",
        "dtype",
        "name",
        "ops",
        "consumer_list",
        "values",
        "quant_values",
        "compressed_values",
        "compressed_values_substream_offsets",
        "mem_area",
        "mem_type",
        "format",
        "purpose",
        "sub_purpose",
        "alignment",
        "weight_transpose_depthwise",
        "storage_compression_scale",
        "bandwidth_compression_scale",
        "compression_scale_for_worst_weight_stream",
        "weight_compression_scales",
        "weight_compression_config",
        "value_id",
        "storage_rounding_quantum",
        "brick_size",
        "quantization",
        "weight_compressed_offsets",
        "element_size_bytes",
        "block_traversal",
        "equivalence_id",
        "resampling_mode",
        "avoid_NHCWB16",
    )
    # Default value of the per-tensor ``alignment`` attribute.
    AllocationQuantum = 16

382

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

383

def __init__(self, shape: Shape, dtype: DataType, name: str):
    """Create a tensor with the given shape, data type and name.

    The storage and bandwidth shapes start out as the same object as
    ``shape``. All other attributes get neutral defaults.
    """
    # Identity
    self.name = name
    self.dtype = dtype
    self.equivalence_id: UUID = uuid.uuid4()
    # if two tensors have the same value_id, then they have the same values
    self.value_id: UUID = uuid.uuid4()

    # Shapes
    self.shape = shape
    self.storage_shape = shape
    self.bandwidth_shape = shape
    self.storage_rounding_quantum: Tuple = (1, 1, 1, 1)
    self.brick_size: Tuple = (1, 1, 1, 1)
    self.element_size_bytes: int = 0

    # Graph connectivity
    self.ops: List[Operation] = []
    self.consumer_list: List[Operation] = []

    # Values
    self.values: Optional[np.ndarray] = None
    self.quant_values: Optional[np.ndarray] = None
    self.compressed_values: Optional[np.ndarray] = None
    self.compressed_values_substream_offsets: Optional[List] = None

    # Placement and classification
    self.mem_area: MemArea = MemArea.Unknown
    self.mem_type: MemType = MemType.Unknown
    self.format: TensorFormat = TensorFormat.Unknown
    self.purpose: TensorPurpose = TensorPurpose.Unknown
    self.sub_purpose: TensorSubPurpose = TensorSubPurpose.Standard
    self.alignment: int = Tensor.AllocationQuantum
    self.avoid_NHCWB16: bool = False

    # Weight compression
    self.weight_transpose_depthwise: bool = False
    self.storage_compression_scale: float = 1.0
    self.bandwidth_compression_scale: float = 1.0
    self.compression_scale_for_worst_weight_stream: float = 1.0
    self.weight_compression_scales: Optional[np.ndarray] = None
    # if two tensors have the same weight_compression_config, then they have the same compressed values
    self.weight_compression_config = None
    self.weight_compressed_offsets: List = []

    # quantization parameters
    self.quantization: Optional[QuantizationParameters] = None
    self.block_traversal: TensorBlockTraversal = TensorBlockTraversal.Default
    self.resampling_mode: resampling_mode = resampling_mode.NONE

Patrik Gustavsson

458a208

2020-08-13 13:41:05 +0200

[diff] [blame]

425

Jacob Bohlin

2020-09-11 10:04:15 +0200

[diff] [blame]

426

@property
def address(self) -> int:
    """Address registered in TensorAddressMap for this tensor's equivalence id and memory type."""
    return TensorAddressMap.get_address_for_tens(tens_id=self.equivalence_id, mem_type=self.mem_type)


@address.setter
def address(self, address: int):
    """Register ``address`` in TensorAddressMap under this tensor's equivalence id and memory type."""
    TensorAddressMap.set_address_for_tens(tens_id=self.equivalence_id, mem_type=self.mem_type, address=address)

433

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

434

def element_size(self) -> int:
    """Return the size of one element in bytes.

    An explicit non-zero ``element_size_bytes`` wins. Otherwise the size is
    the dtype's bit width divided by 8, which is a true division and so
    yields a float.
    """
    if self.element_size_bytes != 0:
        return self.element_size_bytes
    return self.dtype.size_in_bits() / 8

438

Patrik Gustavsson

2020-11-04 12:43:50 +0100

[diff] [blame]

439

# Returns a copy, renamed to self.name + suffix

440

# The references to Operators will be empty when returned

441

# Depending on set_unique, the copy is shallow, or deep

442

# For set_unique==True, a new equivalence_id will be set

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

443

def clone(self, suffix="_clone", set_unique: bool = False) -> "Tensor":
    """Return a copy of this tensor named ``self.name + suffix``.

    With ``set_unique`` the copy is deep and gets a fresh equivalence_id.
    Otherwise the copy is shallow, except that the storage shape, the
    bandwidth shape and the quantization parameters are duplicated.
    The copy's operator references (``ops``, ``consumer_list``) are empty.
    """
    if not set_unique:
        res = copy.copy(self)
        res.storage_shape = list(self.storage_shape)
        res.bandwidth_shape = list(self.bandwidth_shape)
        if self.quantization is not None:
            res.quantization = self.quantization.clone()
    else:
        res = copy.deepcopy(self)
        res.equivalence_id = uuid.uuid4()

    res.name += suffix
    # The clone is not yet connected to any operation.
    res.ops = []
    res.consumer_list = []
    return res

459

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

460

def clone_into_fast_storage(self, arch) -> "Tensor":
    """Return a clone (suffix "_fast_storage") placed in the architecture's fast storage.

    The clone's memory area is ``arch.fast_storage_mem_area`` and its memory
    type is ``MemType.Scratch_fast``.
    """
    fast_copy = self.clone(suffix="_fast_storage")
    fast_copy.mem_area = arch.fast_storage_mem_area
    fast_copy.mem_type = MemType.Scratch_fast
    return fast_copy

465

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

466

def copy_compressed_weight_info(self, src_tens: "Tensor"):
    """Copy compressed values and all related weight compression info from ``src_tens``.

    Values are copied by reference. This includes the equivalence_id and
    value_id of the source tensor.
    """
    copied_fields = (
        "equivalence_id",
        "compressed_values",
        "compressed_values_substream_offsets",
        "storage_shape",
        "brick_size",
        "weight_compression_scales",
        "weight_compressed_offsets",
        "weight_transpose_depthwise",
        "compression_scale_for_worst_weight_stream",
        "storage_compression_scale",
        "bandwidth_compression_scale",
        "block_traversal",
        "weight_compression_config",
        "value_id",
    )
    for field in copied_fields:
        setattr(self, field, getattr(src_tens, field))

Louis Verhaard

2020-05-07 08:12:58 +0200

[diff] [blame]

482

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

483

def set_format(self, fmt: TensorFormat, arch):
    """Set the tensor format and derive the format-dependent shapes and scales.

    For shapes of rank > 4 only ``format`` is updated. Otherwise the rounding
    quantum and brick size for ``fmt`` are taken from ``arch`` and trimmed to
    their trailing ``rank`` entries. If the shape is known, the bandwidth and
    storage shapes are recomputed from them. ``WeightsCompressed`` also sets
    the three compression scales to 5/8.
    """
    self.format = fmt

    try:
        rank = len(self.shape)
    except TypeError:
        # No usable shape (e.g. None): treat it as rank 0.
        rank = 0

    if rank > 4:
        return

    # Note: for rank 0 the slice [-0:] keeps the complete tuple.
    rounding_quantum = arch.storage_rounding_quantums[fmt]
    self.storage_rounding_quantum = tuple(rounding_quantum[-rank:])
    brick = arch.brick_sizes[fmt]
    self.brick_size = tuple(brick[-rank:])

    if self.shape is None:
        return

    self.bandwidth_shape = shape_round_to_quantum(self.shape, self.brick_size)
    self.storage_shape = shape_round_to_quantum(self.shape, self.storage_rounding_quantum)

    if fmt == TensorFormat.WeightsCompressed:
        compression_ratio = 5 / 8
        self.storage_compression_scale = compression_ratio
        self.bandwidth_compression_scale = compression_ratio
        self.compression_scale_for_worst_weight_stream = compression_ratio

508

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

509

def storage_elements(self) -> int:
    """Return the number of elements in the storage shape, or 0 if it is not fully known."""
    count = shape_num_elements(self.storage_shape)
    return 0 if count is None else count

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

515

def elements(self) -> int:
    """Return the number of elements in the tensor's shape, or 0 if it is not fully known."""
    count = shape_num_elements(self.shape)
    return 0 if count is None else count

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

521

def has_fully_defined_shape(self) -> bool:
    """Return True when the tensor has a shape and none of its dimensions is None."""
    fully_defined = shape_fully_defined(self.shape)
    return fully_defined

523

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

524

def storage_size(self, scale: float = 1.0) -> int:
    """Return the storage size in bytes, rounded up to the tensor's alignment.

    The raw size is storage elements * element size * ``scale``. A raw size
    of 0 is replaced by 1 so the tensor always occupies some space.
    """
    unrounded = self.storage_elements() * self.element_size() * scale
    if unrounded == 0:
        unrounded = 1  # force it to take up space
    whole_bytes = numeric_util.round_up_to_int(unrounded)
    return numeric_util.round_up(whole_bytes, self.alignment)

530

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

531

def storage_size_for_sub_purpose(
    self, arch, sub_purpose: TensorSubPurpose, param_a: Optional[int] = None, param_b: Optional[int] = None
) -> int:
    """Return the aligned storage size in bytes the tensor would need for ``sub_purpose``.

    Returns 0 when the resulting shape is not fully known. ``param_a`` and
    ``param_b`` are passed on to ``storage_shape_for_sub_purpose``.
    """
    alt_shape = self.storage_shape_for_sub_purpose(sub_purpose, param_a, param_b)
    elems = shape_num_elements(alt_shape)
    if elems is None:
        return 0

    if sub_purpose == TensorSubPurpose.DoubleBuffer:
        unrounded = elems * self.element_size()
        unrounded = unrounded * self.compression_scale_for_worst_weight_stream
        unrounded = unrounded * arch.weight_estimation_scaling
    else:
        # Rolling buffers are used for intermediate data in ifm streaming
        # These will all use the NHCWB16 format, and need to be aligned to 16 in the C-dimension
        last_dim = alt_shape[-1]
        if last_dim % 16 != 0:
            nhcwb16_shape = alt_shape[0:-1] + [numeric_util.round_up(last_dim, 16)]
            elems = shape_num_elements(nhcwb16_shape)
        unrounded = elems * self.element_size() * self.storage_compression_scale

    whole_bytes = numeric_util.round_up_to_int(unrounded)
    return numeric_util.round_up(whole_bytes, self.alignment)

555

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

556

def storage_shape_for_sub_purpose(
    self, sub_purpose: TensorSubPurpose, param_a: Optional[int], param_b: Optional[int]
) -> Shape:
    """Return the shape (as a new list) the tensor would be stored with for ``sub_purpose``.

    - DoubleBuffer: a copy of ``shape`` with the last dimension clamped to ``param_a * 2``.
    - RollingBufferX: a copy of ``storage_shape`` with dim 0 set to 1 and dim 2 clamped to ``param_a``.
    - RollingBufferY: as above, but dim 1 is clamped to ``param_a``.
    - RollingBufferXY: dim 0 set to 1, dim 2 clamped to ``param_a``, dim 1 clamped to ``param_b``.
    - Standard: an unchanged copy of ``storage_shape``.
    """
    if sub_purpose == TensorSubPurpose.DoubleBuffer:
        dims = list(self.shape)
        assert len(dims) >= 2
        assert param_a is not None
        dims[-1] = min(dims[-1], param_a * 2)
        return dims

    dims = list(self.storage_shape)
    if sub_purpose == TensorSubPurpose.Standard:
        return dims

    if sub_purpose == TensorSubPurpose.RollingBufferX:
        assert len(dims) == 4
        assert param_a is not None
        dims[0] = 1
        dims[2] = min(dims[2], param_a)
    elif sub_purpose == TensorSubPurpose.RollingBufferY:
        assert len(dims) == 4
        assert param_a is not None
        dims[0] = 1
        dims[1] = min(dims[1], param_a)
    elif sub_purpose == TensorSubPurpose.RollingBufferXY:
        assert len(dims) == 4
        assert param_a is not None
        assert param_b is not None
        dims[0] = 1
        dims[2] = min(dims[2], param_a)
        dims[1] = min(dims[1], param_b)
    else:
        assert 0, "did not expect new sub purpose %s" % (sub_purpose,)

    return dims

589

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

590

def set_new_sub_purpose(self, sub_purpose: TensorSubPurpose, param_a=None, param_b=None):
    """Switch the tensor to ``sub_purpose`` and update its storage shape to match.

    For DoubleBuffer the storage compression scale is also replaced by the
    compression scale for the worst weight stream.
    """
    new_storage_shape = self.storage_shape_for_sub_purpose(sub_purpose, param_a, param_b)
    self.storage_shape = new_storage_shape
    self.sub_purpose = sub_purpose
    if sub_purpose == TensorSubPurpose.DoubleBuffer:
        self.storage_compression_scale = self.compression_scale_for_worst_weight_stream

595

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

596

def bandwidth(self) -> float:
    """Return bandwidth-shape elements * element size * bandwidth compression scale.

    Returns 0 when the bandwidth shape is not fully known.
    """
    count = shape_num_elements(self.bandwidth_shape)
    if count is None:
        return 0
    unscaled = count * self.element_size()
    return unscaled * self.bandwidth_compression_scale

601

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

602

def consumers(self) -> List[Operation]:
    # Returns the tensor's consumer_list itself (the same list object, not a copy)
    consumer_ops = self.consumer_list
    return consumer_ops

604

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

605

def addresses_for_rolling_buffer(self, start_coord: Shape, end_coord: Shape) -> Tuple:
    # returns ( box_height0, box_height1, box_width, [address_tl, address_tr, address_bl, address_br] )
    # box_height1 is always reported equal to box_height0, and the address of any box that is
    # not needed is None.
    rank = len(start_coord)
    if rank < 4:
        # Fewer than 4 dimensions: a single box of height 1. The width is taken from the
        # second-to-last axis when there are at least 2 dimensions, otherwise it is 1.
        width = end_coord[-2] - start_coord[-2] if rank >= 2 else 1
        top_left = self.address_for_coordinate(start_coord)
        return 1, 1, width, [top_left, None, None, None]

    batch, start_y, start_x, start_c = start_coord[0], start_coord[1], start_coord[2], start_coord[3]

    # Position where the box would cross the storage (rolling buffer) extent in y and x,
    # clamped to the end coordinate.
    # NOTE(review): assumes numeric_util.round_up rounds up to a multiple of its second argument
    split_y = numeric_util.round_up(start_y + 1, self.storage_shape[1])
    split_x = numeric_util.round_up(start_x + 1, self.storage_shape[2])
    split_y = min(split_y, end_coord[1])
    split_x = min(split_x, end_coord[2])

    height0 = split_y - start_y
    width = split_x - start_x

    crosses_x = end_coord[2] > split_x
    crosses_y = end_coord[1] > split_y

    box_addresses = [self.address_for_coordinate(start_coord), None, None, None]

    if crosses_x:
        # The top-right address is still computed first (address_for_coordinate may assert),
        # then the request is rejected.
        box_addresses[1] = self.address_for_coordinate([batch, start_y, split_x, start_c])
        raise errors.UnsupportedFeatureError("Striping in vertical direction is not supported")
    if crosses_y:
        box_addresses[2] = self.address_for_coordinate([batch, split_y, start_x, start_c])
    if crosses_y and crosses_x:
        # Currently unreachable: any crossing in x has already raised above
        box_addresses[3] = self.address_for_coordinate([batch, split_y, split_x, start_c])

    return height0, height0, width, box_addresses

638

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

639

def address_for_coordinate(self, coord: Shape, is_top_box: bool = False) -> int:
    # Absolute address of coord: the tensor's base address plus the offset reported by
    # address_offset_for_coordinate(). An offset of None is rejected by the assert.
    relative_offset = self.address_offset_for_coordinate(coord, is_top_box)
    assert relative_offset is not None
    return self.address + relative_offset

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

643

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

644

def get_strides_and_coord(self, coord: Optional[Shape] = None) -> Tuple[Optional[Shape], Optional[Shape]]:
    # Returns (strides, augmented_coord): two 5-entry lists such that the dot product of the two
    # gives the offset of coord within the tensor's storage. The unit stride is
    # element_size() * storage_compression_scale.
    # coord defaults to the origin. For formats other than NHWC and NHCWB16 (which must then be
    # Unknown or WeightsCompressed) the result is (None, None).
    shape = self.storage_shape
    if coord is None:
        coord = [0] * len(shape)

    # Left-pad shape with 1s and coord with 0s up to 4 dimensions
    if len(shape) < 4:
        shape = [1] * (4 - len(shape)) + shape
    if len(coord) < 4:
        coord = [0] * (4 - len(coord)) + coord
    assert len(coord) == len(shape)

    fmt = self.format
    if fmt == TensorFormat.NHWC:
        # Entry 3 (the last of the four axes) is moved to position 1 and a dummy fifth axis
        # of size 1 / coordinate 0 is appended
        shape5 = [shape[0], shape[3]] + shape[1:3] + [1]
        coord5 = [coord[0], coord[3]] + coord[1:3] + [0]
    elif fmt == TensorFormat.NHCWB16:
        # The coordinate on axis 3 is split into a 16-deep block index (position 1) and the
        # position inside that block (position 4); the shape keeps its axis order
        block_index, pos_in_block = divmod(coord[3], 16)
        shape5 = shape[0:4] + [1]
        coord5 = [coord[0], block_index] + coord[1:3] + [pos_in_block]
        if shape5[1] == 0:
            shape5[1] = 1
    else:
        assert fmt in (TensorFormat.Unknown, TensorFormat.WeightsCompressed)
        return None, None

    unit_stride = self.element_size() * self.storage_compression_scale
    strides = [0] * len(shape5)

    if fmt == TensorFormat.NHCWB16:
        assert len(strides) == 5
        strides[4] = unit_stride
        strides[3] = 16 * unit_stride  # STRIDE_X
        strides[1] = strides[3] * shape5[2]  # STRIDE_C
        strides[2] = shape5[2] * shape5[3] * unit_stride  # STRIDE_Y
        strides[0] = strides[2] * shape5[1]  # STRIDE_N
    else:
        # Walk the axes from the innermost to the outermost one, accumulating the stride
        running_stride = unit_stride
        for axis in (4, 1, 3, 2, 0):
            strides[axis] = running_stride
            running_stride *= shape5[axis]

    return strides, coord5

695

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

696

def get_strides(self) -> Shape:
    # Strides of the tensor for the origin coordinate, as computed by get_strides_and_coord().
    # Asserts that strides are available for the tensor's format.
    strides = self.get_strides_and_coord()[0]
    assert strides is not None
    return strides

700

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

701

def needs_dma(self) -> bool:
    # True when the tensor has exactly one entry in ops and that operation is of type Op.DMA
    if len(self.ops) != 1:
        return False
    return self.ops[0].type == Op.DMA

Louis Verhaard

2020-05-07 08:12:58 +0200

[diff] [blame]

703

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

704

def get_dma_src_tensor(self) -> "Optional[Tensor]":
    # For weight tensors that need DMA: returns the source tensor in Flash, else None
    # Note: for DMA ops, Pass.weight_tensor is referring to the SRAM weight tensor
    # The source is the first input of the single operation in ops.
    if not self.needs_dma():
        return None
    return self.ops[0].inputs[0]

708

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

709

def find_npu_op(self) -> Optional[Operation]:
    # Returns the NPU operator that uses this tensor, excluding DMA operators.
    # Consumers are examined in order; the search stops at the first consumer that is either
    # a DMA (which is followed through its first output tensor) or marked run_on_npu.
    # Returns None when no such consumer exists.
    for consumer in self.consumers():
        if consumer.type == Op.DMA:
            dma_destination = consumer.outputs[0]
            return dma_destination.find_npu_op()
        if consumer.run_on_npu:
            return consumer
    return None

Louis Verhaard

2020-06-04 15:51:24 +0200

[diff] [blame]

717

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

718

def compressed_stream_index_from_coord(self, coord: Shape) -> int:
    # Maps the depth (last entry of coord) to the index of a compressed weight stream.
    # Raises errors.UnsupportedFeatureError when the depth is not aligned to the brick depth,
    # except when the index refers to the final entry of weight_compressed_offsets.
    assert self.format == TensorFormat.WeightsCompressed
    streams = self.compressed_values
    assert streams is not None
    assert len(streams) > 0
    offsets = self.weight_compressed_offsets
    assert len(streams) + 1 == len(offsets)

    brick_depth = self.brick_size[-1]
    # Clamp position at final element index
    depth = min(coord[-1], self.shape[-1])

    # Always round up to next boundary
    stream_index = numeric_util.round_up_divide(depth, brick_depth)

    # Check boundaries on all but last weight set (which may be shorter
    # than the brick we divided it up into).
    # There are no half-way points in the weights
    is_before_last_offset = stream_index < len(offsets) - 1
    if is_before_last_offset and (depth % brick_depth) != 0:
        raise errors.UnsupportedFeatureError("Offset into weights must be aligned to a brick")

    return stream_index

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

742

def size_of_compressed_stream(self, index: int) -> int:
    # Length of the compressed weight stream stored at position index of compressed_values.
    # index must be a valid, non-negative position in compressed_values.
    streams = self.compressed_values
    assert streams is not None
    assert index >= 0 and index < len(streams)
    selected_stream = streams[index]
    return len(selected_stream)

746

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

747

def is_last_index_in_compressed_stream(self, index: int) -> bool:
    # True when index refers to the final entry of compressed_values.
    # index must be a valid, non-negative position in compressed_values.
    streams = self.compressed_values
    assert streams is not None
    stream_count = len(streams)
    assert index >= 0 and index < stream_count
    return index == stream_count - 1

751

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

752

def address_offset_for_coordinate(self, orig_coord: Shape, is_top_box: bool = False) -> Optional[int]:
    # Offset of orig_coord relative to the start of the tensor's storage.
    # Returns None when get_strides_and_coord() has no strides for the tensor's format, and 0
    # for a compressed weight tensor that has no weight_compressed_offsets.
    # With is_top_box set, the coordinate is treated as an inclusive upper bound: for
    # uncompressed tensors every entry is decremented by one before the wrap-around and one
    # innermost stride is added back afterwards.

    # Only the trailing entries that match the rank of storage_shape are used
    coord = orig_coord[-len(self.storage_shape) :]

    if self.sub_purpose == TensorSubPurpose.Standard:
        # Standard tensors must be addressed inside their shape
        for axis, pos in enumerate(coord):
            if is_top_box:
                assert 0 < pos <= self.shape[axis]
            else:
                assert 0 <= pos < self.shape[axis]

    address_offset = 0

    if self.format != TensorFormat.WeightsCompressed:
        if is_top_box:
            coord = [pos - 1 for pos in coord]

        # handle wraparound for partial buffers. make sure to do this after subtracting top box:
        coord = [pos % self.storage_shape[axis] for axis, pos in enumerate(coord)]

        strides, augmented_coord = self.get_strides_and_coord(coord)
        if strides is None:
            return None

        if is_top_box:
            address_offset += 1 * strides[-1]  # one element

        address_offset += np.dot(augmented_coord, strides)
    else:
        if len(self.weight_compressed_offsets) == 0:
            return 0

        if not (self.needs_dma() and self.sub_purpose == TensorSubPurpose.DoubleBuffer):
            # The offset is looked up directly per compressed stream
            stream_index = self.compressed_stream_index_from_coord(orig_coord)
            assert stream_index < len(self.weight_compressed_offsets)
            address_offset = self.weight_compressed_offsets[stream_index]
        else:
            brick_depth = self.brick_size[-1]
            # Clamp position at final element index
            depth = min(orig_coord[-1], self.shape[-1])

            # Always round up to next boundary; only the parity of the brick index is used
            # to select between the two buffer slots
            slot = numeric_util.round_up_divide(depth, brick_depth) % 2
            streams = self.compressed_values
            assert streams is not None

            is_top_of_slot_0 = is_top_box and slot == 0
            if len(streams) <= 2:
                if is_top_of_slot_0:
                    # Total length of all compressed streams
                    address_offset = sum(len(stream) for stream in streams)
                else:
                    address_offset = slot * len(streams[0])
            elif is_top_of_slot_0:
                address_offset = self.storage_shape[-1]
            else:
                address_offset = slot * (self.storage_shape[-1] // 2)

    assert address_offset >= 0
    assert address_offset <= self.storage_size()
    return address_offset

815

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

816

def is_allocated_in_tensor_arena(self, scratch_tensor_mem_area: MemArea) -> bool:
    # True when the tensor lives in the given memory area and its memory type is either
    # MemType.Scratch or MemType.Scratch_fast
    in_scratch_area = self.mem_area == scratch_tensor_mem_area
    has_scratch_type = self.mem_type in (MemType.Scratch, MemType.Scratch_fast)
    return in_scratch_area and has_scratch_type

Patrik Gustavsson

2020-05-27 09:15:11 +0200

[diff] [blame]

818

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

819

def equivalent(self, tens: "Tensor") -> bool:
    # Two tensors are equivalent when their equivalence_id attributes compare equal
    own_id = self.equivalence_id
    other_id = tens.equivalence_id
    return own_id == other_id

821

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

822

def set_all_shapes(self, shape: Shape):
    # Points shape, storage_shape and bandwidth_shape at the given shape.
    # All three attributes refer to the same object afterwards; no copy is made.
    self.shape = self.storage_shape = self.bandwidth_shape = shape

826

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

827

def get_full_shape(self) -> Shape:
    # Returns the tensor's shape expanded according to its rank:
    #  - rank 2: [d0, d1] becomes [d0, 1, 1, d1]
    #  - rank 1 or 3: delegated to numeric_util.full_shape(4, shape, 1)
    #  - any other rank: a copy of the shape as it is
    shape = self.shape
    rank = len(shape)
    if rank == 2:
        return [shape[0], 1, 1, shape[1]]
    if rank == 1 or rank == 3:
        return numeric_util.full_shape(4, shape, 1)
    return shape.copy()

Michael McGeagh

2020-08-06 17:31:02 +0100

[diff] [blame]

835

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

836

def is_quantized(self) -> bool:
    # a tensor is quantized if it has an integral type and it contains valid quantization params
    quant = self.quantization
    if isinstance(quant, QuantizationParameters):
        # is_valid() is only consulted for integral data types
        has_integral_type = (self.dtype.type & BaseType.Int) != 0
        return has_integral_type and quant.is_valid()
    return False

Tim Hall

2020-09-09 21:58:15 +0100

[diff] [blame]

843

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

844

def __str__(self):
    # Short human readable summary: name, shape and data type of the tensor
    return f"<nng.Tensor '{self.name!s}' shape={self.shape!s} dtype={self.dtype!s}>"


# repr() shows the same summary as str()
__repr__ = __str__

Tim Hall

2020-09-09 21:58:15 +0100

[diff] [blame]

848

849

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

850

def check_quantized_tens_scaling_equal(tens_a: Tensor, tens_b: Tensor) -> bool:

Tim Hall

2020-09-09 21:58:15 +0100

[diff] [blame]

851

# checks that the scaling of two quantized tensors are equal

852

Tim Hall