# Copyright (C) 2020 Arm Limited or its affiliates. All rights reserved.
#
# SPDX-License-Identifier: Apache-2.0
#
# Licensed under the Apache License, Version 2.0 (the License); you may
# not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an AS IS BASIS, WITHOUT
# WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
# Description:
# Internal representation of a Neural Network Tensor.
import copy
import enum
import uuid
from collections import defaultdict
from functools import lru_cache
from typing import Dict
from typing import List
from typing import Optional
from typing import Tuple
from typing import Union
from uuid import UUID

import numpy as np

from . import numeric_util
from .data_type import BaseType
from .data_type import DataType
from .ethos_u55_regs.ethos_u55_regs import resampling_mode
from .operation import Op
from .operation import Operation

Shape = List


class MemType(enum.IntFlag):
    Unknown = 0
    Permanent_NPU = 1
    Permanent_CPU = 2
    Scratch = 3
    Scratch_fast = 4
    Size = Scratch_fast + 1

    def display_name(self) -> str:
        return ("Unknown", "Permanent_NPU", "Permanent_CPU", "Scratch", "Scratch_fast", "Size")[self.value]

    def identifier_name(self) -> str:
        return ("unknown", "permanent_npu", "permanent_cpu", "scratch", "scratch_fast", "size")[self.value]

    @staticmethod
    def all():
        return (MemType.Permanent_NPU, MemType.Permanent_CPU, MemType.Scratch, MemType.Scratch_fast)

    def __str__(self):
        return self.name


class MemArea(enum.IntFlag):
    Unknown = 0
    Sram = 1
    Dram = 2
    OnChipFlash = 3
    OffChipFlash = 4
    Shram = 5  # for LUT
    Size = Shram + 1

    def display_name(self) -> str:
        return ("Unknown", "SRAM", "DRAM", "On-chip Flash", "Off-chip Flash", "SHRAM", "Size")[self.value]

    def identifier_name(self) -> str:
        return ("unknown", "sram", "dram", "on_chip_flash", "off_chip_flash", "shram", "size")[self.value]

    @staticmethod
    def all():
        return (MemArea.Sram, MemArea.Dram, MemArea.OnChipFlash, MemArea.OffChipFlash, MemArea.Shram)

    def __str__(self):
        return self.name


class TensorPurpose(enum.IntFlag):
    Unknown = 0
    Weights = 1
    FeatureMap = 2
    Scratch = 3
    LUT = 4
    FSBias = 5
    Size = 6

    def display_name(self) -> str:
        return ("Unknown", "Weights", "FeatureMap", "Scratch", "LUT", "FastStorageBias", "Size")[self.value]

    def identifier_name(self) -> str:
        return ("unknown", "weights", "feature_map", "scratch", "lut", "fast_storage_bias", "size")[self.value]

    @staticmethod
    def all():
        return (TensorPurpose.Weights, TensorPurpose.FeatureMap, TensorPurpose.FSBias)


class TensorSubPurpose(enum.Enum):
    Standard = 0
    DoubleBuffer = 1
    RollingBufferX = 2
    RollingBufferY = 3
    RollingBufferXY = 4

    def display_name(self) -> str:
        return ("Standard", "Double Buffer", "Rolling Buffer X", "Rolling Buffer Y", "Rolling Buffer XY")[self.value]

    def identifier_name(self) -> str:
        return ("standard", "double_buffer", "rolling_buffer_x", "rolling_buffer_y", "rolling_buffer_xy")[self.value]

    @staticmethod
    def all():
        return (
            TensorSubPurpose.Standard,
            TensorSubPurpose.DoubleBuffer,
            TensorSubPurpose.RollingBufferX,
            TensorSubPurpose.RollingBufferY,
            TensorSubPurpose.RollingBufferXY,
        )


class TensorFormat(enum.Flag):
    Unknown = 0
    WeightsCompressed = 1
    NHWC = 2
    NHCWB16 = 3

    def __str__(self):
        return self.name


class TensorBlockTraversal(enum.Enum):
    Default = 0
    DepthWise = 1
    DepthFirst = 2
    PartKernelFirst = 3


def shape_num_elements(shp: Shape) -> Optional[int]:
    elems = 1
    if shp is None:
        return None
    for d in shp:
        if d is None:
            return None
        elems *= d
    return elems


def shape_fully_defined(shp: Shape) -> bool:
    if shp is None:
        return False
    for d in shp:
        if d is None:
            return False
    return True


def shape_round_to_quantum(shp: Shape, quantum: Tuple) -> Shape:
    new_shp = list(shp)

    # Traverse backwards using length of shape since there may be more rounding quantums than shape elements
    for i in range(-1, -len(shp) - 1, -1):
        if new_shp[i] is not None:
            new_shp[i] = numeric_util.round_up(new_shp[i], quantum[i])
    return new_shp
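
# Illustrative example (comment only): with a rounding quantum of (1, 1, 1, 16), i.e. the kind
# of 16-deep channel quantum used by brick formats such as NHCWB16,
# shape_round_to_quantum([1, 7, 9, 25], (1, 1, 1, 16)) returns [1, 7, 9, 32]; only the channel
# dimension changes because the other quantum entries are 1.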


@lru_cache(maxsize=None)
def create_equivalence_id(key) -> UUID:
    # Generates an equivalence_id based on the given key: the lru_cache ensures that equal
    # keys always map to the same id, while distinct keys get fresh random UUIDs
    return uuid.uuid4()


class QuantizationParameters:
    __slots__ = "min", "max", "num_bits", "narrow_range", "scale_f32", "zero_point", "quant_min", "quant_max"

    def __init__(
        self,
        min: Union[float, np.ndarray, None] = None,
        max: Union[float, np.ndarray, None] = None,
        num_bits=None,
        narrow_range=None,
    ):
        self.min = min
        self.max = max

        self.num_bits = num_bits
        self.narrow_range = narrow_range

        self.scale_f32: Union[float, np.ndarray, None] = None
        self.zero_point: Union[int, np.ndarray, None] = None
        self.quant_min: Optional[float] = None
        self.quant_max: Optional[float] = None

    def __str__(self):
        return "<nng.QuantizationParameters min=%s max=%s, num_bits=%s, scale=%s, zero_point=%s>" % (
            self.min,
            self.max,
            self.num_bits,
            self.scale_f32,
            self.zero_point,
        )

    __repr__ = __str__

    def clone(self) -> "QuantizationParameters":
        res = QuantizationParameters()
        res.min = self.min
        res.max = self.max

        res.num_bits = self.num_bits
        res.narrow_range = self.narrow_range

        res.scale_f32 = self.scale_f32
        res.zero_point = self.zero_point
        res.quant_min = self.quant_min
        res.quant_max = self.quant_max
        return res

    def dequantize(self, values):
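        # Illustrative sketch of the per-tensor path below: with zero_point = np.int32(128) and
        # scale_f32 = np.float32(0.5) (NumPy scalars, as assumed by the .size checks),
        # dequantize(np.array([128, 130])) gives array([0.0, 1.0])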
231 if self.zero_point.size == 1 and self.scale_f32.size == 1:
232 # same scale is used for all values
233 res = (values.astype(np.float64) - self.zero_point) * self.scale_f32
234 else:
235 # a different scale is used for different sets of values
236 values_as_float = values.astype(np.float64)
237
238 # this is not compatible with the format of depthwise weights,
239 # where input is at index 3 (Output, Kh, Kw, Input)
240 # return the quantized values
241 return np.ndarray((values_as_float.shape))
242
Tim Hall79d07d22020-04-27 18:20:16 +0100243 return res

    def is_scaling_equal(self, other: Optional["QuantizationParameters"]) -> bool:
        # quantisation parameter scaling is not equal if 'other' is None because
        # it implies that the tensor it belongs to is not quantised. otherwise,
        # it depends upon whether the scale and zero point are equal

        if not isinstance(other, QuantizationParameters):
            return False

        return self.scale_f32 == other.scale_f32 and self.zero_point == other.zero_point

    def is_valid(self) -> bool:
        # quantisation parameters are considered valid if they have a scale and zero point

        return None not in (self.scale_f32, self.zero_point)

    def is_per_axis(self) -> bool:
        """Returns True if either the scale, zero point, minimum or maximum values are arrays"""
        for attr in ("scale_f32", "zero_point", "min", "max"):
            if isinstance(getattr(self, attr), np.ndarray):
                return True
        return False


def create_const_tensor(
    name: str,
    shape: Shape,
    dtype: DataType,
    values: np.ndarray,
    value_dtype: np.dtype = None,
    purpose: TensorPurpose = TensorPurpose.Unknown,
    quantization: QuantizationParameters = None,
):
    # Tensor
    const_tensor = Tensor(shape, dtype, name + "_0")
    const_tensor.purpose = purpose
    const_tensor.quantization = quantization
    const_tensor.values = np.array(values, dtype=value_dtype)
    const_tensor.quant_values = np.frombuffer(const_tensor.values.tobytes(), dtype=np.uint8)
    # Operator
    const_op = Operation(Op.Const, name)
    const_op.set_output_tensor(const_tensor)
    return const_tensor
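
# Example usage (illustrative, with a made-up tensor name; mirrors the call made inside
# create_reshape_tensor below):
#     shape_tens = create_const_tensor("reshape_1_shape", [1], DataType.int32, [1, 10, 10, 16])
# The values end up stored both as a NumPy array (values) and as raw bytes (quant_values).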


def create_reshape_tensor(tens, shape, ifm_reshape=True):
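    # Inserts a Reshape operator next to tens: with ifm_reshape=True, tens feeds the new
    # Reshape and the reshaped clone is returned; with ifm_reshape=False the roles are
    # swapped and the clone on the input side is returned instead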
290 if shape == tens.shape:
291 return tens
292 # Tensors
293 name = tens.name + "_reshape"
294 reshape_ifm = tens
295 reshape_ofm = tens.clone("_reshaped")
296 reshape_ofm.set_all_shapes(shape)
297 if not ifm_reshape:
298 reshape_ifm, reshape_ofm = reshape_ofm, reshape_ifm
299 # Operator
Louis Verhaardaee5d752020-09-30 09:01:52 +0200300 reshape_op = Operation(Op.Reshape, name)
Michael McGeagh5778ffd2020-08-06 17:31:02 +0100301 reshape_op.attrs["new_shape"] = shape
302 reshape_op.add_input_tensor(reshape_ifm)
303 reshape_op.add_input_tensor(create_const_tensor(name + "_shape", [1], DataType.int32, shape))
304 reshape_op.set_output_tensor(reshape_ofm)
305 return reshape_ofm if ifm_reshape else reshape_ifm
306
307
Jacob Bohlin1a666972020-09-11 10:04:15 +0200308# class that keeps track of all tensor addresses in the different memory types
309class TensorAddressMap:
Louis Verhaard93719a92020-12-08 10:02:31 +0100310 address_map: Dict = defaultdict(dict) # dict (tens.equivalence_id -> dict (mem_type -> address))
Jacob Bohlin1a666972020-09-11 10:04:15 +0200311
312 @classmethod
Louis Verhaard93719a92020-12-08 10:02:31 +0100313 def get_address_for_tens(cls, tens_id: UUID, mem_type: MemType) -> int:
Jacob Bohlin1a666972020-09-11 10:04:15 +0200314 return cls.address_map[tens_id].get(mem_type)
315
316 @classmethod
Louis Verhaard93719a92020-12-08 10:02:31 +0100317 def set_address_for_tens(cls, tens_id: UUID, mem_type: MemType, address: int):
Jacob Bohlin1a666972020-09-11 10:04:15 +0200318 # Check previous address if there is one
319 previous_address = cls.address_map[tens_id].get(mem_type)
Louis Verhaard0b9c9a32020-09-15 14:05:38 +0200320 if address is not None and previous_address is not None:
Jacob Bohlin1a666972020-09-11 10:04:15 +0200321 assert previous_address == address, "Two different addresses cannot be assigned to the same tensor."
322
323 # Set tensor's address for memory type
324 cls.address_map[tens_id][mem_type] = address


class Tensor:
    __slots__ = (
        "shape",
        "storage_shape",
        "bandwidth_shape",
        "dtype",
        "name",
        "ops",
        "consumer_list",
        "values",
        "quant_values",
        "compressed_values",
        "compressed_values_substream_offsets",
        "mem_area",
        "mem_type",
        "format",
        "purpose",
        "sub_purpose",
        "alignment",
        "weight_transpose_depthwise",
        "storage_compression_scale",
        "bandwidth_compression_scale",
        "compression_scale_for_worst_weight_stream",
        "weight_compression_scales",
        "weight_compression_config",
        "value_id",
        "storage_rounding_quantum",
        "brick_size",
        "quantization",
        "weight_compressed_offsets",
        "element_size_bytes",
        "block_traversal",
        "equivalence_id",
        "resampling_mode",
        "avoid_NHCWB16",
    )
    AllocationQuantum = 16

    def __init__(self, shape: Shape, dtype: DataType, name: str):
        self.shape = shape
        self.storage_shape = shape
        self.bandwidth_shape = shape
        self.dtype = dtype
        self.name = name
        self.equivalence_id: UUID = uuid.uuid4()

        self.ops: List[Operation] = []
        self.consumer_list: List[Operation] = []

        self.values: Optional[np.ndarray] = None
        self.quant_values: Optional[np.ndarray] = None
        self.compressed_values: Optional[np.ndarray] = None
        self.compressed_values_substream_offsets: Optional[List] = None
        self.mem_area: MemArea = MemArea.Unknown
        self.mem_type: MemType = MemType.Unknown
        self.format: TensorFormat = TensorFormat.Unknown
        self.purpose: TensorPurpose = TensorPurpose.Unknown
        self.sub_purpose: TensorSubPurpose = TensorSubPurpose.Standard
        self.alignment: int = Tensor.AllocationQuantum
        self.weight_transpose_depthwise: bool = False

        self.storage_compression_scale: float = 1.0
        self.bandwidth_compression_scale: float = 1.0
        self.compression_scale_for_worst_weight_stream: float = 1.0
        self.weight_compression_scales: Optional[np.ndarray] = None
        # if two tensors have the same weight_compression_config, then they have the same compressed values
        self.weight_compression_config = None
        # if two tensors have the same value_id, then they have the same values
        self.value_id: UUID = uuid.uuid4()
        self.weight_compressed_offsets: List = []
        self.storage_rounding_quantum: Tuple = (1, 1, 1, 1)
        self.brick_size: Tuple = (1, 1, 1, 1)
        self.element_size_bytes: int = 0

        # quantization parameters
        self.quantization: Optional[QuantizationParameters] = None
        self.block_traversal: TensorBlockTraversal = TensorBlockTraversal.Default
        self.resampling_mode: resampling_mode = resampling_mode.NONE

        self.avoid_NHCWB16: bool = False

    @property
    def address(self) -> int:
        return TensorAddressMap.get_address_for_tens(self.equivalence_id, self.mem_type)

    @address.setter
    def address(self, address: int):
        TensorAddressMap.set_address_for_tens(self.equivalence_id, self.mem_type, address)

    def element_size(self) -> int:
        if self.element_size_bytes == 0:
            return self.dtype.size_in_bits() / 8
        return self.element_size_bytes

    # Returns a copy, renamed to self.name + suffix
    # The references to Operators will be empty when returned
    # Depending on set_unique, the copy is shallow, or deep
    # For set_unique==True, a new equivalence_id will be set
    def clone(self, suffix="_clone", set_unique: bool = False) -> "Tensor":
        if set_unique:
            res = copy.deepcopy(self)
            res.equivalence_id = uuid.uuid4()
        else:
            res = copy.copy(self)
            res.storage_shape = list(self.storage_shape)
            res.bandwidth_shape = list(self.bandwidth_shape)
            if self.quantization is not None:
                res.quantization = self.quantization.clone()

        res.name = res.name + suffix
        res.ops = []
        res.consumer_list = []

        return res

    def clone_into_fast_storage(self, arch) -> "Tensor":
        res = self.clone(suffix="_fast_storage")
        res.mem_area = arch.fast_storage_mem_area
        res.mem_type = MemType.Scratch_fast
        return res

    def copy_compressed_weight_info(self, src_tens: "Tensor"):
        # Copies compressed values + all related weight compression info from the given tensor
        self.equivalence_id = src_tens.equivalence_id
        self.compressed_values = src_tens.compressed_values
        self.compressed_values_substream_offsets = src_tens.compressed_values_substream_offsets
        self.storage_shape = src_tens.storage_shape
        self.brick_size = src_tens.brick_size
        self.weight_compression_scales = src_tens.weight_compression_scales
        self.weight_compressed_offsets = src_tens.weight_compressed_offsets
        self.weight_transpose_depthwise = src_tens.weight_transpose_depthwise
        self.compression_scale_for_worst_weight_stream = src_tens.compression_scale_for_worst_weight_stream
        self.storage_compression_scale = src_tens.storage_compression_scale
        self.bandwidth_compression_scale = src_tens.bandwidth_compression_scale
        self.block_traversal = src_tens.block_traversal
        self.weight_compression_config = src_tens.weight_compression_config
        self.value_id = src_tens.value_id

    def set_format(self, fmt: TensorFormat, arch):
        self.format = fmt
        shape_len = 0
        try:
            shape_len = len(self.shape)
        except TypeError:
            pass

        if shape_len > 4:
            return
        self.storage_rounding_quantum = arch.storage_rounding_quantums[self.format]
        self.storage_rounding_quantum = tuple(self.storage_rounding_quantum[-shape_len:])
        self.brick_size = arch.brick_sizes[self.format]
        self.brick_size = tuple(self.brick_size[-shape_len:])
        if self.shape is None:
            return

        self.bandwidth_shape = shape_round_to_quantum(self.shape, self.brick_size)
        self.storage_shape = shape_round_to_quantum(self.shape, self.storage_rounding_quantum)

        if fmt == TensorFormat.WeightsCompressed:
            compression_ratio = 5 / 8
            self.storage_compression_scale = compression_ratio
            self.bandwidth_compression_scale = compression_ratio
            self.compression_scale_for_worst_weight_stream = compression_ratio

    def storage_elements(self) -> int:
        elems = shape_num_elements(self.storage_shape)
        if elems is None:
            return 0
        return elems

    def elements(self) -> int:
        elems = shape_num_elements(self.shape)
        if elems is None:
            return 0
        return elems

    def has_fully_defined_shape(self) -> bool:
        return shape_fully_defined(self.shape)

    def storage_size(self, scale: float = 1.0) -> int:
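        # Size in bytes of the storage shape (elements * element size * scale), rounded up to
        # the tensor's alignment; e.g. an int8 tensor with storage_shape [1, 1, 1, 10] and the
        # default 16-byte alignment occupies 16 bytes rather than 10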
        raw_size = self.storage_elements() * self.element_size() * scale
        if raw_size == 0:
            raw_size = 1  # force it to take up space
        rounded_size = numeric_util.round_up(numeric_util.round_up_to_int(raw_size), self.alignment)
        return rounded_size

    def storage_size_for_sub_purpose(
        self, arch, sub_purpose: TensorSubPurpose, param_a: Optional[int] = None, param_b: Optional[int] = None
    ) -> int:
        alt_shape = self.storage_shape_for_sub_purpose(sub_purpose, param_a, param_b)
        elems = shape_num_elements(alt_shape)
        if elems is None:
            return 0
        if sub_purpose == TensorSubPurpose.DoubleBuffer:
            raw_size = (
                elems
                * self.element_size()
                * self.compression_scale_for_worst_weight_stream
                * arch.weight_estimation_scaling
            )
        else:
            # Rolling buffers are used for intermediate data in ifm streaming
            # These will all use the NHCWB16 format, and need to be aligned to 16 in the C-dimension
            if alt_shape[-1] % 16 != 0:
                nhcwb16_shape = alt_shape[0:-1] + [numeric_util.round_up(alt_shape[-1], 16)]
                elems = shape_num_elements(nhcwb16_shape)

            raw_size = elems * self.element_size() * self.storage_compression_scale
        rounded_size = numeric_util.round_up(numeric_util.round_up_to_int(raw_size), self.alignment)
        return rounded_size

    def storage_shape_for_sub_purpose(
        self, sub_purpose: TensorSubPurpose, param_a: Optional[int], param_b: Optional[int]
    ) -> Shape:
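        # Returns the shape that is actually kept in storage for the given sub purpose; for
        # example, a RollingBufferY sub purpose with param_a=4 turns a storage_shape of
        # [1, 32, 32, 16] into [1, 4, 32, 16], since only a 4-row stripe is resident at a time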
        if sub_purpose == TensorSubPurpose.DoubleBuffer:
            shp = list(self.shape)
            assert len(shp) >= 2
            assert param_a is not None
            shp[-1] = min(shp[-1], param_a * 2)
        else:
            shp = list(self.storage_shape)
            if sub_purpose == TensorSubPurpose.RollingBufferX:
                assert len(shp) == 4
                assert param_a is not None
                shp[0] = 1
                shp[2] = min(shp[2], param_a)
            elif sub_purpose == TensorSubPurpose.RollingBufferY:
                assert len(shp) == 4
                assert param_a is not None
                shp[0] = 1
                shp[1] = min(shp[1], param_a)
            elif sub_purpose == TensorSubPurpose.RollingBufferXY:
                assert len(shp) == 4
                assert param_a is not None
                assert param_b is not None
                shp[0] = 1
                shp[2] = min(shp[2], param_a)
                shp[1] = min(shp[1], param_b)
            elif sub_purpose == TensorSubPurpose.Standard:
                pass
            else:
                assert 0, "did not expect new sub purpose %s" % (sub_purpose,)

        return shp

    def set_new_sub_purpose(self, sub_purpose: TensorSubPurpose, param_a=None, param_b=None):
        self.storage_shape = self.storage_shape_for_sub_purpose(sub_purpose, param_a, param_b)
        self.sub_purpose = sub_purpose
        if sub_purpose == TensorSubPurpose.DoubleBuffer:
            self.storage_compression_scale = self.compression_scale_for_worst_weight_stream

    def bandwidth(self) -> float:
        elems = shape_num_elements(self.bandwidth_shape)
        if elems is None:
            return 0
        return elems * self.element_size() * self.bandwidth_compression_scale

    def consumers(self) -> List[Operation]:
        return self.consumer_list

    def addresses_for_rolling_buffer(self, start_coord: Shape, end_coord: Shape) -> Tuple:
        # returns ( box_height0, box_height1, box_width, [address_tl, address_tr, address_bl, address_br] )

        if len(start_coord) < 4:
            box_height0 = 1
            box_width = 1

            if len(start_coord) >= 2:
                box_width = end_coord[-2] - start_coord[-2]

            return box_height0, box_height0, box_width, [self.address_for_coordinate(start_coord), None, None, None]

        crossing_y = numeric_util.round_up(start_coord[1] + 1, self.storage_shape[1])
        crossing_x = numeric_util.round_up(start_coord[2] + 1, self.storage_shape[2])

        crossing_y = min(crossing_y, end_coord[1])
        crossing_x = min(crossing_x, end_coord[2])

        box_height0 = crossing_y - start_coord[1]
        box_width = crossing_x - start_coord[2]

        addresses: List = [None] * 4
        addresses[0] = self.address_for_coordinate(start_coord)

        if end_coord[2] > crossing_x:
            addresses[1] = self.address_for_coordinate([start_coord[0], start_coord[1], crossing_x, start_coord[3]])
            raise Exception("Striping in vertical direction is not supported")
        if end_coord[1] > crossing_y:
            addresses[2] = self.address_for_coordinate([start_coord[0], crossing_y, start_coord[2], start_coord[3]])
        if end_coord[1] > crossing_y and end_coord[2] > crossing_x:
            addresses[3] = self.address_for_coordinate([start_coord[0], crossing_y, crossing_x, start_coord[3]])

        return box_height0, box_height0, box_width, addresses

    def address_for_coordinate(self, coord: Shape, is_top_box: bool = False) -> int:
        offset = self.address_offset_for_coordinate(coord, is_top_box)
        assert offset is not None
        return self.address + offset

    def get_strides_and_coord(self, coord: Optional[Shape] = None) -> Tuple[Optional[Shape], Optional[Shape]]:
        if coord is None:
            coord = [0] * len(self.storage_shape)

        augmented_coord = coord
        augmented_shape = self.storage_shape
        while len(augmented_shape) < 4:
            augmented_shape = [1] + augmented_shape

        while len(augmented_coord) < 4:
            augmented_coord = [0] + augmented_coord

        assert len(augmented_coord) == len(augmented_shape)

        if self.format == TensorFormat.NHWC:
            augmented_shape = [augmented_shape[0], augmented_shape[3]] + augmented_shape[1:3] + [1]
            augmented_coord = [augmented_coord[0], augmented_coord[3]] + augmented_coord[1:3] + [0]

        elif self.format == TensorFormat.NHCWB16:
            channel_divisor = 16
            augmented_shape = augmented_shape[0:4] + [1]
            augmented_coord = (
                [augmented_coord[0], augmented_coord[3] // channel_divisor]
                + augmented_coord[1:3]
                + [augmented_coord[3] % channel_divisor]
            )

            if augmented_shape[1] == 0:
                augmented_shape[1] = 1

        else:
            assert self.format in (TensorFormat.Unknown, TensorFormat.WeightsCompressed)
            return None, None

        strides: List = [0] * len(augmented_shape)
        stride = self.element_size() * self.storage_compression_scale

        if self.format != TensorFormat.NHCWB16:
            stride_order = [4, 1, 3, 2, 0]
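            # Walk from the innermost augmented dimension outwards. As a worked example, an
            # int8 NHWC tensor with storage_shape [1, 8, 8, 16] ends up with byte strides of
            # 1 (C), 16 (W), 128 (H) and 1024 (N), before any compression scaling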
            for i in stride_order:
                strides[i] = stride
                stride *= augmented_shape[i]
        else:
            assert len(strides) == 5
            strides[4] = stride
            strides[3] = 16 * stride  # STRIDE_X
            strides[1] = strides[3] * augmented_shape[2]  # STRIDE_C
            strides[2] = augmented_shape[2] * augmented_shape[3] * stride  # STRIDE_Y
            strides[0] = strides[2] * augmented_shape[1]  # STRIDE_N

        return strides, augmented_coord

    def get_strides(self) -> Shape:
        strides, _ = self.get_strides_and_coord()
        assert strides is not None
        return strides

    def needs_dma(self) -> bool:
        return len(self.ops) == 1 and self.ops[0].type == Op.DMA

    def get_dma_src_tensor(self) -> "Optional[Tensor]":
        # For weight tensors that need DMA: returns the source tensor in Flash, else None
        # Note: for DMA ops, Pass.weight_tensor is referring to the SRAM weight tensor
        return self.ops[0].inputs[0] if self.needs_dma() else None

    def find_npu_op(self) -> Optional[Operation]:
        # Returns the NPU operator that uses this tensor, excluding DMA operators.
        for op in self.consumers():
            if op.type == Op.DMA:
                return op.outputs[0].find_npu_op()
            if op.run_on_npu:
                return op
        return None

    def compressed_stream_index_from_coord(self, coord: Shape) -> int:
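        # Maps a depth coordinate to the index of the compressed weight stream that holds it;
        # e.g. with a brick depth of 16, a depth coordinate of 32 lands in stream index 2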
        assert self.format == TensorFormat.WeightsCompressed
        assert self.compressed_values is not None
        assert len(self.compressed_values) > 0
        assert len(self.compressed_values) + 1 == len(self.weight_compressed_offsets)

        depth = coord[-1]
        brick_depth = self.brick_size[-1]
        # Clamp position at final element index
        if depth > self.shape[-1]:
            depth = self.shape[-1]

        # Always round up to next boundary
        index = numeric_util.round_up_divide(depth, brick_depth)

        # Check boundaries on all but last weight set (which may be shorter
        # than the brick we divided it up into)
        if index < len(self.weight_compressed_offsets) - 1:
            # There are no half-way points in the weights
            if (depth % brick_depth) != 0:
                raise Exception("Offset into weights must be aligned to a brick")

        return index

    def size_of_compressed_stream(self, index: int) -> int:
        assert self.compressed_values is not None
        assert 0 <= index < len(self.compressed_values)
        return len(self.compressed_values[index])

    def is_last_index_in_compressed_stream(self, index: int) -> bool:
        assert self.compressed_values is not None
        assert 0 <= index < len(self.compressed_values)
        return index == len(self.compressed_values) - 1

    def address_offset_for_coordinate(self, orig_coord: Shape, is_top_box: bool = False) -> Optional[int]:
        address_offset = 0
        coord = orig_coord

        coord = coord[-len(self.storage_shape) :]

        if self.sub_purpose == TensorSubPurpose.Standard:
            for idx, c in enumerate(coord):
                if is_top_box:
                    assert c > 0 and c <= self.shape[idx]
                else:
                    assert c >= 0 and c < self.shape[idx]

        if self.format == TensorFormat.WeightsCompressed:
            if len(self.weight_compressed_offsets) == 0:
                return 0

            if self.needs_dma() and self.sub_purpose == TensorSubPurpose.DoubleBuffer:
                depth = orig_coord[-1]
                brick_depth = self.brick_size[-1]
                # Clamp position at final element index
                if depth > self.shape[-1]:
                    depth = self.shape[-1]

                # Always round up to next boundary
                index = numeric_util.round_up_divide(depth, brick_depth)
                index = index % 2
                assert self.compressed_values is not None

                if len(self.compressed_values) <= 2:
                    if is_top_box and index == 0:
                        for cv in self.compressed_values:
                            address_offset += len(cv)
                    else:
                        address_offset = index * len(self.compressed_values[0])
                else:
                    if is_top_box and index == 0:
                        address_offset = self.storage_shape[-1]
                    else:
                        address_offset = index * (self.storage_shape[-1] // 2)
            else:
                index = self.compressed_stream_index_from_coord(orig_coord)
                assert index < len(self.weight_compressed_offsets)
                address_offset = self.weight_compressed_offsets[index]
        else:
            if is_top_box:
                coord = [c - 1 for c in coord]

            # handle wraparound for partial buffers. make sure to do this after subtracting top box:
            coord = [c % self.storage_shape[idx] for idx, c in enumerate(coord)]

            strides, augmented_coord = self.get_strides_and_coord(coord)
            if strides is None:
                return None

            if is_top_box:
                address_offset += 1 * strides[-1]  # one element

            address_offset += np.dot(augmented_coord, strides)

        assert address_offset >= 0
        assert address_offset <= self.storage_size()
        return address_offset

    def is_allocated_in_tensor_arena(self, scratch_tensor_mem_area: MemArea) -> bool:
        return (self.mem_area == scratch_tensor_mem_area) and (self.mem_type in (MemType.Scratch, MemType.Scratch_fast))

    def equivalent(self, tens: "Tensor") -> bool:
        return self.equivalence_id == tens.equivalence_id

    def set_all_shapes(self, shape: Shape):
        self.shape = shape
        self.storage_shape = shape
        self.bandwidth_shape = shape

    def get_full_shape(self) -> Shape:
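        # Pads the shape out to 4 dimensions, e.g. a 2D shape [8, 16] is returned as
        # [8, 1, 1, 16]; shapes that are already 4D are returned as a copy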
        d = len(self.shape)
        if d in (1, 3):
            return numeric_util.full_shape(4, self.shape, 1)
        elif d == 2:
            return [self.shape[0], 1, 1, self.shape[1]]
        else:
            return self.shape.copy()

    def is_quantized(self) -> bool:
        # a tensor is quantized if it has an integral type and it contains valid quantization params

        if not isinstance(self.quantization, QuantizationParameters):
            return False

        return (self.dtype.type & BaseType.Int) != 0 and self.quantization.is_valid()

    def __str__(self):
        return "<nng.Tensor '%s' shape=%s dtype=%s>" % (self.name, self.shape, self.dtype)

    __repr__ = __str__


def check_quantized_tens_scaling_equal(tens_a: Tensor, tens_b: Tensor) -> bool:
    # checks that the scaling of two quantized tensors is equal

    return tens_a.is_quantized() and tens_b.is_quantized() and tens_a.quantization.is_scaling_equal(tens_b.quantization)
Tim Hall89567612020-10-27 11:57:57 +0000835 return tens_a.is_quantized() and tens_b.is_quantized() and tens_a.quantization.is_scaling_equal(tens_b.quantization)