Blame - ethosu/vela/tensor.py - ml/ethos-u/ethos-u-vela

2020-04-27 18:20:16 +0100

[diff] [blame]

2

#

3

# SPDX-License-Identifier: Apache-2.0

4

#

5

# Licensed under the Apache License, Version 2.0 (the License); you may

6

# not use this file except in compliance with the License.

7

# You may obtain a copy of the License at

8

#

9

# www.apache.org/licenses/LICENSE-2.0

10

#

11

# Unless required by applicable law or agreed to in writing, software

12

# distributed under the License is distributed on an AS IS BASIS, WITHOUT

13

# WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.

14

# See the License for the specific language governing permissions and

15

# limitations under the License.

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

16

# Description:

17

# Internal representation of a Neural Network Tensor.

Patrik Gustavsson

2020-11-04 12:43:50 +0100

[diff] [blame]

18

import copy

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

19

import enum

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

20

import uuid

Jacob Bohlin

2020-09-11 10:04:15 +0200

[diff] [blame]

21

from collections import defaultdict

Diqing Zhong

f842b69

2020-12-11 13:07:37 +0100

[diff] [blame]

22

from enum import auto

Louis Verhaard

2020-09-23 10:27:11 +0200

[diff] [blame]

23

from functools import lru_cache

Louis Verhaard

6c74c3b

2020-12-17 13:54:09 +0100

[diff] [blame]

24

from functools import total_ordering

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

25

from typing import Dict

26

from typing import List

27

from typing import Optional

28

from typing import Tuple

29

from typing import Union

30

from uuid import UUID

Diego Russo

ea6111a

2020-04-14 18:41:58 +0100

[diff] [blame]

import numpy as np

from . import numeric_util

Tim Hall

2020-09-09 21:58:15 +0100

[diff] [blame]

35

from .data_type import BaseType

Michael McGeagh

2020-08-06 17:31:02 +0100

[diff] [blame]

36

from .data_type import DataType

Michael McGeagh

2020-12-16 11:33:21 +0000

[diff] [blame]

37

from .errors import UnsupportedFeatureError

38

from .errors import VelaError

Dwight Lidman

a9390f7

2020-05-13 12:00:08 +0200

[diff] [blame]

39

from .ethos_u55_regs.ethos_u55_regs import resampling_mode

Patrik Gustavsson

2020-12-01 16:02:29 +0100

[diff] [blame]

40

from .numeric_util import full_shape

Louis Verhaard

aee5d75

2020-09-30 09:01:52 +0200

[diff] [blame]

41

from .operation import Op

Michael McGeagh

2020-08-06 17:31:02 +0100

[diff] [blame]

42

from .operation import Operation

patrik.gustavsson

eeb8515

2020-12-21 17:10:40 +0000

[diff] [blame]

43

from .shape4d import Shape4D

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

44

45

Shape = List

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

46

47

Patrik Gustavsson

2020-05-27 09:15:11 +0200

[diff] [blame]

48

class MemType(enum.IntFlag):
    """Memory types a tensor can be assigned to.

    ``Size`` is one past the last real member. ``all()`` lists the concrete
    memory types, leaving out ``Unknown`` and ``Size``.
    """

    Unknown = 0
    Permanent_NPU = 1
    Permanent_CPU = 2
    Scratch = 3
    Scratch_fast = 4
    Size = Scratch_fast + 1

    def display_name(self) -> str:
        """Return the human-readable label, looked up by the member's integer value."""
        labels = ("Unknown", "Permanent_NPU", "Permanent_CPU", "Scratch", "Scratch_fast", "Size")
        return labels[self.value]

    def identifier_name(self) -> str:
        """Return the lower-case identifier, looked up by the member's integer value."""
        identifiers = ("unknown", "permanent_npu", "permanent_cpu", "scratch", "scratch_fast", "size")
        return identifiers[self.value]

    @staticmethod
    def all():
        """Return the tuple of concrete memory types."""
        concrete = (
            MemType.Permanent_NPU,
            MemType.Permanent_CPU,
            MemType.Scratch,
            MemType.Scratch_fast,
        )
        return concrete

    def __str__(self):
        # Print just the member name rather than the default "MemType.X" form
        return self.name

Diqing Zhong

2020-12-11 13:07:37 +0100

[diff] [blame]

70

class BandwidthDirection(enum.IntEnum):
    """Direction of a memory transfer; ``Size`` counts the real directions."""

    Read = 0
    Write = auto()
    Size = auto()

    def display_name(self):
        """Return the member name unchanged."""
        return self.name

    def identifier_name(self):
        """Return the member name in lower case."""
        return self.display_name().lower()

    @staticmethod
    def all():
        """Return the tuple of real directions (``Size`` is excluded)."""
        return BandwidthDirection.Read, BandwidthDirection.Write

84

85

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

86

class MemArea(enum.IntFlag):
    """Memory areas a tensor can be placed in.

    ``Size`` is one past the last real member. ``all()`` lists the concrete
    areas, leaving out ``Unknown`` and ``Size``.
    """

    Unknown = 0
    Sram = 1
    Dram = 2
    OnChipFlash = 3
    OffChipFlash = 4
    Shram = 5  # for LUT
    Size = Shram + 1

    def display_name(self) -> str:
        """Return the human-readable label, looked up by the member's integer value."""
        labels = ("Unknown", "SRAM", "DRAM", "On-chip Flash", "Off-chip Flash", "SHRAM", "Size")
        return labels[self.value]

    def identifier_name(self) -> str:
        """Return the lower-case identifier, looked up by the member's integer value."""
        identifiers = ("unknown", "sram", "dram", "on_chip_flash", "off_chip_flash", "shram", "size")
        return identifiers[self.value]

    @staticmethod
    def all():
        """Return the tuple of concrete memory areas."""
        concrete = (
            MemArea.Sram,
            MemArea.Dram,
            MemArea.OnChipFlash,
            MemArea.OffChipFlash,
            MemArea.Shram,
        )
        return concrete

    def __str__(self):
        # Print just the member name rather than the default "MemArea.X" form
        return self.name

class TensorPurpose(enum.IntFlag):
    """What a tensor is used for; ``Size`` is one past the last real member."""

    Unknown = 0
    Weights = 1
    FeatureMap = 2
    Scratch = 3
    ScratchFast = 4
    LUT = 5
    FSBias = 6
    Size = 7

    def display_name(self) -> str:
        """Return the human-readable label, looked up by the member's integer value."""
        labels = (
            "Unknown",
            "Weights",
            "FeatureMap",
            "Scratch",
            "ScratchFast",
            "LUT",
            "FastStorageBias",
            "Size",
        )
        return labels[self.value]

    def identifier_name(self) -> str:
        """Return the lower-case identifier, looked up by the member's integer value."""
        identifiers = (
            "unknown",
            "weights",
            "feature_map",
            "scratch",
            "scratch_fast",
            "lut",
            "fast_storage_bias",
            "size",
        )
        return identifiers[self.value]

    @staticmethod
    def all():
        """Return the purposes exposed by this helper: Weights, FeatureMap and FSBias."""
        return TensorPurpose.Weights, TensorPurpose.FeatureMap, TensorPurpose.FSBias

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

132

133

134

class TensorSubPurpose(enum.Enum):
    """Buffering scheme applied to a tensor (standard, double or rolling buffer)."""

    Standard = 0
    DoubleBuffer = 1
    RollingBufferX = 2
    RollingBufferY = 3
    RollingBufferXY = 4

    def display_name(self) -> str:
        """Return the human-readable label, looked up by the member's integer value."""
        labels = ("Standard", "Double Buffer", "Rolling Buffer X", "Rolling Buffer Y", "Rolling Buffer XY")
        return labels[self.value]

    def identifier_name(self) -> str:
        """Return the lower-case identifier, looked up by the member's integer value."""
        identifiers = ("standard", "double_buffer", "rolling_buffer_x", "rolling_buffer_y", "rolling_buffer_xy")
        return identifiers[self.value]

    @staticmethod
    def all():
        """Return every member, in definition order."""
        return tuple(TensorSubPurpose)

class TensorFormat(enum.Flag):
    """Storage format of a tensor."""

    Unknown = 0
    WeightsCompressed = 1
    NHWC = 2
    NHCWB16 = 3

    def __str__(self):
        # Print just the member name rather than the default "TensorFormat.X" form
        member_name = self.name
        return member_name

class TensorBlockTraversal(enum.Enum):
    """Block traversal order recorded on a tensor."""

    Default = 0
    DepthWise = 1
    DepthFirst = 2
    PartKernelFirst = 3

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

175

def shape_num_elements(shp: Shape) -> Optional[int]:
    """Return the product of all dimensions in ``shp``.

    Returns None when ``shp`` itself is None or when any dimension is None
    (i.e. the shape is not fully known). An empty shape yields 1.
    """
    if shp is None:
        return None

    total = 1
    for dim in shp:
        if dim is None:
            # A single unknown dimension makes the element count unknown
            return None
        total *= dim
    return total

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

186

def shape_fully_defined(shp: Shape) -> bool:
    """Return True when ``shp`` is not None and none of its dimensions is None."""
    return shp is not None and all(dim is not None for dim in shp)

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

195

def shape_round_to_quantum(shp: Shape, quantum: Tuple) -> Shape:
    """Return a copy of ``shp`` with each known dimension rounded up to its quantum.

    Dimensions and quantums are paired from the innermost (last) axis outwards,
    because there may be more rounding quantums than shape elements. Dimensions
    that are None are left untouched. The input shape is not modified.
    """
    rounded = list(shp)

    # Negative indices keep the pairing aligned to the end of both sequences
    for offset in range(1, len(shp) + 1):
        idx = -offset
        dim = rounded[idx]
        if dim is None:
            continue
        rounded[idx] = numeric_util.round_up(dim, quantum[idx])

    return rounded

Louis Verhaard

2020-09-23 10:27:11 +0200

[diff] [blame]

205

@lru_cache(maxsize=None)
def create_equivalence_id(key) -> UUID:
    """Return an equivalence id for ``key``.

    The id itself is a random UUID. The unbounded ``lru_cache`` is what ties it
    to the key, so repeated calls with the same (hashable) key return the same id.
    """
    new_id = uuid.uuid4()
    return new_id

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

211

class QuantizationParameters:
    """Quantisation parameters of a tensor: float range, bit width, scale and zero point.

    ``min``, ``max``, ``scale_f32`` and ``zero_point`` may each hold a scalar or
    a NumPy array; ``is_per_axis`` reports whether any of them is an array.
    """

    __slots__ = "min", "max", "num_bits", "narrow_range", "scale_f32", "zero_point", "quant_min", "quant_max"

    def __init__(
        self,
        min: Union[float, np.ndarray, None] = None,
        max: Union[float, np.ndarray, None] = None,
        num_bits=None,
        narrow_range=None,
    ):
        self.min = min
        self.max = max

        self.num_bits = num_bits
        self.narrow_range = narrow_range

        self.scale_f32: Union[float, np.ndarray, None] = None
        self.zero_point: Union[int, np.ndarray, None] = None
        self.quant_min: Optional[float] = None
        self.quant_max: Optional[float] = None

    def __str__(self):
        return "<nng.QuantizationParameters min=%s max=%s, num_bits=%s, scale=%s, zero_point=%s>" % (
            self.min,
            self.max,
            self.num_bits,
            self.scale_f32,
            self.zero_point,
        )

    __repr__ = __str__

    def clone(self) -> "QuantizationParameters":
        """Return a new instance with every field copied by reference (arrays are shared)."""
        res = QuantizationParameters()
        res.min = self.min
        res.max = self.max

        res.num_bits = self.num_bits
        res.narrow_range = self.narrow_range

        res.scale_f32 = self.scale_f32
        res.zero_point = self.zero_point
        res.quant_min = self.quant_min
        res.quant_max = self.quant_max
        return res

    def dequantize(self, values) -> np.ndarray:
        """Return ``(values - zero_point) * scale_f32``."""
        return np.subtract(values, self.zero_point) * self.scale_f32

    @staticmethod
    def _values_equal(a, b) -> bool:
        """Compare two scalar-or-array parameters and always return a plain bool.

        A bare ``a == b`` yields an array for ndarray operands, which cannot be
        used in a boolean context. Operands are compared with broadcasting so a
        scalar still matches an array filled with that value; shapes that cannot
        be broadcast together compare unequal.
        """
        if a is None or b is None:
            return a is None and b is None
        try:
            lhs, rhs = np.broadcast_arrays(np.asarray(a), np.asarray(b))
        except ValueError:
            # Incompatible shapes can never describe the same scaling
            return False
        return bool(np.array_equal(lhs, rhs))

    def is_scaling_equal(self, other: Optional["QuantizationParameters"]) -> bool:
        """Return True when ``other`` has the same scale and zero point as this object."""
        # quantisation parameter scaling is not equal if 'other' is None because
        # it implies that the tensor it belongs to is not quantised. otherwise,
        # it depends upon whether the scale and zero point are equal

        if not isinstance(other, QuantizationParameters):
            return False

        return self._values_equal(self.scale_f32, other.scale_f32) and self._values_equal(
            self.zero_point, other.zero_point
        )

    def is_valid(self) -> bool:
        """Return True when both a scale and a zero point have been set."""
        # quantisation parameters are considered valid if they have a scale and zero point.
        # Identity checks are used because "None in (array, ...)" compares element-wise
        # and raises for multi-element arrays.
        return self.scale_f32 is not None and self.zero_point is not None

    def is_per_axis(self) -> bool:
        """Returns True if either the scale, zero point, minimum or maximum values are arrays"""
        for attr in ("scale_f32", "zero_point", "min", "max"):
            if isinstance(getattr(self, attr), np.ndarray):
                return True
        return False

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

282

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

283

def create_const_tensor(
    name: str,
    shape: Shape,
    dtype: DataType,
    values: np.ndarray,
    value_dtype: np.dtype = None,
    purpose: TensorPurpose = TensorPurpose.Unknown,
    quantization: QuantizationParameters = None,
):
    """Create a constant tensor together with the Const operation that produces it.

    The tensor is named ``name + "_0"`` and the operation ``name``. ``values``
    is converted with ``np.array(values, dtype=value_dtype)``. Returns the
    tensor; the operation is reachable through it once attached as its output.
    """
    # Tensor
    tens = Tensor(shape, dtype, name + "_0")
    tens.purpose = purpose
    tens.quantization = quantization
    tens.values = np.array(values, dtype=value_dtype)

    # Operator
    op = Operation(Op.Const, name)
    op.set_output_tensor(tens)
    op.set_ifm_ofm_shapes()

    return tens

Jacob Bohlin

2020-09-11 10:04:15 +0200

[diff] [blame]

304

# Class that keeps track of all tensor addresses in the different memory types
class TensorAddressMap:
    """Class-level registry of tensor addresses.

    Addresses are keyed first by the tensor's equivalence id and then by memory
    type, so tensors sharing an equivalence id share an address per memory type.
    """

    address_map: Dict = defaultdict(dict)  # dict (tens.equivalence_id -> dict (mem_type -> address))

    @classmethod
    def get_address_for_tens(cls, tens_id: UUID, mem_type: MemType) -> Optional[int]:
        """Return the address stored for ``tens_id`` in ``mem_type``, or None if there is none."""
        # Use .get() rather than indexing: indexing a defaultdict inserts an empty
        # entry for every tensor that is merely queried.
        per_tensor = cls.address_map.get(tens_id)
        if per_tensor is None:
            return None
        return per_tensor.get(mem_type)

    @classmethod
    def set_address_for_tens(cls, tens_id: UUID, mem_type: MemType, address: int):
        """Store ``address`` for ``tens_id`` in ``mem_type``.

        Asserts that an already assigned, non-None address is not replaced by a
        different non-None address.
        """
        # Check previous address if there is one
        previous_address = cls.address_map[tens_id].get(mem_type)
        if address is not None and previous_address is not None:
            assert previous_address == address, "Two different addresses cannot be assigned to the same tensor."

        # Set tensor's address for memory type
        cls.address_map[tens_id][mem_type] = address

321

322

Louis Verhaard

6c74c3b

2020-12-17 13:54:09 +0100

[diff] [blame]

323

@total_ordering

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

class Tensor:

__slots__ = (

"shape",

"storage_shape",

"bandwidth_shape",

"dtype",

"name",

Fredrik Svedberg

8d0f489

2021-02-16 21:59:50 +0100

[diff] [blame]

331

"is_variable",

Tim Hall

2021-05-27 18:49:40 +0100

[diff] [blame]

332

"pre_buffer",

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

333

"ops",

334

"consumer_list",

335

"values",

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

336

"compressed_values",

Tim Hall

f7e810a

2020-06-25 15:04:31 +0100

[diff] [blame]

337

"compressed_values_substream_offsets",

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

338

"mem_area",

Patrik Gustavsson

2020-05-27 09:15:11 +0200

[diff] [blame]

339

"mem_type",

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

"format",

"purpose",

"sub_purpose",

"alignment",

"weight_transpose_depthwise",

345

"storage_compression_scale",

346

"bandwidth_compression_scale",

347

"compression_scale_for_worst_weight_stream",

348

"weight_compression_scales",

349

"weight_compression_config",

Louis Verhaard

2020-09-23 10:27:11 +0200

[diff] [blame]

350

"value_id",

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

351

"storage_rounding_quantum",

352

"brick_size",

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

353

"quantization",

354

"weight_compressed_offsets",

355

"element_size_bytes",

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

356

"block_traversal",

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

357

"equivalence_id",

Dwight Lidman

a9390f7

2020-05-13 12:00:08 +0200

[diff] [blame]

358

"resampling_mode",

Tim Hall

2021-05-27 18:49:40 +0100

[diff] [blame]

359

"src_tensor",

Patrik Gustavsson

ee99bb1

2021-04-08 09:04:00 +0200

[diff] [blame]

360

"needs_linear_format",

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

361

)

362

AllocationQuantum = 16

363

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

364

def __init__(self, shape: Shape, dtype: DataType, name: str):
    """Create a tensor with the given shape, data type and name.

    Storage and bandwidth shapes start out as the same object as ``shape``;
    every other attribute gets a neutral default.
    """
    # Shapes
    self.shape = shape
    self.storage_shape = shape
    self.bandwidth_shape = shape

    # Identity
    self.dtype = dtype
    self.name = name
    self.is_variable = False
    self.pre_buffer = False
    self.equivalence_id: UUID = uuid.uuid4()

    # Graph connectivity
    self.ops: List[Operation] = []
    self.consumer_list: List[Operation] = []

    # Data
    self.values: Optional[np.ndarray] = None  # elements are of type self.dtype
    self.compressed_values: Optional[np.ndarray] = None
    self.compressed_values_substream_offsets: Optional[List] = None

    # Placement and role
    self.mem_area: MemArea = MemArea.Unknown
    self.mem_type: MemType = MemType.Unknown
    self.format: TensorFormat = TensorFormat.Unknown
    self.purpose: TensorPurpose = TensorPurpose.Unknown
    self.sub_purpose: TensorSubPurpose = TensorSubPurpose.Standard
    self.alignment: int = Tensor.AllocationQuantum
    self.weight_transpose_depthwise: bool = False

    # Compression bookkeeping
    self.storage_compression_scale: float = 1.0
    self.bandwidth_compression_scale: float = 1.0
    self.compression_scale_for_worst_weight_stream: float = 1.0
    self.weight_compression_scales: Optional[np.ndarray] = None
    # if two tensors have the same weight_compression_config, then they have the same compressed values
    self.weight_compression_config = None
    # if two tensors have the same value_id, then they have the same values
    self.value_id: UUID = uuid.uuid4()
    self.weight_compressed_offsets: List = []
    self.storage_rounding_quantum: Tuple = (1, 1, 1, 1)
    self.brick_size: Tuple = (1, 1, 1, 1)
    self.element_size_bytes: int = 0

    # quantization parameters
    self.quantization: Optional[QuantizationParameters] = None
    self.block_traversal: TensorBlockTraversal = TensorBlockTraversal.Default
    self.resampling_mode: resampling_mode = resampling_mode.NONE

    self.needs_linear_format = True

    # Reference to parent-tensor if this tensor is a clone
    self.src_tensor = None

410

Jacob Bohlin

2020-09-11 10:04:15 +0200

[diff] [blame]

411

@property
def address(self) -> int:
    """Address of this tensor, looked up in TensorAddressMap.

    The lookup key is the tensor's equivalence id together with its current
    memory type.
    """
    tens_id = self.equivalence_id
    return TensorAddressMap.get_address_for_tens(tens_id, self.mem_type)

@address.setter
def address(self, address: int):
    # Stored centrally in TensorAddressMap, under this tensor's equivalence id and memory type
    tens_id = self.equivalence_id
    TensorAddressMap.set_address_for_tens(tens_id, self.mem_type, address)

418

Patrik Gustavsson

2021-01-21 08:28:55 +0100

[diff] [blame]

419

@property
def is_standard_fm(self) -> bool:
    """True when the tensor is a feature map with the Standard sub-purpose."""
    if not (self.sub_purpose == TensorSubPurpose.Standard):
        return False
    return self.purpose == TensorPurpose.FeatureMap

422

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

423

def element_size(self) -> int:
    """Return the size of one element in bytes.

    An explicit non-zero ``element_size_bytes`` wins; otherwise the size is
    derived from the data type as ``size_in_bits() / 8`` (true division, so
    the derived value is a float).
    """
    if self.element_size_bytes != 0:
        return self.element_size_bytes
    return self.dtype.size_in_bits() / 8

427

Patrik Gustavsson

2020-11-04 12:43:50 +0100

[diff] [blame]

428

def clone(self, suffix="_clone", set_unique: bool = False) -> "Tensor":
    """Return a copy of this tensor, renamed to ``self.name + suffix``.

    The copy starts as ``copy.copy(self)`` (shallow). It then receives its own
    storage/bandwidth shape lists, a cloned quantization object if one is set,
    and empty ``ops`` and ``consumer_list`` lists. All other attributes,
    including ``shape`` and ``values``, still refer to the same objects as the
    original.

    With ``set_unique=True`` the copy also gets a fresh ``equivalence_id``;
    otherwise it keeps the original's.
    """
    res = copy.copy(self)
    if set_unique:
        res.equivalence_id = uuid.uuid4()

    # Shapes may legitimately be None (unknown shape); list(None) would raise TypeError
    res.storage_shape = None if self.storage_shape is None else list(self.storage_shape)
    res.bandwidth_shape = None if self.bandwidth_shape is None else list(self.bandwidth_shape)
    if self.quantization is not None:
        res.quantization = self.quantization.clone()

    res.name = res.name + suffix
    # The references to Operators are deliberately empty on the returned copy
    res.ops = []
    res.consumer_list = []

    return res

446

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

447

def clone_into_fast_storage(self, arch) -> "Tensor":
    """Return a clone (suffix ``"_fast_storage"``) placed in the fast storage area.

    The clone's memory area comes from ``arch.fast_storage_mem_area``, its
    memory type is ``MemType.Scratch_fast`` and its ``src_tensor`` points back
    at this tensor.
    """
    fast_copy = self.clone(suffix="_fast_storage")
    fast_copy.src_tensor = self
    fast_copy.mem_type = MemType.Scratch_fast
    fast_copy.mem_area = arch.fast_storage_mem_area
    return fast_copy

453

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

454

def copy_compressed_weight_info(self, src_tens: "Tensor"):
    """Copy compressed values and all related weight compression info from ``src_tens``.

    Attributes are copied by reference, and the equivalence id and value id are
    taken over as well.
    """
    copied_attributes = (
        "equivalence_id",
        "compressed_values",
        "compressed_values_substream_offsets",
        "storage_shape",
        "brick_size",
        "weight_compression_scales",
        "weight_compressed_offsets",
        "weight_transpose_depthwise",
        "compression_scale_for_worst_weight_stream",
        "storage_compression_scale",
        "bandwidth_compression_scale",
        "block_traversal",
        "weight_compression_config",
        "value_id",
    )
    for attr in copied_attributes:
        setattr(self, attr, getattr(src_tens, attr))

Louis Verhaard

2020-05-07 08:12:58 +0200

[diff] [blame]

470

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

471

def set_format(self, fmt: TensorFormat, arch):
    """Set the tensor format and derive rounding quantum, brick size and shapes from it.

    For shapes with more than four dimensions only ``format`` is updated.
    Otherwise the architecture's per-format rounding quantums and brick sizes
    are trimmed to the rank of the shape, and (when the shape is known) the
    bandwidth and storage shapes are rounded up accordingly. For the
    WeightsCompressed format the three compression scales are set to 5/8.
    """
    self.format = fmt

    # A shape without a length (e.g. None) is treated as rank 0
    try:
        shape_len = len(self.shape)
    except TypeError:
        shape_len = 0

    if shape_len > 4:
        return

    assert not (self.needs_linear_format and fmt == TensorFormat.NHCWB16)

    # Keep only the trailing entries matching the rank; a rank of 0 keeps all of them
    format_quantum = arch.storage_rounding_quantums[self.format]
    self.storage_rounding_quantum = format_quantum
    self.storage_rounding_quantum = tuple(format_quantum[-shape_len:])
    format_brick = arch.brick_sizes[self.format]
    self.brick_size = format_brick
    self.brick_size = tuple(format_brick[-shape_len:])

    if self.shape is None:
        return

    self.bandwidth_shape = shape_round_to_quantum(self.shape, self.brick_size)
    self.storage_shape = shape_round_to_quantum(self.shape, self.storage_rounding_quantum)

    if fmt == TensorFormat.WeightsCompressed:
        # NOTE(review): 5/8 looks like an initial estimate of the weight compression ratio - confirm
        compression_ratio = 5 / 8
        self.storage_compression_scale = compression_ratio
        self.bandwidth_compression_scale = compression_ratio
        self.compression_scale_for_worst_weight_stream = compression_ratio

497

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

498

def storage_elements(self) -> int:
    """Return the number of elements in the storage shape, or 0 if it is not fully known."""
    count = shape_num_elements(self.storage_shape)
    return 0 if count is None else count

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

504

def elements(self) -> int:
    """Return the number of elements in the tensor shape, or 0 if it is not fully known."""
    count = shape_num_elements(self.shape)
    return 0 if count is None else count

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

510

def has_fully_defined_shape(self) -> bool:
    """Return True when the tensor shape is set and contains no None dimensions."""
    fully_defined = shape_fully_defined(self.shape)
    return fully_defined

512

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

513

def storage_size(self, scale: float = 1.0) -> int:
    """Return the storage size in bytes, scaled by ``scale`` and rounded up to the alignment.

    A size of zero is bumped to one byte before rounding, so the tensor always
    takes up space.
    """
    unaligned = self.storage_elements() * self.element_size() * scale
    unaligned = 1 if unaligned == 0 else unaligned  # force it to take up space
    whole_bytes = numeric_util.round_up_to_int(unaligned)
    return numeric_util.round_up(whole_bytes, self.alignment)

519

Patrik Gustavsson

2021-01-21 08:28:55 +0100

[diff] [blame]

520

def storage_size_for_shape(self, op_storage_shape: Shape) -> int:
    """Return the aligned storage size in bytes for an explicitly given storage shape.

    An unknown or empty element count is treated as zero elements, and a size
    of zero is bumped to one byte before rounding up to the alignment.
    """
    count = shape_num_elements(op_storage_shape) or 0
    unaligned = count * self.element_size()
    unaligned = 1 if unaligned == 0 else unaligned  # force it to take up space
    whole_bytes = numeric_util.round_up_to_int(unaligned)
    return numeric_util.round_up(whole_bytes, self.alignment)

528

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

529

def storage_shape_for_sub_purpose(
    self, sub_purpose: TensorSubPurpose, param_a: Optional[int], param_b: Optional[int]
) -> Shape:
    """Return the storage shape this tensor would need for ``sub_purpose``.

    DoubleBuffer works on a copy of ``self.shape`` and caps the last dimension
    at ``2 * param_a``. All other sub-purposes start from the storage shape
    extended to four dimensions; the rolling buffer variants set the first
    dimension to 1 and cap index 2 (X) and/or index 1 (Y) with ``param_a`` /
    ``param_b``. The tensor itself is not modified.
    """
    if sub_purpose == TensorSubPurpose.DoubleBuffer:
        double_buffered = list(self.shape)
        assert len(double_buffered) >= 2
        assert param_a is not None
        double_buffered[-1] = min(double_buffered[-1], param_a * 2)
        return double_buffered

    shp = full_shape(4, self.storage_shape, 1)

    if sub_purpose == TensorSubPurpose.RollingBufferX:
        assert len(shp) == 4
        assert param_a is not None
        shp[0] = 1
        shp[2] = min(shp[2], param_a)
    elif sub_purpose == TensorSubPurpose.RollingBufferY:
        assert len(shp) == 4
        assert param_a is not None
        shp[0] = 1
        shp[1] = min(shp[1], param_a)
    elif sub_purpose == TensorSubPurpose.RollingBufferXY:
        assert len(shp) == 4
        assert param_a is not None
        assert param_b is not None
        shp[0] = 1
        # For XY, param_a caps index 2 and param_b caps index 1
        shp[2] = min(shp[2], param_a)
        shp[1] = min(shp[1], param_b)
    elif not (sub_purpose == TensorSubPurpose.Standard):
        assert 0, "did not expect new sub purpose %s" % (sub_purpose,)

    return shp

562

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

563

def set_new_sub_purpose(self, sub_purpose: TensorSubPurpose, param_a=None, param_b=None):
    """Switch the tensor to ``sub_purpose`` and update its storage shape to match.

    For DoubleBuffer the storage compression scale is additionally replaced by
    the compression scale of the worst weight stream.
    """
    new_storage_shape = self.storage_shape_for_sub_purpose(sub_purpose, param_a, param_b)
    self.storage_shape = new_storage_shape
    self.sub_purpose = sub_purpose

    if sub_purpose == TensorSubPurpose.DoubleBuffer:
        worst_case_scale = self.compression_scale_for_worst_weight_stream
        self.storage_compression_scale = worst_case_scale

568

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

569

def bandwidth(self) -> float:
    """Return bandwidth-shape elements * element size * bandwidth compression scale.

    Returns 0 when the bandwidth shape is not fully known.
    """
    count = shape_num_elements(self.bandwidth_shape)
    if count is None:
        return 0
    uncompressed = count * self.element_size()
    return uncompressed * self.bandwidth_compression_scale

574

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

575

def consumers(self) -> List[Operation]:
    """Return the tensor's consumer list itself (not a copy)."""
    consuming_ops = self.consumer_list
    return consuming_ops

577

Patrik Gustavsson

2021-01-21 08:28:55 +0100

[diff] [blame]

578

def get_4D_storage_shape_for_shape(self, op_shape4D: Shape4D) -> Shape4D:
    """Return ``op_shape4D`` rounded to this tensor's storage rounding quantum.

    The rounding quantum is first expanded to four entries with ``full_shape``
    (using 1 as the fill value) before being applied.
    """
    quantum_4d = full_shape(4, list(self.storage_rounding_quantum), 1)
    rounded_dims = shape_round_to_quantum(op_shape4D.as_list(), quantum_4d)
    return Shape4D(rounded_dims)

581

582

def addresses_for_rolling_buffer(self, start_coord: Shape, end_coord: Shape, op_shape4D: Shape4D) -> Tuple:
    """Compute the box sizes and corner addresses for a region of this tensor.

    Returns ( box_height0, box_height1, box_width,
              [address_tl, address_tr, address_bl, address_br] ).
    Addresses that are not needed are None. As written, box_height0 is
    returned in both height positions.

    Raises UnsupportedFeatureError when end_coord[2] lies beyond the x
    crossing point.
    """

    def corner_address(y, x):
        # Address of (y, x) using the first and last entries of start_coord
        return self.address_for_coordinate([start_coord[0], y, x, start_coord[3]], op_shape4D=op_shape4D)

    if self.storage_shape == []:
        # Empty storage shape: report a 1x1 box located at the start coordinate
        only_address = self.address_for_coordinate(start_coord, op_shape4D=op_shape4D)
        return (1, 1, 1, [only_address, None, None, None])

    storage_shape_4D = (
        self.get_4D_storage_shape_for_shape(op_shape4D) if self.is_standard_fm else Shape4D(self.storage_shape)
    )

    # Round (start + 1) up against the storage height/width ...
    wrap_y = numeric_util.round_up(start_coord[1] + 1, storage_shape_4D.height)
    wrap_x = numeric_util.round_up(start_coord[2] + 1, storage_shape_4D.width)

    # ... and never let the crossing point go past the end of the region
    crossing_y = min(wrap_y, end_coord[1])
    crossing_x = min(wrap_x, end_coord[2])

    box_height0 = crossing_y - start_coord[1]
    box_width = crossing_x - start_coord[2]

    top_left = self.address_for_coordinate(start_coord, op_shape4D=op_shape4D)
    addresses: List = [top_left, None, None, None]

    if end_coord[2] > crossing_x:
        # The top-right address is still computed before the error is raised
        addresses[1] = corner_address(start_coord[1], crossing_x)
        raise UnsupportedFeatureError("Striping in vertical direction is not supported")
    if end_coord[1] > crossing_y:
        addresses[2] = corner_address(crossing_y, start_coord[2])
    if end_coord[1] > crossing_y and end_coord[2] > crossing_x:
        # NOTE: cannot be reached as written, the x-crossing case raises above
        addresses[3] = corner_address(crossing_y, crossing_x)

    return box_height0, box_height0, box_width, addresses

625

Patrik Gustavsson

2021-01-21 08:28:55 +0100

[diff] [blame]

626

def address_for_coordinate(self, coord: Shape, is_top_box: bool = False, op_shape4D: Shape4D = None) -> int:
    """Return the address of ``coord``: this tensor's ``address`` plus the coordinate's offset.

    The offset comes from ``address_offset_for_coordinate`` and must not be None.
    """
    coord_offset = self.address_offset_for_coordinate(coord, op_shape4D=op_shape4D, is_top_box=is_top_box)
    assert coord_offset is not None
    base_address = self.address
    return base_address + coord_offset

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

630

Patrik Gustavsson

2021-01-21 08:28:55 +0100

[diff] [blame]

631

def get_strides_and_coord(
    self, coord: Optional[Shape] = None, shape4D: Optional[Shape4D] = None
) -> Tuple[Optional[Shape], Optional[Shape]]:
    """Return ``(strides, coord)`` for addressing this tensor in its storage format.

    ``coord`` defaults to zeros (one per storage dimension, at most four) and
    is left-padded with zeros to four entries. For the NHWC and NHCWB16
    formats both returned lists have five entries. For the Unknown and
    WeightsCompressed formats ``(None, None)`` is returned.
    """
    if coord is None:
        coord = [0] * min(len(self.storage_shape), 4)

    if shape4D and self.is_standard_fm:
        shape_4d = self.get_4D_storage_shape_for_shape(shape4D).as_list()
    else:
        shape_4d = full_shape(4, self.storage_shape, 1)

    # Left-pad the coordinate with zeros until it has four entries
    missing_dims = 4 - len(coord)
    coord_4d = [0] * missing_dims + coord if missing_dims > 0 else coord

    assert len(coord_4d) == len(shape_4d)

    if self.format == TensorFormat.NHWC:
        # Move the last dimension to position 1 and append a trailing unit dimension
        aug_shape = [shape_4d[0], shape_4d[3]] + shape_4d[1:3] + [1]
        aug_coord = [coord_4d[0], coord_4d[3]] + coord_4d[1:3] + [0]
        uses_bricks = False
    elif self.format == TensorFormat.NHCWB16:
        channel_divisor = 16
        aug_shape = shape_4d[0:4] + [1]
        # Split the last coordinate into (index // 16) and (index % 16)
        brick_index = coord_4d[3] // channel_divisor
        index_in_brick = coord_4d[3] % channel_divisor
        aug_coord = [coord_4d[0], brick_index] + coord_4d[1:3] + [index_in_brick]

        if aug_shape[1] == 0:
            aug_shape[1] = 1
        uses_bricks = True
    else:
        assert self.format in (TensorFormat.Unknown, TensorFormat.WeightsCompressed)
        return None, None

    strides: List = [0] * len(aug_shape)
    elem_stride = self.element_size() * self.storage_compression_scale

    if uses_bricks:
        assert len(strides) == 5
        strides[4] = elem_stride
        strides[3] = 16 * elem_stride  # STRIDE_X
        strides[1] = strides[3] * aug_shape[2]  # STRIDE_C
        strides[2] = aug_shape[2] * aug_shape[3] * elem_stride  # STRIDE_Y
        strides[0] = strides[2] * aug_shape[1]  # STRIDE_N
    else:
        # Accumulate the stride through the dimensions in this fixed order
        running_stride = elem_stride
        for dim in (4, 1, 3, 2, 0):
            strides[dim] = running_stride
            running_stride *= aug_shape[dim]

    return strides, aug_coord

686

Patrik Gustavsson

2021-01-21 08:28:55 +0100

[diff] [blame]

687

def get_strides(self, shape4D: Optional[Shape4D] = None) -> Shape:
    """Return only the strides part of ``get_strides_and_coord(shape4D=shape4D)``.

    The strides must be available (not None) for this tensor.
    """
    strides, _unused_coord = self.get_strides_and_coord(shape4D=shape4D)
    if strides is None:
        raise AssertionError
    return strides

691

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

692

def find_npu_op(self) -> Optional[Operation]:
    """Return the first consumer of this tensor with ``run_on_npu`` set, or None if there is none."""
    npu_consumers = (consumer for consumer in self.consumers() if consumer.run_on_npu)
    return next(npu_consumers, None)

Louis Verhaard

2020-06-04 15:51:24 +0200

[diff] [blame]

698

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

699

def compressed_stream_index_from_coord(self, coord: Shape) -> int:
    """Return the compressed weight stream index for the last entry of ``coord``.

    Only valid for tensors in WeightsCompressed format that have compressed
    values. Raises UnsupportedFeatureError when the depth is not a multiple of
    the brick depth, except when the index refers to the final offset.
    """
    assert self.format == TensorFormat.WeightsCompressed
    assert self.compressed_values is not None
    assert len(self.compressed_values) > 0
    assert len(self.compressed_values) + 1 == len(self.weight_compressed_offsets)

    requested_depth = coord[-1]
    brick_depth = self.brick_size[-1]
    # Clamp position at final element index
    depth = self.shape[-1] if requested_depth > self.shape[-1] else requested_depth

    # Always round up to next boundary
    index = numeric_util.round_up_divide(depth, brick_depth)

    # Check boundaries on all but last weight set (which may be shorter
    # than the brick we divided it up into).
    # There are no half-way points in the weights
    before_last_offset = index < len(self.weight_compressed_offsets) - 1
    if before_last_offset and (depth % brick_depth) != 0:
        raise UnsupportedFeatureError("Offset into weights must be aligned to a brick")

    return index

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

723

def size_of_compressed_stream(self, index: int) -> int:
    """Return the length of the compressed stream at ``index``.

    ``index`` must be a valid position in ``compressed_values``.
    """
    streams = self.compressed_values
    assert streams is not None
    stream_count = len(streams)
    assert 0 <= index < stream_count
    return len(streams[index])

727

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

728

def is_last_index_in_compressed_stream(self, index: int) -> bool:
    """Return True when ``index`` is the final position in ``compressed_values``.

    ``index`` must be a valid position in ``compressed_values``.
    """
    streams = self.compressed_values
    assert streams is not None
    stream_count = len(streams)
    assert 0 <= index < stream_count
    return index == stream_count - 1

732

Patrik Gustavsson

2021-01-21 08:28:55 +0100

[diff] [blame]

733

def address_offset_for_coordinate(
    self, orig_coord: Shape, op_shape4D: Optional[Shape4D] = None, is_top_box: bool = False
) -> Optional[int]:
    """Return the offset of ``orig_coord`` from the start of this tensor's storage.

    Not valid for tensors whose purpose is Weights. With ``is_top_box`` set the
    coordinate is treated as one past the element in every dimension, and one
    element stride is added to the result. Returns None when no strides are
    available for this tensor's format.
    """
    assert self.purpose != TensorPurpose.Weights

    if self.sub_purpose == TensorSubPurpose.Standard:
        # Standard tensors: the coordinate has to lie inside the shape
        bounds = op_shape4D.as_list() if op_shape4D else self.shape
        for dim, value in enumerate(orig_coord):
            if is_top_box:
                assert 0 < value <= bounds[dim]
            else:
                assert 0 <= value < bounds[dim]

    if op_shape4D and self.is_standard_fm:
        coord = orig_coord
        storage_shape = self.get_4D_storage_shape_for_shape(op_shape4D).as_list()
        storage_size = self.storage_size_for_shape(storage_shape)
    else:
        storage_shape = self.storage_shape
        # Keep only the trailing entries, one per storage dimension
        coord = orig_coord[-len(storage_shape) :]
        storage_size = self.storage_size()

    # handle wraparound for partial buffers. make sure to do this after subtracting top box:
    if is_top_box:
        coord = [(value - 1) % storage_shape[dim] for dim, value in enumerate(coord)]
    else:
        coord = [value % storage_shape[dim] for dim, value in enumerate(coord)]

    strides, augmented_coord = self.get_strides_and_coord(coord, op_shape4D)
    if strides is None:
        return None

    # A top box starts one element further on
    address_offset = strides[-1] if is_top_box else 0
    address_offset += np.dot(augmented_coord, strides)

    assert 0 <= address_offset <= storage_size
    return address_offset

773

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

774

def is_allocated_in_tensor_arena(self, scratch_tensor_mem_area: MemArea) -> bool:
    """Return True when this tensor is in ``scratch_tensor_mem_area`` with a Scratch or Scratch_fast memory type."""
    in_scratch_area = self.mem_area == scratch_tensor_mem_area
    return in_scratch_area and (self.mem_type in (MemType.Scratch, MemType.Scratch_fast))

Patrik Gustavsson

2020-05-27 09:15:11 +0200

[diff] [blame]

776

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

777

def equivalent(self, tens: "Tensor") -> bool:
    """Return True when this tensor and ``tens`` have equal ``equivalence_id`` values."""
    own_id = self.equivalence_id
    other_id = tens.equivalence_id
    return own_id == other_id

779

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

780

def set_all_shapes(self, shape: Shape):
    """Set ``shape``, ``storage_shape`` and ``bandwidth_shape`` to the same ``shape`` object."""
    self.shape = self.storage_shape = self.bandwidth_shape = shape

784

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

785

def get_full_shape(self) -> Shape:
    """Return this tensor's shape expanded to four dimensions where applicable.

    Shapes with 1 or 3 entries are expanded with ``full_shape`` using 1 as the
    fill value. A 2-entry shape [a, b] becomes [a, 1, 1, b]. Any other shape is
    returned as a copy.
    """
    rank = len(self.shape)
    if rank == 2:
        first, last = self.shape[0], self.shape[1]
        return [first, 1, 1, last]
    if rank in (1, 3):
        return full_shape(4, self.shape, 1)
    return self.shape.copy()

Michael McGeagh

2020-08-06 17:31:02 +0100

[diff] [blame]

793

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

794

def is_quantized(self) -> bool:
    """Return True when this tensor has an integral type and valid quantization parameters."""
    # a tensor is quantized if it has an integral type and it contains valid quantization params
    has_quant_params = isinstance(self.quantization, QuantizationParameters)
    if has_quant_params:
        return (self.dtype.type & BaseType.Int) != 0 and self.quantization.is_valid()
    return False

Tim Hall

2020-09-09 21:58:15 +0100

[diff] [blame]

801

James Peet

7519d50

2021-07-19 16:47:58 +0100

[diff] [blame]

802

def get_scalar(self):
    """
    Returns the single value held by this tensor; the tensor must contain exactly one element

    return: Unquantized or dequantized scalar value
    rtype: self.dtype (if unquantized) or float (if dequantized)
    """
    assert self.values.size == 1, "get_scalar called on non-scalar tensor"
    source_values = self.quantization.dequantize(self.values) if self.is_quantized() else self.values
    return source_values.item(0)

812

Louis Verhaard

6c74c3b

2020-12-17 13:54:09 +0100

[diff] [blame]

813

def __lt__(self, other: "Tensor") -> bool:
    """Order tensors by their ``equivalence_id``."""
    own_id, other_id = self.equivalence_id, other.equivalence_id
    return own_id < other_id

815

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

816

def __str__(self):
    """Return a short description containing the tensor's name, shape and dtype."""
    described_fields = (self.name, self.shape, self.dtype)
    return "<nng.Tensor '%s' shape=%s dtype=%s>" % described_fields

# repr() gives the same text as str()
__repr__ = __str__

Tim Hall

2020-09-09 21:58:15 +0100

[diff] [blame]

820

Michael McGeagh

2020-12-16 11:33:21 +0000

[diff] [blame]

821

def error(self, msg):
    """
    Raises a VelaError exception for errors encountered when parsing a Tensor

    The message lists the tensor's driving operators (self.ops) and its
    consuming operators (self.consumer_list), one per line

    :param self: Tensor object that resulted in the error
    :param msg: str object that contains a description of the specific error encountered
    """

    def _describe_operator(position, op):
        # Objects without the expected attributes still get a placeholder line
        op_type = getattr(op, "type", "Not an Operation")
        op_id = getattr(op, "op_index", "-")
        return f" {position} = {op_type} ({op_id})"

    report = [f"Invalid {self.name} tensor. {msg}"]

    report.append(" Driving operators:")
    report.extend(_describe_operator(position, op) for position, op in enumerate(self.ops))

    report.append(" Consuming operators:")
    report.extend(_describe_operator(position, op) for position, op in enumerate(self.consumer_list))

    raise VelaError("\n".join(report))

846

Tim Hall

2020-09-09 21:58:15 +0100

[diff] [blame]

847

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

848

def check_quantized_tens_scaling_equal(tens_a: Tensor, tens_b: Tensor) -> bool:

Tim Hall

2020-09-09 21:58:15 +0100

[diff] [blame]

849

# checks that the scaling of two quantized tensors are equal

850

Tim Hall