Blame - ethosu/vela/tensor.py - ml/ethos-u/ethos-u-vela

2020-04-27 18:20:16 +0100

[diff] [blame]

2

#

3

# SPDX-License-Identifier: Apache-2.0

4

#

5

# Licensed under the Apache License, Version 2.0 (the License); you may

6

# not use this file except in compliance with the License.

7

# You may obtain a copy of the License at

8

#

9

# www.apache.org/licenses/LICENSE-2.0

10

#

11

# Unless required by applicable law or agreed to in writing, software

12

# distributed under the License is distributed on an AS IS BASIS, WITHOUT

13

# WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.

14

# See the License for the specific language governing permissions and

15

# limitations under the License.

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

16

# Description:

17

# Internal representation of a Neural Network Tensor.

Patrik Gustavsson

2020-11-04 12:43:50 +0100

[diff] [blame]

18

import copy

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

19

import enum

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

20

import uuid

Jacob Bohlin

2020-09-11 10:04:15 +0200

[diff] [blame]

21

from collections import defaultdict

Diqing Zhong

f842b69

2020-12-11 13:07:37 +0100

[diff] [blame]

22

from enum import auto

Louis Verhaard

2020-09-23 10:27:11 +0200

[diff] [blame]

23

from functools import lru_cache

Louis Verhaard

6c74c3b

2020-12-17 13:54:09 +0100

[diff] [blame]

24

from functools import total_ordering

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

25

from typing import Dict

26

from typing import List

27

from typing import Optional

28

from typing import Tuple

29

from typing import Union

30

from uuid import UUID

Diego Russo

ea6111a

2020-04-14 18:41:58 +0100

[diff] [blame]

import numpy as np

from . import numeric_util

Tim Hall

2020-09-09 21:58:15 +0100

[diff] [blame]

35

from .data_type import BaseType

Michael McGeagh

2020-08-06 17:31:02 +0100

[diff] [blame]

36

from .data_type import DataType

Michael McGeagh

2020-12-16 11:33:21 +0000

[diff] [blame]

37

from .errors import UnsupportedFeatureError

38

from .errors import VelaError

Dwight Lidman

a9390f7

2020-05-13 12:00:08 +0200

[diff] [blame]

39

from .ethos_u55_regs.ethos_u55_regs import resampling_mode

Patrik Gustavsson

2020-12-01 16:02:29 +0100

[diff] [blame]

40

from .numeric_util import full_shape

Louis Verhaard

aee5d75

2020-09-30 09:01:52 +0200

[diff] [blame]

41

from .operation import Op

Michael McGeagh

2020-08-06 17:31:02 +0100

[diff] [blame]

42

from .operation import Operation

patrik.gustavsson

eeb8515

2020-12-21 17:10:40 +0000

[diff] [blame]

43

from .shape4d import Shape4D

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

44

45

# Alias used to annotate tensor shapes; the shape helpers in this file iterate
# it as a sequence of dimension sizes in which an entry may be None.
Shape = List

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

46

47

Patrik Gustavsson

2020-05-27 09:15:11 +0200

[diff] [blame]

48

class MemType(enum.IntFlag):
    """Memory type of a tensor.

    ``Size`` equals the number of members that precede it.
    """

    Unknown = 0
    Permanent_NPU = 1
    Permanent_CPU = 2
    Scratch = 3
    Scratch_fast = 4
    Size = Scratch_fast + 1

    def display_name(self) -> str:
        """Return the display label of this member, looked up by its value."""
        labels = ("Unknown", "Permanent_NPU", "Permanent_CPU", "Scratch", "Scratch_fast", "Size")
        return labels[self.value]

    def identifier_name(self) -> str:
        """Return the lower-case identifier of this member, looked up by its value."""
        identifiers = ("unknown", "permanent_npu", "permanent_cpu", "scratch", "scratch_fast", "size")
        return identifiers[self.value]

    @staticmethod
    def all():
        """Return all members except ``Unknown`` and ``Size``."""
        return (
            MemType.Permanent_NPU,
            MemType.Permanent_CPU,
            MemType.Scratch,
            MemType.Scratch_fast,
        )

    def __str__(self):
        return self.name

Diqing Zhong

2020-12-11 13:07:37 +0100

[diff] [blame]

70

class BandwidthDirection(enum.IntEnum):
    """Direction of a memory transfer.

    ``Size`` equals the number of members that precede it.
    """

    Read = 0
    Write = auto()
    Size = auto()

    def display_name(self):
        """Return the member name unchanged."""
        return self.name

    def identifier_name(self):
        """Return the member name in lower case."""
        member_name = self.name
        return member_name.lower()

    @staticmethod
    def all():
        """Return all members except ``Size``."""
        return (BandwidthDirection.Read, BandwidthDirection.Write)

84

85

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

86

class MemArea(enum.IntFlag):
    """Memory area a tensor is placed in.

    ``Size`` equals the number of members that precede it.
    """

    Unknown = 0
    Sram = 1
    Dram = 2
    OnChipFlash = 3
    OffChipFlash = 4
    Shram = 5  # for LUT
    Size = Shram + 1

    def display_name(self) -> str:
        """Return the display label of this member, looked up by its value."""
        labels = ("Unknown", "SRAM", "DRAM", "On-chip Flash", "Off-chip Flash", "SHRAM", "Size")
        return labels[self.value]

    def identifier_name(self) -> str:
        """Return the lower-case identifier of this member, looked up by its value."""
        identifiers = ("unknown", "sram", "dram", "on_chip_flash", "off_chip_flash", "shram", "size")
        return identifiers[self.value]

    @staticmethod
    def all():
        """Return all members except ``Unknown`` and ``Size``."""
        return (
            MemArea.Sram,
            MemArea.Dram,
            MemArea.OnChipFlash,
            MemArea.OffChipFlash,
            MemArea.Shram,
        )

    def __str__(self):
        return self.name

class TensorPurpose(enum.IntFlag):
    """What a tensor is used for.

    ``Size`` equals the number of members that precede it.
    """

    Unknown = 0
    Weights = 1
    FeatureMap = 2
    Scratch = 3
    ScratchFast = 4
    LUT = 5
    FSBias = 6
    Size = 7

    def display_name(self) -> str:
        """Return the display label of this member, looked up by its value."""
        labels = (
            "Unknown",
            "Weights",
            "FeatureMap",
            "Scratch",
            "ScratchFast",
            "LUT",
            "FastStorageBias",
            "Size",
        )
        return labels[self.value]

    def identifier_name(self) -> str:
        """Return the lower-case identifier of this member, looked up by its value."""
        identifiers = (
            "unknown",
            "weights",
            "feature_map",
            "scratch",
            "scratch_fast",
            "lut",
            "fast_storage_bias",
            "size",
        )
        return identifiers[self.value]

    @staticmethod
    def all():
        """Return the ``Weights``, ``FeatureMap`` and ``FSBias`` members."""
        return (TensorPurpose.Weights, TensorPurpose.FeatureMap, TensorPurpose.FSBias)

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

132

133

134

class TensorSubPurpose(enum.Enum):
    """Buffering scheme applied to a tensor."""

    Standard = 0
    DoubleBuffer = 1
    RollingBufferX = 2
    RollingBufferY = 3
    RollingBufferXY = 4

    def display_name(self) -> str:
        """Return the display label of this member, looked up by its value."""
        labels = ("Standard", "Double Buffer", "Rolling Buffer X", "Rolling Buffer Y", "Rolling Buffer XY")
        return labels[self.value]

    def identifier_name(self) -> str:
        """Return the lower-case identifier of this member, looked up by its value."""
        identifiers = ("standard", "double_buffer", "rolling_buffer_x", "rolling_buffer_y", "rolling_buffer_xy")
        return identifiers[self.value]

    @staticmethod
    def all():
        """Return every member, in declaration order."""
        return (
            TensorSubPurpose.Standard,
            TensorSubPurpose.DoubleBuffer,
            TensorSubPurpose.RollingBufferX,
            TensorSubPurpose.RollingBufferY,
            TensorSubPurpose.RollingBufferXY,
        )

class TensorFormat(enum.Flag):
    """Storage format of a tensor; ``str()`` of a member gives its name."""

    Unknown = 0
    WeightsCompressed = 1
    NHWC = 2
    NHCWB16 = 3

    def __str__(self):
        member_name = self.name
        return member_name

class TensorBlockTraversal(enum.Enum):
    """Block traversal order assigned to a tensor (``Tensor.block_traversal``)."""

    Default = 0
    DepthWise = 1
    DepthFirst = 2
    PartKernelFirst = 3

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

175

def shape_num_elements(shp: Shape) -> Optional[int]:
    """Return the product of all dimensions of ``shp``.

    Returns None when ``shp`` itself is None or when any of its dimensions is
    None. An empty shape gives 1.
    """
    if shp is None:
        return None

    total = 1
    for dim in shp:
        if dim is None:
            # an unknown dimension makes the element count unknown
            return None
        total *= dim
    return total

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

186

def shape_fully_defined(shp: Shape) -> bool:
    """Return True when ``shp`` is not None and none of its dimensions is None."""
    return shp is not None and all(dim is not None for dim in shp)

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

195

def shape_round_to_quantum(shp: Shape, quantum: Tuple) -> Shape:
    """Return a new list in which each known dimension of ``shp`` is rounded up.

    Dimension and quantum are paired by counting from the last entry
    backwards, so ``quantum`` may hold more entries than ``shp``. Dimensions
    that are None are left as None. ``shp`` itself is not modified.
    """
    rounded = list(shp)

    # Walk from the last axis towards the first using negative indices, so that
    # the trailing entries of both sequences line up.
    for back in range(1, len(shp) + 1):
        dim = rounded[-back]
        if dim is not None:
            rounded[-back] = numeric_util.round_up(dim, quantum[-back])
    return rounded

Louis Verhaard

2020-09-23 10:27:11 +0200

[diff] [blame]

205

@lru_cache(maxsize=None)
def create_equivalence_id(key) -> UUID:
    """Return a random UUID for ``key``.

    The result is memoised without a size limit, so calling again with an equal
    key returns the UUID that was generated the first time.
    """
    # ``key`` is only used by the cache; the id itself is random.
    fresh_id = uuid.uuid4()
    return fresh_id

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

211

class QuantizationParameters:
    """Quantization parameters of a tensor.

    ``scale_f32``, ``zero_point``, ``min`` and ``max`` may each be a scalar or
    a numpy array; an attribute holding more than one value makes the
    parameters "per axis" (see ``is_per_axis``).
    """

    __slots__ = (
        "min",
        "max",
        "num_bits",
        "narrow_range",
        "scale_f32",
        "zero_point",
        "quant_min",
        "quant_max",
        "quant_dim",
    )

    def __init__(
        self,
        min: Union[float, np.ndarray, None] = None,
        max: Union[float, np.ndarray, None] = None,
        num_bits=None,
        narrow_range=None,
    ):
        """Store the given values; all remaining attributes start as None."""
        self.min = min
        self.max = max

        self.num_bits = num_bits
        self.narrow_range = narrow_range

        self.scale_f32: Union[float, np.ndarray, None] = None
        self.zero_point: Union[int, np.ndarray, None] = None
        self.quant_min: Optional[float] = None
        self.quant_max: Optional[float] = None
        self.quant_dim: Optional[int] = None

    def __str__(self):
        return "<nng.QuantizationParameters min=%s max=%s, num_bits=%s, scale=%s, zero_point=%s>" % (
            self.min,
            self.max,
            self.num_bits,
            self.scale_f32,
            self.zero_point,
        )

    __repr__ = __str__

    def clone(self) -> "QuantizationParameters":
        """Return a new object whose attributes refer to the same values as this one.

        The copy is shallow: array-valued attributes are shared, not duplicated.
        """
        res = QuantizationParameters()
        # Every slot is copied, so a slot added later cannot be forgotten here.
        for attr in QuantizationParameters.__slots__:
            setattr(res, attr, getattr(self, attr))
        return res

    def dequantize(self, values) -> np.ndarray:
        """Return ``(values - zero_point) * scale_f32``."""
        return np.subtract(values, self.zero_point) * self.scale_f32

    @staticmethod
    def _values_equal(a, b) -> bool:
        """Return True when ``a`` and ``b`` hold equal values.

        Both may be None, scalars or numpy arrays. Arrays are compared element
        by element (with broadcasting); shapes that cannot be broadcast against
        each other compare as not equal.
        """
        if a is None or b is None:
            return a is b
        try:
            return bool(np.all(np.equal(a, b)))
        except ValueError:
            # np.equal raises when the two shapes cannot be broadcast together
            return False

    def is_scaling_equal(self, other: Optional["QuantizationParameters"]) -> bool:
        """Return True when ``other`` has the same scale and zero point.

        quantisation parameter scaling is not equal if 'other' is None because
        it implies that the tensor it belongs to is not quantised. otherwise,
        it depends upon whether the scale and zero point are equal
        """
        if not isinstance(other, QuantizationParameters):
            return False

        # A plain ``a == b and c == d`` fails for per-axis (array) values because
        # the truth value of a multi-element array is ambiguous.
        return self._values_equal(self.scale_f32, other.scale_f32) and self._values_equal(
            self.zero_point, other.zero_point
        )

    def is_valid(self) -> bool:
        """Return True when both a scale and a zero point are set."""
        # quantisation parameters are considered valid if they have a scale and zero point
        return self.scale_f32 is not None and self.zero_point is not None

    def is_per_axis(self) -> bool:
        """Returns True if either the scale, zero point, minimum or maximum values have more than one value"""
        return any(np.size(getattr(self, attr)) > 1 for attr in ("scale_f32", "zero_point", "min", "max"))

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

294

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

295

def create_const_tensor(
    name: str,
    shape: Shape,
    dtype: DataType,
    values: np.ndarray,
    value_dtype: np.dtype = None,
    purpose: TensorPurpose = TensorPurpose.Unknown,
    quantization: QuantizationParameters = None,
):
    """Create a tensor holding constant ``values`` together with its Const operation.

    The tensor is named ``name + "_0"`` and the operation ``name``. ``values``
    is converted with ``np.array(values, dtype=value_dtype)``. The new tensor
    is returned; it is registered as the output tensor of the operation.
    """
    # Tensor
    tens = Tensor(shape, dtype, name + "_0")
    tens.purpose = purpose
    tens.quantization = quantization
    tens.values = np.array(values, dtype=value_dtype)

    # Operator
    producer = Operation(Op.Const, name)
    producer.set_output_tensor(tens)
    producer.set_ifm_ofm_shapes()
    return tens

Jacob Bohlin

2020-09-11 10:04:15 +0200

[diff] [blame]

316

# class that keeps track of all tensor addresses in the different memory types
class TensorAddressMap:
    """Class-level registry of tensor addresses.

    Addresses are stored per tensor id (``Tensor.equivalence_id`` is what the
    ``Tensor.address`` property passes in) and per memory type.
    """

    address_map: Dict = defaultdict(dict)  # dict (tens.equivalence_id -> dict (mem_type -> address))

    @classmethod
    def get_address_for_tens(cls, tens_id: UUID, mem_type: "MemType") -> Optional[int]:
        """Return the address stored for ``tens_id`` in ``mem_type``, or None if there is none.

        Looking up an unknown tensor id does not add an entry to the map.
        """
        # .get() instead of indexing: indexing a defaultdict inserts an empty
        # entry for every id that is merely queried.
        per_mem_type = cls.address_map.get(tens_id)
        if per_mem_type is None:
            return None
        return per_mem_type.get(mem_type)

    @classmethod
    def set_address_for_tens(cls, tens_id: UUID, mem_type: "MemType", address: int):
        """Store ``address`` for ``tens_id`` in ``mem_type``.

        When both the stored and the new address are not None they must be
        equal; this is checked with an assert.
        """
        per_mem_type = cls.address_map[tens_id]

        # Check previous address if there is one
        previous_address = per_mem_type.get(mem_type)
        if address is not None and previous_address is not None:
            assert previous_address == address, "Two different addresses cannot be assigned to the same tensor."

        # Set tensor's address for memory type
        per_mem_type[mem_type] = address

333

334

Louis Verhaard

6c74c3b

2020-12-17 13:54:09 +0100

[diff] [blame]

335

@total_ordering

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

class Tensor:

__slots__ = (

"shape",

"storage_shape",

"bandwidth_shape",

"dtype",

"name",

Fredrik Svedberg

8d0f489

2021-02-16 21:59:50 +0100

[diff] [blame]

343

"is_variable",

Tim Hall

2021-05-27 18:49:40 +0100

[diff] [blame]

344

"pre_buffer",

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

345

"ops",

346

"consumer_list",

347

"values",

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

348

"compressed_values",

Tim Hall

f7e810a

2020-06-25 15:04:31 +0100

[diff] [blame]

349

"compressed_values_substream_offsets",

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

350

"mem_area",

Patrik Gustavsson

2020-05-27 09:15:11 +0200

[diff] [blame]

351

"mem_type",

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

"format",

"purpose",

"sub_purpose",

"alignment",

"weight_transpose_depthwise",

357

"storage_compression_scale",

358

"bandwidth_compression_scale",

359

"compression_scale_for_worst_weight_stream",

360

"weight_compression_scales",

361

"weight_compression_config",

Louis Verhaard

2020-09-23 10:27:11 +0200

[diff] [blame]

362

"value_id",

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

363

"storage_rounding_quantum",

364

"brick_size",

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

365

"quantization",

366

"weight_compressed_offsets",

367

"element_size_bytes",

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

368

"block_traversal",

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

369

"equivalence_id",

Dwight Lidman

a9390f7

2020-05-13 12:00:08 +0200

[diff] [blame]

370

"resampling_mode",

Tim Hall

2021-05-27 18:49:40 +0100

[diff] [blame]

371

"src_tensor",

Patrik Gustavsson

ee99bb1

2021-04-08 09:04:00 +0200

[diff] [blame]

372

"needs_linear_format",

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

373

)

374

AllocationQuantum = 16

375

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

376

def __init__(self, shape: Shape, dtype: DataType, name: str):
    """Create a tensor with the given shape, data type and name.

    ``storage_shape`` and ``bandwidth_shape`` start out as the very same object
    as ``shape``. Every other attribute gets a default value; ``equivalence_id``
    and ``value_id`` each get a fresh random UUID.
    """
    # Identity and shapes
    self.shape = self.storage_shape = self.bandwidth_shape = shape
    self.dtype = dtype
    self.name = name
    self.is_variable = self.pre_buffer = False
    self.equivalence_id: UUID = uuid.uuid4()

    # Producing and consuming operators
    self.ops: List[Operation] = []
    self.consumer_list: List[Operation] = []

    # Values
    self.values: Optional[np.ndarray] = None  # elements are of type self.dtype
    self.compressed_values: Optional[np.ndarray] = None
    self.compressed_values_substream_offsets: Optional[List] = None

    # Placement and classification
    self.mem_area: MemArea = MemArea.Unknown
    self.mem_type: MemType = MemType.Unknown
    self.format: TensorFormat = TensorFormat.Unknown
    self.purpose: TensorPurpose = TensorPurpose.Unknown
    self.sub_purpose: TensorSubPurpose = TensorSubPurpose.Standard
    self.alignment: int = Tensor.AllocationQuantum
    self.weight_transpose_depthwise: bool = False

    # Compression
    self.storage_compression_scale: float = 1.0
    self.bandwidth_compression_scale: float = 1.0
    self.compression_scale_for_worst_weight_stream: float = 1.0
    self.weight_compression_scales: Optional[np.ndarray] = None
    # if two tensors have the same weight_compression_config, then they have the same compressed values
    self.weight_compression_config = None
    # if two tensors have the same value_id, then they have the same values
    self.value_id: UUID = uuid.uuid4()
    self.weight_compressed_offsets: List = []
    self.storage_rounding_quantum: Tuple = (1, 1, 1, 1)
    self.brick_size: Tuple = (1, 1, 1, 1)
    self.element_size_bytes: int = 0

    # quantization parameters
    self.quantization: Optional[QuantizationParameters] = None
    self.block_traversal: TensorBlockTraversal = TensorBlockTraversal.Default
    self.resampling_mode: resampling_mode = resampling_mode.NONE

    self.needs_linear_format = True

    # Reference to parent-tensor if this tensor is a clone
    self.src_tensor = None

422

Jacob Bohlin

2020-09-11 10:04:15 +0200

[diff] [blame]

423

@property
def address(self) -> int:
    """Address registered in ``TensorAddressMap`` for this tensor's ``equivalence_id`` and ``mem_type``."""
    tens_id = self.equivalence_id
    return TensorAddressMap.get_address_for_tens(tens_id, self.mem_type)

@address.setter
def address(self, address: int):
    """Register ``address`` in ``TensorAddressMap`` for this tensor's ``equivalence_id`` and ``mem_type``."""
    tens_id = self.equivalence_id
    TensorAddressMap.set_address_for_tens(tens_id, self.mem_type, address)

430

Patrik Gustavsson

2021-01-21 08:28:55 +0100

[diff] [blame]

431

@property
def is_standard_fm(self) -> bool:
    """True when the sub purpose is ``Standard`` and the purpose is ``FeatureMap``."""
    if self.sub_purpose != TensorSubPurpose.Standard:
        return False
    return self.purpose == TensorPurpose.FeatureMap

434

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

435

def element_size(self) -> int:
    """Return the size of one element in bytes.

    A non-zero ``element_size_bytes`` is returned as is; otherwise the size is
    the bit size of ``dtype`` floor-divided by 8.
    """
    explicit_size = self.element_size_bytes
    if explicit_size != 0:
        return explicit_size
    return self.dtype.size_in_bits() // 8

439

Patrik Gustavsson

2020-11-04 12:43:50 +0100

[diff] [blame]

440

def clone(self, suffix="_clone", set_unique: bool = False) -> "Tensor":
    """Return a copy of this tensor, renamed to ``self.name + suffix``.

    The copy is made with ``copy.copy``. On top of that ``storage_shape`` and
    ``bandwidth_shape`` become new lists and ``quantization`` is cloned, so
    those can be changed on the copy without affecting the original. All other
    attributes still refer to the same objects as the original.

    The references to Operators (``ops`` and ``consumer_list``) are empty on
    the returned tensor.

    For ``set_unique == True`` a new ``equivalence_id`` is set; otherwise the
    copy keeps the ``equivalence_id`` of the original.
    """
    res = copy.copy(self)
    if set_unique:
        res.equivalence_id = uuid.uuid4()

    # The shapes are None for a tensor that was created without a shape;
    # list(None) would raise TypeError, so None is simply carried over.
    if self.storage_shape is not None:
        res.storage_shape = list(self.storage_shape)
    if self.bandwidth_shape is not None:
        res.bandwidth_shape = list(self.bandwidth_shape)
    if self.quantization is not None:
        res.quantization = self.quantization.clone()

    res.name = res.name + suffix
    res.ops = []
    res.consumer_list = []

    return res

458

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

459

def clone_into_fast_storage(self, arch) -> "Tensor":
    """Return a clone of this tensor that is placed in fast storage.

    The clone is named with the suffix ``_fast_storage``, gets
    ``arch.fast_storage_mem_area`` as memory area and ``MemType.Scratch_fast``
    as memory type, and refers back to this tensor through ``src_tensor``.
    """
    fast_tens = self.clone(suffix="_fast_storage")
    fast_tens.mem_area = arch.fast_storage_mem_area
    fast_tens.mem_type = MemType.Scratch_fast
    fast_tens.src_tensor = self
    return fast_tens

465

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

466

def copy_compressed_weight_info(self, src_tens: "Tensor"):
    """Copy the compressed values and all related weight compression info from ``src_tens``.

    The attributes are assigned by reference, and ``equivalence_id`` and
    ``value_id`` are taken over from ``src_tens`` as well.
    """
    copied_attrs = (
        "equivalence_id",
        "compressed_values",
        "compressed_values_substream_offsets",
        "storage_shape",
        "brick_size",
        "weight_compression_scales",
        "weight_compressed_offsets",
        "weight_transpose_depthwise",
        "compression_scale_for_worst_weight_stream",
        "storage_compression_scale",
        "bandwidth_compression_scale",
        "block_traversal",
        "weight_compression_config",
        "value_id",
    )
    for attr in copied_attrs:
        setattr(self, attr, getattr(src_tens, attr))

Louis Verhaard

2020-05-07 08:12:58 +0200

[diff] [blame]

482

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

483

def set_format(self, fmt: TensorFormat, arch):
    """Set the tensor format and derive the format-dependent attributes from ``arch``.

    Nothing but ``format`` is changed for a shape with more than 4 dimensions.
    Otherwise ``storage_rounding_quantum`` and ``brick_size`` are looked up in
    ``arch`` for the new format and cut down to the trailing entries that match
    the number of dimensions. When the shape is not None, ``bandwidth_shape``
    and ``storage_shape`` are recomputed by rounding the shape up, and for
    ``WeightsCompressed`` the three compression scales are set to 5/8.
    """
    self.format = fmt

    try:
        rank = len(self.shape)
    except TypeError:
        # the shape has no length, e.g. it is None
        rank = 0

    if rank > 4:
        return

    assert not self.needs_linear_format or fmt != TensorFormat.NHCWB16

    # Keep only the trailing `rank` entries (a rank of 0 keeps all of them).
    format_quantum = arch.storage_rounding_quantums[self.format]
    self.storage_rounding_quantum = tuple(format_quantum[-rank:])
    format_brick = arch.brick_sizes[self.format]
    self.brick_size = tuple(format_brick[-rank:])

    if self.shape is None:
        return

    self.bandwidth_shape = shape_round_to_quantum(self.shape, self.brick_size)
    self.storage_shape = shape_round_to_quantum(self.shape, self.storage_rounding_quantum)

    if fmt == TensorFormat.WeightsCompressed:
        ratio = 5 / 8
        self.storage_compression_scale = ratio
        self.bandwidth_compression_scale = ratio
        self.compression_scale_for_worst_weight_stream = ratio

509

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

510

def storage_elements(self) -> int:
    """Return the number of elements in ``storage_shape``, or 0 when that number is unknown."""
    count = shape_num_elements(self.storage_shape)
    return 0 if count is None else count

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

516

def elements(self) -> int:
    """Return the number of elements in ``shape``, or 0 when that number is unknown."""
    count = shape_num_elements(self.shape)
    return 0 if count is None else count

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

522

def has_fully_defined_shape(self) -> bool:
    """Return True when ``shape`` is not None and contains no None dimension."""
    fully_defined = shape_fully_defined(self.shape)
    return fully_defined

524

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

525

def storage_size(self, scale: float = 1.0) -> int:
    """Return the storage size in bytes, rounded up to a multiple of ``alignment``.

    The unrounded size is storage elements x element size x ``scale``; a size
    of 0 is replaced by 1 before rounding.
    """
    unrounded = self.storage_elements() * self.element_size() * scale
    if unrounded == 0:
        unrounded = 1  # force it to take up space
    whole_bytes = numeric_util.round_up_to_int(unrounded)
    return numeric_util.round_up(whole_bytes, self.alignment)

531

Patrik Gustavsson

2021-01-21 08:28:55 +0100

[diff] [blame]

532

def storage_size_for_shape(self, op_storage_shape: Shape) -> int:
    """Return the size in bytes of ``op_storage_shape``, rounded up to a multiple of ``alignment``.

    An unknown element count is treated as 0, and a size of 0 is replaced by 1
    before rounding.
    """
    count = shape_num_elements(op_storage_shape) or 0
    unrounded = count * self.element_size()
    if unrounded == 0:
        unrounded = 1  # force it to take up space
    whole_bytes = numeric_util.round_up_to_int(unrounded)
    return numeric_util.round_up(whole_bytes, self.alignment)

540

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

541

def storage_shape_for_sub_purpose(
    self, sub_purpose: TensorSubPurpose, param_a: Optional[int], param_b: Optional[int]
) -> Shape:
    """Return the storage shape this tensor would have for ``sub_purpose``.

    DoubleBuffer starts from a copy of ``shape`` and limits the last dimension
    to ``2 * param_a``. All other sub purposes start from ``storage_shape``
    extended to 4 dimensions: the rolling buffers set dimension 0 to 1 and
    limit dimension 2 (X) and/or dimension 1 (Y), Standard changes nothing.
    RollingBufferX and RollingBufferY take their limit from ``param_a``;
    RollingBufferXY limits dimension 2 by ``param_a`` and dimension 1 by
    ``param_b``. The tensor itself is not modified.
    """
    if sub_purpose == TensorSubPurpose.DoubleBuffer:
        buffered = list(self.shape)
        assert len(buffered) >= 2
        assert param_a is not None
        buffered[-1] = min(buffered[-1], param_a * 2)
        return buffered

    shape4 = full_shape(4, self.storage_shape, 1)

    if sub_purpose == TensorSubPurpose.RollingBufferX:
        assert len(shape4) == 4
        assert param_a is not None
        shape4[0] = 1
        shape4[2] = min(shape4[2], param_a)
        return shape4

    if sub_purpose == TensorSubPurpose.RollingBufferY:
        assert len(shape4) == 4
        assert param_a is not None
        shape4[0] = 1
        shape4[1] = min(shape4[1], param_a)
        return shape4

    if sub_purpose == TensorSubPurpose.RollingBufferXY:
        assert len(shape4) == 4
        assert param_a is not None
        assert param_b is not None
        shape4[0] = 1
        shape4[2] = min(shape4[2], param_a)
        shape4[1] = min(shape4[1], param_b)
        return shape4

    if sub_purpose != TensorSubPurpose.Standard:
        assert 0, "did not expect new sub purpose %s" % (sub_purpose,)

    return shape4

574

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

575

def set_new_sub_purpose(self, sub_purpose: TensorSubPurpose, param_a=None, param_b=None):
    """
    Switch this tensor to ``sub_purpose`` and update its storage shape to match.

    :param sub_purpose: the new TensorSubPurpose
    :param param_a: forwarded unchanged to storage_shape_for_sub_purpose
    :param param_b: forwarded unchanged to storage_shape_for_sub_purpose
    """
    # Compute the new shape first so nothing is modified if the computation fails
    new_storage_shape = self.storage_shape_for_sub_purpose(sub_purpose, param_a, param_b)
    self.storage_shape = new_storage_shape
    self.sub_purpose = sub_purpose

    if sub_purpose != TensorSubPurpose.DoubleBuffer:
        return
    # Double buffered tensors take the compression scale of the worst weight stream
    self.storage_compression_scale = self.compression_scale_for_worst_weight_stream

580

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

581

def bandwidth(self) -> float:
    """
    Return the element count of bandwidth_shape multiplied by the element size
    and by bandwidth_compression_scale.

    Returns 0 when shape_num_elements() reports None for the bandwidth shape.
    """
    num_elements = shape_num_elements(self.bandwidth_shape)
    if num_elements is not None:
        bytes_per_element = self.element_size()
        return num_elements * bytes_per_element * self.bandwidth_compression_scale
    return 0

586

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

587

def consumers(self) -> List[Operation]:
    """Return the tensor's consumer_list (the list object itself, not a copy)."""
    consuming_ops = self.consumer_list
    return consuming_ops

589

Patrik Gustavsson

2021-01-21 08:28:55 +0100

[diff] [blame]

590

def get_4D_storage_shape_for_shape(self, op_shape4D: Shape4D) -> Shape4D:
    """
    Return ``op_shape4D`` passed through shape_round_to_quantum() using this
    tensor's storage_rounding_quantum, wrapped in a new Shape4D.

    :param op_shape4D: the operator shape to convert (must provide as_list())
    """
    # The quantum is copied into a list and expanded with full_shape(4, ..., 1)
    quantum_4d = full_shape(4, list(self.storage_rounding_quantum), 1)
    rounded = shape_round_to_quantum(op_shape4D.as_list(), quantum_4d)
    return Shape4D(rounded)

593

594

def addresses_for_rolling_buffer(self, start_coord: Shape, end_coord: Shape, op_shape4D: Shape4D) -> Tuple:
    """
    Compute the box sizes and corner addresses for the region start_coord..end_coord.

    :param start_coord: start coordinate; indices 1 and 2 are used as y and x
    :param end_coord: end coordinate; indices 1 and 2 are used as y and x
    :param op_shape4D: operator shape, forwarded to the address calculations
    :return: ( box_height0, box_height0, box_width,
               [address_tl, address_tr, address_bl, address_br] )
             Note that the first box height is returned in both height slots.
    :raises UnsupportedFeatureError: when the region extends past the x crossing point
    """
    if self.storage_shape == []:
        # Empty storage shape: a single address and unit sized boxes
        only_address = self.address_for_coordinate(start_coord, op_shape4D=op_shape4D)
        return (1, 1, 1, [only_address, None, None, None])

    if self.is_standard_fm:
        storage_shape_4D = self.get_4D_storage_shape_for_shape(op_shape4D)
    else:
        storage_shape_4D = Shape4D(self.storage_shape)

    # Next multiple of the storage height/width after the start position ...
    wrap_y = numeric_util.round_up(start_coord[1] + 1, storage_shape_4D.height)
    wrap_x = numeric_util.round_up(start_coord[2] + 1, storage_shape_4D.width)

    # ... but never beyond the end of the requested region
    wrap_y = min(wrap_y, end_coord[1])
    wrap_x = min(wrap_x, end_coord[2])

    box_height0 = wrap_y - start_coord[1]
    box_width = wrap_x - start_coord[2]

    top_left = self.address_for_coordinate(start_coord, op_shape4D=op_shape4D)
    addresses: List = [top_left, None, None, None]

    crosses_x = end_coord[2] > wrap_x
    if crosses_x:
        # The top right address is still computed before the error is raised
        addresses[1] = self.address_for_coordinate(
            [start_coord[0], start_coord[1], wrap_x, start_coord[3]], op_shape4D=op_shape4D
        )
        raise UnsupportedFeatureError("Striping in vertical direction is not supported")

    if end_coord[1] > wrap_y:
        addresses[2] = self.address_for_coordinate(
            [start_coord[0], wrap_y, start_coord[2], start_coord[3]], op_shape4D=op_shape4D
        )

    # NOTE(review): this looks unreachable because the x crossing case raises above - confirm
    if end_coord[1] > wrap_y and end_coord[2] > wrap_x:
        addresses[3] = self.address_for_coordinate(
            [start_coord[0], wrap_y, wrap_x, start_coord[3]], op_shape4D=op_shape4D
        )

    return box_height0, box_height0, box_width, addresses

637

Patrik Gustavsson

2021-01-21 08:28:55 +0100

[diff] [blame]

638

def address_for_coordinate(self, coord: Shape, is_top_box: bool = False, op_shape4D: Shape4D = None) -> int:
    """
    Return self.address plus the offset of ``coord`` within this tensor.

    :param coord: coordinate to look up
    :param is_top_box: forwarded to address_offset_for_coordinate
    :param op_shape4D: forwarded to address_offset_for_coordinate
    """
    relative_offset = self.address_offset_for_coordinate(coord, op_shape4D=op_shape4D, is_top_box=is_top_box)
    # A None offset means the offset could not be computed; that is not accepted here
    assert relative_offset is not None
    base_address = self.address
    return base_address + relative_offset

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

642

Patrik Gustavsson

2021-01-21 08:28:55 +0100

[diff] [blame]

643

def get_strides_and_coord(
    self, coord: Optional[Shape] = None, shape4D: Optional[Shape4D] = None
) -> Tuple[Optional[Shape], Optional[Shape]]:
    """
    Compute the strides of this tensor and ``coord`` re-ordered to match them.

    :param coord: coordinate to convert; defaults to all zeros
    :param shape4D: optional shape; when given and is_standard_fm is set, the
                    storage shape is derived from it instead of self.storage_shape
    :return: (strides, augmented_coord), both five entries long for the NHWC and
             NHCWB16 formats, or (None, None) for any other format
    """
    if coord is None:
        coord = [0] * min(len(self.storage_shape), 4)

    if shape4D and self.is_standard_fm:
        shape_4d = self.get_4D_storage_shape_for_shape(shape4D).as_list()
    else:
        shape_4d = full_shape(4, self.storage_shape, 1)

    # Left-pad the coordinate with zeros until it has (at least) four entries
    missing_dims = 4 - len(coord)
    coord_4d = [0] * missing_dims + coord if missing_dims > 0 else coord

    assert len(coord_4d) == len(shape_4d)

    tensor_format = self.format
    if tensor_format == TensorFormat.NHWC:
        # Re-order to entries 0, 3, 1, 2 and append a trailing unit axis
        layout_shape = [shape_4d[0], shape_4d[3]] + shape_4d[1:3] + [1]
        layout_coord = [coord_4d[0], coord_4d[3]] + coord_4d[1:3] + [0]
    elif tensor_format == TensorFormat.NHCWB16:
        channel_divisor = 16
        layout_shape = shape_4d[0:4] + [1]
        # Entry 3 is split into a group index and a position within the group of 16
        group_index, position_in_group = divmod(coord_4d[3], channel_divisor)
        layout_coord = [coord_4d[0], group_index] + coord_4d[1:3] + [position_in_group]

        if layout_shape[1] == 0:
            layout_shape[1] = 1
    else:
        assert tensor_format in (TensorFormat.Unknown, TensorFormat.WeightsCompressed)
        return None, None

    strides: List = [0] * len(layout_shape)
    stride = self.element_size() * self.storage_compression_scale

    if tensor_format != TensorFormat.NHCWB16:
        # Accumulate strides from the fastest to the slowest changing axis
        for axis in (4, 1, 3, 2, 0):
            strides[axis] = stride
            stride *= layout_shape[axis]
    else:
        assert len(strides) == 5
        stride_x = 16 * stride
        stride_c = stride_x * layout_shape[2]
        stride_y = layout_shape[2] * layout_shape[3] * stride
        stride_n = stride_y * layout_shape[1]
        strides = [stride_n, stride_c, stride_y, stride_x, stride]

    return strides, layout_coord

698

Patrik Gustavsson

2021-01-21 08:28:55 +0100

[diff] [blame]

699

def get_strides(self, shape4D: Optional[Shape4D] = None) -> Shape:
    """
    Return only the strides part of get_strides_and_coord(shape4D=shape4D).

    Asserts that strides are available (i.e. not None).
    """
    tensor_strides, _unused_coord = self.get_strides_and_coord(shape4D=shape4D)
    assert tensor_strides is not None
    return tensor_strides

703

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

704

def find_npu_op(self) -> Optional[Operation]:
    """Return the first consumer whose run_on_npu flag is set, or None if there is none."""
    npu_consumers = (op for op in self.consumers() if op.run_on_npu)
    return next(npu_consumers, None)

Louis Verhaard

2020-06-04 15:51:24 +0200

[diff] [blame]

710

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

711

def compressed_stream_index_from_coord(self, coord: Shape) -> int:
    """
    Return the index of the compressed weight stream for the last entry of ``coord``.

    :param coord: coordinate; only coord[-1] is used
    :raises UnsupportedFeatureError: if the position is not a multiple of the
            brick depth, for any index before the final offsets entry
    """
    assert self.format == TensorFormat.WeightsCompressed
    streams = self.compressed_values
    assert streams is not None
    assert len(streams) > 0
    offsets = self.weight_compressed_offsets
    assert len(streams) + 1 == len(offsets)

    brick_depth = self.brick_size[-1]
    # Positions beyond the last shape entry are clamped to it
    depth = min(coord[-1], self.shape[-1])

    # Always round up to the next brick boundary
    stream_index = numeric_util.round_up_divide(depth, brick_depth)

    # The last weight set may be shorter than a brick, so alignment is only
    # enforced for the indices before it; there are no half-way points
    needs_alignment_check = stream_index < len(offsets) - 1
    if needs_alignment_check and (depth % brick_depth) != 0:
        raise UnsupportedFeatureError("Offset into weights must be aligned to a brick")

    return stream_index

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

735

def size_of_compressed_stream(self, index: int) -> int:
    """
    Return the length of the compressed stream stored at ``index``.

    :param index: position in compressed_values; asserted to be within range
    """
    streams = self.compressed_values
    assert streams is not None
    stream_count = len(streams)
    assert index >= 0 and index < stream_count
    return len(streams[index])

739

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

740

def is_last_index_in_compressed_stream(self, index: int) -> bool:
    """
    Tell whether ``index`` refers to the final entry of compressed_values.

    :param index: position in compressed_values; asserted to be within range
    """
    streams = self.compressed_values
    assert streams is not None
    stream_count = len(streams)
    assert index >= 0 and index < stream_count
    final_index = stream_count - 1
    return index == final_index

744

Patrik Gustavsson

2021-01-21 08:28:55 +0100

[diff] [blame]

745

def address_offset_for_coordinate(
    self, orig_coord: Shape, op_shape4D: Optional[Shape4D] = None, is_top_box: bool = False
) -> Optional[int]:
    """
    Compute the offset of ``orig_coord`` relative to the start of this tensor.

    :param orig_coord: coordinate to look up
    :param op_shape4D: optional operator shape; when given and is_standard_fm is
                       set, the storage shape and size are derived from it
    :param is_top_box: treat the coordinate as an inclusive upper bound: one is
                       subtracted from every entry before wrapping and one
                       element stride is added to the result
    :return: the offset, or None when get_strides_and_coord has no strides
    """
    assert self.purpose != TensorPurpose.Weights

    if self.sub_purpose == TensorSubPurpose.Standard:
        # Standard tensors must be addressed within their shape
        bounds = op_shape4D.as_list() if op_shape4D else self.shape
        for axis, position in enumerate(orig_coord):
            if is_top_box:
                assert 0 < position <= bounds[axis]
            else:
                assert 0 <= position < bounds[axis]

    if op_shape4D and self.is_standard_fm:
        storage_shape = self.get_4D_storage_shape_for_shape(op_shape4D).as_list()
        storage_size = self.storage_size_for_shape(storage_shape)
        coord = orig_coord
    else:
        storage_shape = self.storage_shape
        # Keep only as many trailing entries as the storage shape has
        coord = orig_coord[-len(storage_shape) :]
        storage_size = self.storage_size()

    # handle wraparound for partial buffers. the top box adjustment has to be
    # applied before the modulo
    top_box_shift = 1 if is_top_box else 0
    coord = [(c - top_box_shift) % storage_shape[idx] for idx, c in enumerate(coord)]

    strides, augmented_coord = self.get_strides_and_coord(coord, op_shape4D)
    if strides is None:
        return None

    # For the top box, add back one element
    top_box_bias = strides[-1] if is_top_box else 0
    address_offset = top_box_bias + np.dot(augmented_coord, strides)

    assert address_offset >= 0
    assert address_offset <= storage_size
    return address_offset

785

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

786

def is_allocated_in_tensor_arena(self, scratch_tensor_mem_area: MemArea) -> bool:
    """
    Tell whether this tensor is in ``scratch_tensor_mem_area`` and has a
    Scratch or Scratch_fast memory type.
    """
    same_area = self.mem_area == scratch_tensor_mem_area
    if not same_area:
        return same_area
    return self.mem_type in (MemType.Scratch, MemType.Scratch_fast)

Patrik Gustavsson

2020-05-27 09:15:11 +0200

[diff] [blame]

788

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

789

def equivalent(self, tens: "Tensor") -> bool:
    """Return whether this tensor and ``tens`` have equal equivalence_id values."""
    own_id = self.equivalence_id
    other_id = tens.equivalence_id
    return own_id == other_id

791

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

792

def set_all_shapes(self, shape: Shape):
    """
    Set shape, storage_shape and bandwidth_shape to ``shape``.

    All three attributes refer to the same object afterwards; no copy is made.
    """
    self.shape = self.storage_shape = self.bandwidth_shape = shape

796

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

797

def get_full_shape(self) -> Shape:
    """
    Return the tensor shape in expanded form.

    - two entries [a, b] become [a, 1, 1, b]
    - one or three entries are expanded with full_shape(4, shape, 1)
    - any other number of entries gives a copy of the shape
    """
    rank = len(self.shape)
    if rank == 2:
        first, last = self.shape[0], self.shape[1]
        return [first, 1, 1, last]
    if rank in (1, 3):
        return full_shape(4, self.shape, 1)
    return self.shape.copy()

Michael McGeagh

2020-08-06 17:31:02 +0100

[diff] [blame]

805

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

806

def is_quantized(self) -> bool:
    """
    Tell whether this tensor is quantized.

    A tensor is quantized if it has an integral type and it contains valid
    quantization params (a QuantizationParameters object whose is_valid() holds).
    """
    return (
        isinstance(self.quantization, QuantizationParameters)
        and (self.dtype.type & BaseType.Int) != 0
        and self.quantization.is_valid()
    )

Tim Hall

2020-09-09 21:58:15 +0100

[diff] [blame]

813

James Peet

7519d50

2021-07-19 16:47:58 +0100

[diff] [blame]

814

def get_scalar(self):
    """
    Return the single value held by this tensor.

    return: Unquantized or dequantized scalar value
    rtype: self.dtype (if unquantized) or float (if dequantized)
    """
    raw_values = self.values
    assert raw_values.size == 1, "get_scalar called on non-scalar tensor"
    # Quantized tensors are dequantized before the scalar is extracted
    scalar_source = self.quantization.dequantize(raw_values) if self.is_quantized() else raw_values
    return scalar_source.item(0)

824

Louis Verhaard

6c74c3b

2020-12-17 13:54:09 +0100

[diff] [blame]

825

def __lt__(self, other: "Tensor") -> bool:
    """Order tensors by their equivalence_id."""
    own_id = self.equivalence_id
    other_id = other.equivalence_id
    return own_id < other_id

827

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

828

def __str__(self):
    """Return a short description containing the tensor's name, shape and dtype."""
    fields = (self.name, self.shape, self.dtype)
    return "<nng.Tensor '%s' shape=%s dtype=%s>" % fields


# repr() gives the same text as str()
__repr__ = __str__

Tim Hall

2020-09-09 21:58:15 +0100

[diff] [blame]

832

Michael McGeagh

2020-12-16 11:33:21 +0000

[diff] [blame]

833

def error(self, msg):
    """
    Raises a VelaError exception for errors encountered when parsing a Tensor

    The message names the tensor, repeats ``msg`` and lists the operators in
    self.ops and self.consumer_list.

    :param self: Tensor object that resulted in the error
    :param msg: str object that contains a description of the specific error encountered
    """

    def _operator_lines(ops):
        # One line per entry; objects without the expected attributes get placeholders
        described = []
        for idx, op in enumerate(ops):
            op_type, op_id = getattr(op, "type", "Not an Operation"), getattr(op, "op_index", "-")
            described.append(f" {idx} = {op_type} ({op_id})")
        return described

    report = [
        f"Invalid {self.name} tensor. {msg}",
        " Driving operators:",
        *_operator_lines(self.ops),
        " Consuming operators:",
        *_operator_lines(self.consumer_list),
    ]

    raise VelaError("\n".join(report))

858

Tim Hall

2020-09-09 21:58:15 +0100

[diff] [blame]

859

Louis Verhaard

2020-12-08 10:02:31 +0100

[diff] [blame]

860

def check_quantized_tens_scaling_equal(tens_a: Tensor, tens_b: Tensor) -> bool:

Tim Hall

2020-09-09 21:58:15 +0100

[diff] [blame]

861

# checks that the scaling of two quantized tensors are equal

862

Tim Hall