# Copyright (C) 2020-2021 Arm Limited or its affiliates. All rights reserved.
#
# SPDX-License-Identifier: Apache-2.0
#
# Licensed under the Apache License, Version 2.0 (the License); you may
# not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an AS IS BASIS, WITHOUT
# WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
# Description:
# Internal representation of a Neural Network Tensor.
import copy
import enum
import uuid
from collections import defaultdict
from enum import auto
from functools import lru_cache
from functools import total_ordering
from typing import Dict
from typing import List
from typing import Optional
from typing import Tuple
from typing import Union
from uuid import UUID

import numpy as np

from . import numeric_util
from .data_type import BaseType
from .data_type import DataType
from .errors import UnsupportedFeatureError
from .errors import VelaError
from .numeric_util import full_shape
from .operation import Op
from .operation import Operation
from .shape4d import Shape4D

Shape = List


class MemType(enum.IntFlag):
    Unknown = 0
    Permanent_NPU = 1
    Permanent_CPU = 2
    Scratch = 3
    Scratch_fast = 4
    Size = Scratch_fast + 1

    def display_name(self) -> str:
        return ("Unknown", "Permanent_NPU", "Permanent_CPU", "Scratch", "Scratch_fast", "Size")[self.value]

    def identifier_name(self) -> str:
        return ("unknown", "permanent_npu", "permanent_cpu", "scratch", "scratch_fast", "size")[self.value]

    @staticmethod
    def all():
        return (MemType.Permanent_NPU, MemType.Permanent_CPU, MemType.Scratch, MemType.Scratch_fast)

    def __str__(self):
        return self.name


class BandwidthDirection(enum.IntEnum):
    Read = 0
    Write = auto()
    Size = auto()

    def display_name(self):
        return self.name

    def identifier_name(self):
        return self.name.lower()

    @staticmethod
    def all():
        return (BandwidthDirection.Read, BandwidthDirection.Write)


class MemArea(enum.IntFlag):
    Unknown = 0
    Sram = 1
    Dram = 2
    OnChipFlash = 3
    OffChipFlash = 4
    Shram = 5  # for LUT
    Size = Shram + 1

    def display_name(self) -> str:
        return ("Unknown", "SRAM", "DRAM", "On-chip Flash", "Off-chip Flash", "SHRAM", "Size")[self.value]

    def identifier_name(self) -> str:
        return ("unknown", "sram", "dram", "on_chip_flash", "off_chip_flash", "shram", "size")[self.value]

    @staticmethod
    def all():
        return (MemArea.Sram, MemArea.Dram, MemArea.OnChipFlash, MemArea.OffChipFlash, MemArea.Shram)

    def __str__(self):
        return self.name


class TensorPurpose(enum.IntFlag):
    Unknown = 0
    Weights = 1
    FeatureMap = 2
    Scratch = 3
    ScratchFast = 4
    LUT = 5
    FSBias = 6
    Size = 7

    def display_name(self) -> str:
        return ("Unknown", "Weights", "FeatureMap", "Scratch", "ScratchFast", "LUT", "FastStorageBias", "Size")[
            self.value
        ]

    def identifier_name(self) -> str:
        return ("unknown", "weights", "feature_map", "scratch", "scratch_fast", "lut", "fast_storage_bias", "size")[
            self.value
        ]

    @staticmethod
    def all():
        return (TensorPurpose.Weights, TensorPurpose.FeatureMap, TensorPurpose.FSBias)


class TensorSubPurpose(enum.Enum):
    Standard = 0
    DoubleBuffer = 1
    RollingBufferX = 2
    RollingBufferY = 3
    RollingBufferXY = 4

    def display_name(self) -> str:
        return ("Standard", "Double Buffer", "Rolling Buffer X", "Rolling Buffer Y", "Rolling Buffer XY")[self.value]

    def identifier_name(self) -> str:
        return ("standard", "double_buffer", "rolling_buffer_x", "rolling_buffer_y", "rolling_buffer_xy")[self.value]

    @staticmethod
    def all():
        return (
            TensorSubPurpose.Standard,
            TensorSubPurpose.DoubleBuffer,
            TensorSubPurpose.RollingBufferX,
            TensorSubPurpose.RollingBufferY,
            TensorSubPurpose.RollingBufferXY,
        )


class TensorFormat(enum.Flag):
    Unknown = 0
    WeightsCompressed = 1
    NHWC = 2
    NHCWB16 = 3

    def __str__(self):
        return self.name


class TensorBlockTraversal(enum.Enum):
    Default = 0
    DepthWise = 1
    DepthFirst = 2
    PartKernelFirst = 3


def shape_num_elements(shp: Shape) -> Optional[int]:
    elems = 1
    if shp is None:
        return None
    for d in shp:
        if d is None:
            return None
        elems *= d
    return elems
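# e.g. shape_num_elements([1, 8, 8, 16]) -> 1024, while
# shape_num_elements([1, None, 8, 16]) -> None (the shape is not fully defined)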


def shape_fully_defined(shp: Shape) -> bool:
    if shp is None:
        return False
    for d in shp:
        if d is None:
            return False
    return True


def shape_round_to_quantum(shp: Shape, quantum: Tuple) -> Shape:
    new_shp = list(shp)

    # Traverse backwards using length of shape since there may be more rounding quantums than shape elements
    for i in range(-1, -len(shp) - 1, -1):
        if new_shp[i] is not None:
            new_shp[i] = numeric_util.round_up(new_shp[i], quantum[i])
    return new_shp
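# e.g. rounding a shape up to a 16-channel quantum, as used for NHCWB16 bricks:
# shape_round_to_quantum([1, 7, 7, 20], (1, 1, 1, 16)) -> [1, 7, 7, 32]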


@lru_cache(maxsize=None)
def create_equivalence_id(key) -> UUID:
    # Generates a unique equivalence_id for the given key; the lru_cache ensures that
    # repeated calls with the same key return the same id
    return uuid.uuid4()


class QuantizationParameters:
    __slots__ = (
        "min",
        "max",
        "num_bits",
        "narrow_range",
        "scale_f32",
        "zero_point",
        "quant_min",
        "quant_max",
        "quant_dim",
    )

    def __init__(
        self,
        min: Union[float, np.ndarray, None] = None,
        max: Union[float, np.ndarray, None] = None,
        num_bits=None,
        narrow_range=None,
    ):
        self.min = min
        self.max = max

        self.num_bits = num_bits
        self.narrow_range = narrow_range

        self.scale_f32: Union[float, np.ndarray, None] = None
        self.zero_point: Union[int, np.ndarray, None] = None
        self.quant_min: Optional[float] = None
        self.quant_max: Optional[float] = None
        self.quant_dim: Optional[int] = None

    def __str__(self):
        return "<nng.QuantizationParameters min=%s max=%s, num_bits=%s, scale=%s, zero_point=%s>" % (
            self.min,
            self.max,
            self.num_bits,
            self.scale_f32,
            self.zero_point,
        )

    __repr__ = __str__

    def clone(self) -> "QuantizationParameters":
        res = QuantizationParameters()
        res.min = self.min
        res.max = self.max

        res.num_bits = self.num_bits
        res.narrow_range = self.narrow_range

        res.scale_f32 = self.scale_f32
        res.zero_point = self.zero_point
        res.quant_min = self.quant_min
        res.quant_max = self.quant_max
        res.quant_dim = self.quant_dim
        return res

    def dequantize(self, values) -> np.ndarray:
        return np.subtract(values, self.zero_point) * self.scale_f32
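    # e.g. with scale_f32 = 0.5 and zero_point = 128:
    # dequantize(np.array([128, 130])) -> array([0., 1.])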

    def is_scaling_equal(self, other: Optional["QuantizationParameters"]) -> bool:
        """
        Returns True if the scale and zero point of self and other are equal. If other is None then the scaling is
        not considered equal, because the tensor is assumed to be unquantised, and False is returned.
        """

        if not isinstance(other, QuantizationParameters):
            return False

        return self.scale_f32 == other.scale_f32 and self.zero_point == other.zero_point

    def is_valid(self) -> bool:
        """Return True if the quantisation parameters have a scale and zero point"""

        return self.scale_f32 is not None and self.zero_point is not None

    def is_per_axis(self) -> bool:
        """Returns True if any of the scale, zero point, minimum or maximum values have more than one value"""

        for attr in ("scale_f32", "zero_point", "min", "max"):
            if np.size(getattr(self, attr)) > 1:
                return True
        return False
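    # e.g. per-channel quantized weights carry one scale per output channel, so
    # scale_f32 = np.array([0.1, 0.2, 0.4]) makes is_per_axis() return True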


def create_const_tensor(
    name: str,
    shape: Shape,
    dtype: DataType,
    values: np.ndarray,
    value_dtype: np.dtype = None,
    purpose: TensorPurpose = TensorPurpose.Unknown,
    quantization: QuantizationParameters = None,
):
    # Tensor
    const_tensor = Tensor(shape, dtype, name + "_0")
    const_tensor.purpose = purpose
    const_tensor.quantization = quantization
    const_tensor.values = np.array(values, dtype=value_dtype)
    # Operator
    const_op = Operation(Op.Const, name)
    const_op.set_output_tensor(const_tensor)
    const_op.set_ifm_ofm_shapes()
    return const_tensor
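# A minimal usage sketch (illustrative name and values):
#   lut = create_const_tensor("lut", [1, 1, 1, 256], DataType.int8, np.zeros(256))
# which yields a tensor named "lut_0" driven by a single Op.Const operation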


# Class that keeps track of all tensor addresses in the different memory types
class TensorAddressMap:
    address_map: Dict = defaultdict(dict)  # dict (tens.equivalence_id -> dict (mem_type -> address))

    @classmethod
    def get_address_for_tens(cls, tens_id: UUID, mem_type: MemType) -> int:
        return cls.address_map[tens_id].get(mem_type)

    @classmethod
    def set_address_for_tens(cls, tens_id: UUID, mem_type: MemType, address: int):
        # Check previous address if there is one
        previous_address = cls.address_map[tens_id].get(mem_type)
        if address is not None and previous_address is not None:
            assert previous_address == address, "Two different addresses cannot be assigned to the same tensor."

        # Set tensor's address for memory type
        cls.address_map[tens_id][mem_type] = address
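    # Note: keying on equivalence_id means that a tensor and its clones (which share
    # the id unless cloned with set_unique=True) resolve to the same address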


@total_ordering
class Tensor:
    __slots__ = (
        "shape",
        "storage_shape",
        "bandwidth_shape",
        "dtype",
        "name",
        "is_variable",
        "pre_buffer",
        "ops",
        "consumer_list",
        "values",
        "compressed_values",
        "compressed_values_substream_offsets",
        "mem_area",
        "mem_type",
        "format",
        "purpose",
        "sub_purpose",
        "alignment",
        "weight_transpose_depthwise",
        "storage_compression_scale",
        "bandwidth_compression_scale",
        "compression_scale_for_worst_weight_stream",
        "weight_compression_scales",
        "weight_compression_config",
        "value_id",
        "storage_rounding_quantum",
        "brick_size",
        "quantization",
        "weight_compressed_offsets",
        "element_size_bytes",
        "block_traversal",
        "equivalence_id",
        "src_tensor",
        "needs_linear_format",
        "ifm_write_protected",
    )
    AllocationQuantum = 16

    def __init__(self, shape: Shape, dtype: DataType, name: str):
        self.shape = shape
        self.storage_shape = shape
        self.bandwidth_shape = shape
        self.dtype = dtype
        self.name = name
        self.is_variable = False
        self.pre_buffer = False
        self.equivalence_id: UUID = uuid.uuid4()

        self.ops: List[Operation] = []
        self.consumer_list: List[Operation] = []

        self.values: Optional[np.ndarray] = None  # elements are of type self.dtype
        self.compressed_values: Optional[np.ndarray] = None
        self.compressed_values_substream_offsets: Optional[List] = None
        self.mem_area: MemArea = MemArea.Unknown
        self.mem_type: MemType = MemType.Unknown
        self.format: TensorFormat = TensorFormat.Unknown
        self.purpose: TensorPurpose = TensorPurpose.Unknown
        self.sub_purpose: TensorSubPurpose = TensorSubPurpose.Standard
        self.alignment: int = Tensor.AllocationQuantum
        self.weight_transpose_depthwise: bool = False

        self.storage_compression_scale: float = 1.0
        self.bandwidth_compression_scale: float = 1.0
        self.compression_scale_for_worst_weight_stream: float = 1.0
        self.weight_compression_scales: Optional[np.ndarray] = None
        # if two tensors have the same weight_compression_config, then they have the same compressed values
        self.weight_compression_config = None
        # if two tensors have the same value_id, then they have the same values
        self.value_id: UUID = uuid.uuid4()
        self.weight_compressed_offsets: List = []
        self.storage_rounding_quantum: Tuple = (1, 1, 1, 1)
        self.brick_size: Tuple = (1, 1, 1, 1)
        self.element_size_bytes: int = 0

        # quantization parameters
        self.quantization: Optional[QuantizationParameters] = None
        self.block_traversal: TensorBlockTraversal = TensorBlockTraversal.Default

        self.needs_linear_format = True
        self.ifm_write_protected = False

        # Reference to parent-tensor if this tensor is a clone
        self.src_tensor: Optional[Tensor] = None

    @property
    def address(self) -> int:
        return TensorAddressMap.get_address_for_tens(self.equivalence_id, self.mem_type)

    @address.setter
    def address(self, address: int):
        TensorAddressMap.set_address_for_tens(self.equivalence_id, self.mem_type, address)

    @property
    def is_standard_fm(self) -> bool:
        return self.sub_purpose == TensorSubPurpose.Standard and self.purpose == TensorPurpose.FeatureMap

    def element_size(self) -> int:
        if self.element_size_bytes == 0:
            return self.dtype.size_in_bits() // 8
        return self.element_size_bytes

    # Returns a copy, renamed to self.name + suffix. The copy is shallow apart from
    # the storage/bandwidth shapes and the quantization parameters, which are copied.
    # The references to Operators will be empty when returned.
    # For set_unique==True, a new equivalence_id will be set.
    def clone(self, suffix="_clone", set_unique: bool = False) -> "Tensor":
        res = copy.copy(self)
        if set_unique:
            res.equivalence_id = uuid.uuid4()
        res.storage_shape = list(self.storage_shape)
        res.bandwidth_shape = list(self.bandwidth_shape)
        if self.quantization is not None:
            res.quantization = self.quantization.clone()

        res.name = res.name + suffix
        res.ops = []
        res.consumer_list = []

        return res
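    # e.g. t.clone("_split") keeps t's equivalence_id, so both resolve to the same
    # address via TensorAddressMap, whereas t.clone(set_unique=True) does not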

    def clone_into_fast_storage(self, arch) -> "Tensor":
        res = self.clone(suffix="_fast_storage")
        res.mem_area = arch.fast_storage_mem_area
        res.mem_type = MemType.Scratch_fast
        res.src_tensor = self
        return res

    def copy_compressed_weight_info(self, src_tens: "Tensor"):
        # Copies compressed values + all related weight compression info from the given tensor
        self.equivalence_id = src_tens.equivalence_id
        self.compressed_values = src_tens.compressed_values
        self.compressed_values_substream_offsets = src_tens.compressed_values_substream_offsets
        self.storage_shape = src_tens.storage_shape
        self.brick_size = src_tens.brick_size
        self.weight_compression_scales = src_tens.weight_compression_scales
        self.weight_compressed_offsets = src_tens.weight_compressed_offsets
        self.weight_transpose_depthwise = src_tens.weight_transpose_depthwise
        self.compression_scale_for_worst_weight_stream = src_tens.compression_scale_for_worst_weight_stream
        self.storage_compression_scale = src_tens.storage_compression_scale
        self.bandwidth_compression_scale = src_tens.bandwidth_compression_scale
        self.block_traversal = src_tens.block_traversal
        self.weight_compression_config = src_tens.weight_compression_config
        self.value_id = src_tens.value_id

    def set_format(self, fmt: TensorFormat, arch):
        self.format = fmt
        shape_len = 0
        try:
            shape_len = len(self.shape)
        except TypeError:
            pass

        if shape_len > 4:
            return
        assert not (self.needs_linear_format and fmt == TensorFormat.NHCWB16)
        self.storage_rounding_quantum = arch.storage_rounding_quantums[self.format]
        self.storage_rounding_quantum = tuple(self.storage_rounding_quantum[-shape_len:])
        self.brick_size = arch.brick_sizes[self.format]
        self.brick_size = tuple(self.brick_size[-shape_len:])
        if self.shape is None:
            return

        self.bandwidth_shape = shape_round_to_quantum(self.shape, self.brick_size)
        self.storage_shape = shape_round_to_quantum(self.shape, self.storage_rounding_quantum)

        if fmt == TensorFormat.WeightsCompressed:
            compression_ratio = 5 / 8
            self.storage_compression_scale = compression_ratio
            self.bandwidth_compression_scale = compression_ratio
            self.compression_scale_for_worst_weight_stream = compression_ratio
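    # e.g. assuming the usual NHCWB16 storage rounding quantum of (1, 1, 1, 16),
    # a tensor of shape [1, 7, 7, 20] gets storage_shape [1, 7, 7, 32]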

    def storage_elements(self) -> int:
        elems = shape_num_elements(self.storage_shape)
        if elems is None:
            return 0
        return elems

    def elements(self) -> int:
        elems = shape_num_elements(self.shape)
        if elems is None:
            return 0
        return elems

    def has_fully_defined_shape(self) -> bool:
        return shape_fully_defined(self.shape)

    def storage_size(self, scale: float = 1.0) -> int:
        raw_size = self.storage_elements() * self.element_size() * scale
        if raw_size == 0:
            raw_size = 1  # force it to take up space
        rounded_size = numeric_util.round_up(numeric_util.round_up_to_int(raw_size), self.alignment)
        return rounded_size
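    # e.g. an int8 tensor with storage_shape [1, 7, 7, 32] and the default 16-byte
    # alignment has storage_size() == 7 * 7 * 32 == 1568, already a multiple of 16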

    def storage_size_for_shape(self, op_storage_shape: Shape) -> int:
        elems = shape_num_elements(op_storage_shape)
        elems = elems if elems else 0
        raw_size = elems * self.element_size()
        if raw_size == 0:
            raw_size = 1  # force it to take up space
        rounded_size = numeric_util.round_up(numeric_util.round_up_to_int(raw_size), self.alignment)
        return rounded_size

    def storage_shape_for_sub_purpose(
        self, sub_purpose: TensorSubPurpose, param_a: Optional[int], param_b: Optional[int]
    ) -> Shape:
        if sub_purpose == TensorSubPurpose.DoubleBuffer:
            shp = list(self.shape)
            assert len(shp) >= 2
            assert param_a is not None
            shp[-1] = min(shp[-1], param_a * 2)
        else:
            shp = full_shape(4, self.storage_shape, 1)
            if sub_purpose == TensorSubPurpose.RollingBufferX:
                assert len(shp) == 4
                assert param_a is not None
                shp[0] = 1
                shp[2] = min(shp[2], param_a)
            elif sub_purpose == TensorSubPurpose.RollingBufferY:
                assert len(shp) == 4
                assert param_a is not None
                shp[0] = 1
                shp[1] = min(shp[1], param_a)
            elif sub_purpose == TensorSubPurpose.RollingBufferXY:
                assert len(shp) == 4
                assert param_a is not None
                assert param_b is not None
                shp[0] = 1
                shp[2] = min(shp[2], param_a)
                shp[1] = min(shp[1], param_b)
            elif sub_purpose == TensorSubPurpose.Standard:
                pass
            else:
                assert 0, "did not expect new sub purpose %s" % (sub_purpose,)

        return shp

    def set_new_sub_purpose(self, sub_purpose: TensorSubPurpose, param_a=None, param_b=None):
        self.storage_shape = self.storage_shape_for_sub_purpose(sub_purpose, param_a, param_b)
        self.sub_purpose = sub_purpose
        if sub_purpose == TensorSubPurpose.DoubleBuffer:
            self.storage_compression_scale = self.compression_scale_for_worst_weight_stream

    def bandwidth(self) -> float:
        elems = shape_num_elements(self.bandwidth_shape)
        if elems is None:
            return 0
        return elems * self.element_size() * self.bandwidth_compression_scale

    def consumers(self) -> List[Operation]:
        return self.consumer_list

    def get_4D_storage_shape_for_shape(self, op_shape4D: Shape4D) -> Shape4D:
        rounding_quantum = full_shape(4, list(self.storage_rounding_quantum), 1)
        return Shape4D(shape_round_to_quantum(op_shape4D.as_list(), rounding_quantum))

    def addresses_for_rolling_buffer(self, start_coord: Shape, end_coord: Shape, op_shape4D: Shape4D) -> Tuple:
        # returns ( box_height0, box_height1, box_width, [address_tl, address_tr, address_bl, address_br] )

        if self.storage_shape == []:
            return (
                1,
                1,
                1,
                [self.address_for_coordinate(start_coord, op_shape4D=op_shape4D), None, None, None],
            )

        if self.is_standard_fm:
            storage_shape_4D = self.get_4D_storage_shape_for_shape(op_shape4D)
        else:
            storage_shape_4D = Shape4D(self.storage_shape)

        crossing_y = numeric_util.round_up(start_coord[1] + 1, storage_shape_4D.height)
        crossing_x = numeric_util.round_up(start_coord[2] + 1, storage_shape_4D.width)

        crossing_y = min(crossing_y, end_coord[1])
        crossing_x = min(crossing_x, end_coord[2])

        box_height0 = crossing_y - start_coord[1]
        box_width = crossing_x - start_coord[2]

        addresses: List = [None] * 4
        addresses[0] = self.address_for_coordinate(start_coord, op_shape4D=op_shape4D)

        if end_coord[2] > crossing_x:
            addresses[1] = self.address_for_coordinate(
                [start_coord[0], start_coord[1], crossing_x, start_coord[3]], op_shape4D=op_shape4D
            )
            raise UnsupportedFeatureError("Striping in vertical direction is not supported")
        if end_coord[1] > crossing_y:
            addresses[2] = self.address_for_coordinate(
                [start_coord[0], crossing_y, start_coord[2], start_coord[3]], op_shape4D=op_shape4D
            )
        if end_coord[1] > crossing_y and end_coord[2] > crossing_x:
            addresses[3] = self.address_for_coordinate(
                [start_coord[0], crossing_y, crossing_x, start_coord[3]], op_shape4D=op_shape4D
            )

        return box_height0, box_height0, box_width, addresses

    def address_for_coordinate(self, coord: Shape, is_top_box: bool = False, op_shape4D: Shape4D = None) -> int:
        offset = self.address_offset_for_coordinate(coord, op_shape4D=op_shape4D, is_top_box=is_top_box)
        assert offset is not None
        return self.address + offset

    def get_strides_and_coord(
        self, coord: Optional[Shape] = None, shape4D: Optional[Shape4D] = None
    ) -> Tuple[Optional[Shape], Optional[Shape]]:
        if coord is None:
            coord = [0] * min(len(self.storage_shape), 4)

        if shape4D and self.is_standard_fm:
            augmented_shape = self.get_4D_storage_shape_for_shape(shape4D).as_list()
        else:
            augmented_shape = full_shape(4, self.storage_shape, 1)

        augmented_coord = coord

        while len(augmented_coord) < 4:
            augmented_coord = [0] + augmented_coord

        assert len(augmented_coord) == len(augmented_shape)

        if self.format == TensorFormat.NHWC:
            augmented_shape = [augmented_shape[0], augmented_shape[3]] + augmented_shape[1:3] + [1]
            augmented_coord = [augmented_coord[0], augmented_coord[3]] + augmented_coord[1:3] + [0]

        elif self.format == TensorFormat.NHCWB16:
            channel_divisor = 16
            augmented_shape = augmented_shape[0:4] + [1]
            augmented_coord = (
                [augmented_coord[0], augmented_coord[3] // channel_divisor]
                + augmented_coord[1:3]
                + [augmented_coord[3] % channel_divisor]
            )

            if augmented_shape[1] == 0:
                augmented_shape[1] = 1

        else:
            assert self.format in (TensorFormat.Unknown, TensorFormat.WeightsCompressed)
            return None, None

        strides: List = [0] * len(augmented_shape)
        stride = self.element_size() * self.storage_compression_scale

        if self.format != TensorFormat.NHCWB16:
            stride_order = [4, 1, 3, 2, 0]
            for i in stride_order:
                strides[i] = stride
                stride *= augmented_shape[i]
        else:
            assert len(strides) == 5
            strides[4] = stride
            strides[3] = 16 * stride  # STRIDE_X
            strides[1] = strides[3] * augmented_shape[2]  # STRIDE_C
            strides[2] = augmented_shape[2] * augmented_shape[3] * stride  # STRIDE_Y
            strides[0] = strides[2] * augmented_shape[1]  # STRIDE_N

        return strides, augmented_coord
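    # Worked example (illustrative): an int8 NHWC tensor with storage_shape
    # [1, 4, 4, 8] is augmented to shape [1, 8, 4, 4, 1] with byte strides
    # [128, 1, 32, 8, 1]; moving one channel costs 1 byte, one column (W) 8,
    # one row (H) 32 and one batch 128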

    def get_strides(self, shape4D: Optional[Shape4D] = None) -> Shape:
        strides, _ = self.get_strides_and_coord(shape4D=shape4D)
        assert strides is not None
        return strides

    def find_npu_op(self) -> Optional[Operation]:
        # Returns the NPU operator that uses this tensor
        for op in self.consumers():
            if op.run_on_npu:
                return op
        return None

    def compressed_stream_index_from_coord(self, coord: Shape) -> int:
        assert self.format == TensorFormat.WeightsCompressed
        assert self.compressed_values is not None
        assert len(self.compressed_values) > 0
        assert len(self.compressed_values) + 1 == len(self.weight_compressed_offsets)

        depth = coord[-1]
        brick_depth = self.brick_size[-1]
        # Clamp position at final element index
        if depth > self.shape[-1]:
            depth = self.shape[-1]

        # Always round up to next boundary
        index = numeric_util.round_up_divide(depth, brick_depth)

        # Check boundaries on all but last weight set (which may be shorter
        # than the brick we divided it up into)
        if index < len(self.weight_compressed_offsets) - 1:
            # There are no half-way points in the weights
            if (depth % brick_depth) != 0:
                raise UnsupportedFeatureError("Offset into weights must be aligned to a brick")

        return index
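    # e.g. with brick_size[-1] == 32 and shape[-1] == 80, a depth coordinate of 64
    # maps to stream index 2, while a depth of 40 raises UnsupportedFeatureError
    # because it is not aligned to a brick boundary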

    def size_of_compressed_stream(self, index: int) -> int:
        assert self.compressed_values is not None
        assert 0 <= index < len(self.compressed_values)
        return len(self.compressed_values[index])

    def is_last_index_in_compressed_stream(self, index: int) -> bool:
        assert self.compressed_values is not None
        assert 0 <= index < len(self.compressed_values)
        return index == len(self.compressed_values) - 1

    def address_offset_for_coordinate(
        self, orig_coord: Shape, op_shape4D: Optional[Shape4D] = None, is_top_box: bool = False
    ) -> Optional[int]:
        address_offset = 0
        assert self.purpose != TensorPurpose.Weights

        if self.sub_purpose == TensorSubPurpose.Standard:
            shape = op_shape4D.as_list() if op_shape4D else self.shape
            for idx, c in enumerate(orig_coord):
                if is_top_box:
                    assert c > 0 and c <= shape[idx]
                else:
                    assert c >= 0 and c < shape[idx]
        coord = orig_coord
        if op_shape4D and self.is_standard_fm:
            storage_shape = self.get_4D_storage_shape_for_shape(op_shape4D).as_list()
            storage_size = self.storage_size_for_shape(storage_shape)
        else:
            storage_shape = self.storage_shape
            coord = coord[-len(storage_shape) :]
            storage_size = self.storage_size()

        if is_top_box:
            coord = [c - 1 for c in coord]

        # Handle wraparound for partial buffers; make sure to do this after subtracting the top box
        coord = [c % storage_shape[idx] for idx, c in enumerate(coord)]

        strides, augmented_coord = self.get_strides_and_coord(coord, op_shape4D)
        if strides is None:
            return None

        if is_top_box:
            address_offset += 1 * strides[-1]  # one element

        address_offset += np.dot(augmented_coord, strides)

        assert address_offset >= 0
        assert address_offset <= storage_size
        return address_offset

    def is_allocated_in_tensor_arena(self, scratch_tensor_mem_area: MemArea) -> bool:
        return (self.mem_area == scratch_tensor_mem_area) and (self.mem_type in (MemType.Scratch, MemType.Scratch_fast))

    def equivalent(self, tens: "Tensor") -> bool:
        return self.equivalence_id == tens.equivalence_id

    def set_all_shapes(self, shape: Shape):
        self.shape = shape
        self.storage_shape = shape
        self.bandwidth_shape = shape

    def get_full_shape(self) -> Shape:
        d = len(self.shape)
        if d in (1, 3):
            return full_shape(4, self.shape, 1)
        elif d == 2:
            return [self.shape[0], 1, 1, self.shape[1]]
        else:
            return self.shape.copy()
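    # e.g. a 2D shape [32, 10] becomes [32, 1, 1, 10], while a 3D shape [8, 8, 16]
    # is padded on the left to [1, 8, 8, 16]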
Michael McGeagh5778ffd2020-08-06 17:31:02 +0100806
Louis Verhaard93719a92020-12-08 10:02:31 +0100807 def is_quantized(self) -> bool:
Tim Hall93582962020-09-09 21:58:15 +0100808 # a tensor is quantized if it has an integral type and it contains valid quantization params
809
Tim Hall89567612020-10-27 11:57:57 +0000810 if not isinstance(self.quantization, QuantizationParameters):
Tim Hall93582962020-09-09 21:58:15 +0100811 return False
812
Tim Hall89567612020-10-27 11:57:57 +0000813 return (self.dtype.type & BaseType.Int) != 0 and self.quantization.is_valid()
Tim Hall93582962020-09-09 21:58:15 +0100814
James Peet7519d502021-07-19 16:47:58 +0100815 def get_scalar(self):
816 """
817 return: Unquantized or dequantized scalar value
818 rtype: self.dtype (if unquantized) or float (if dequantized)
819 """
820 assert self.values.size == 1, "get_scalar called on non-scalar tensor"
821 if self.is_quantized():
822 return self.quantization.dequantize(self.values).item(0)
823 else:
824 return self.values.item(0)
825
Louis Verhaard6c74c3b2020-12-17 13:54:09 +0100826 def __lt__(self, other: "Tensor") -> bool:
827 return self.equivalence_id < other.equivalence_id
828
Tim Hall79d07d22020-04-27 18:20:16 +0100829 def __str__(self):
830 return "<nng.Tensor '%s' shape=%s dtype=%s>" % (self.name, self.shape, self.dtype)
831
832 __repr__ = __str__
Tim Hall93582962020-09-09 21:58:15 +0100833
Michael McGeagh528a56d2020-12-16 11:33:21 +0000834 def error(self, msg):
835 """
836 Raises a VelaError exception for errors encountered when parsing a Tensor
837
838 :param self: Tensor object that resulted in the error
839 :param msg: str object that contains a description of the specific error encountered
840 """
841
842 def _print_operators(ops):
843 lines = []
844 for idx, op in enumerate(ops):
845 op_type = getattr(op, "type", "Not an Operation")
846 op_id = getattr(op, "op_index", "-")
847 lines.append(f" {idx} = {op_type} ({op_id})")
848 return lines
849
850 lines = [f"Invalid {self.name} tensor. {msg}"]
851
852 lines += [" Driving operators:"]
853 lines += _print_operators(self.ops)
854
855 lines += [" Consuming operators:"]
856 lines += _print_operators(self.consumer_list)
857
858 raise VelaError("\n".join(lines))


def check_quantized_tens_scaling_equal(tens_a: Tensor, tens_b: Tensor) -> bool:
    # Checks that the scaling of two quantized tensors is equal

    return tens_a.is_quantized() and tens_b.is_quantized() and tens_a.quantization.is_scaling_equal(tens_b.quantization)
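# Note that this returns False when either tensor is unquantized, so a True result
# guarantees that both scalings are known and equal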