# SPDX-FileCopyrightText: Copyright 2020-2023 Arm Limited and/or its affiliates <open-source-office@arm.com>
#
# SPDX-License-Identifier: Apache-2.0
#
# Licensed under the Apache License, Version 2.0 (the License); you may
# not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an AS IS BASIS, WITHOUT
# WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#
# Description:
# Internal representation of a Neural Network Tensor.
import copy
import enum
import uuid
from collections import defaultdict
from enum import auto
from functools import lru_cache
from functools import total_ordering
from typing import Dict
from typing import List
from typing import Optional
from typing import Tuple
from typing import Union
from uuid import UUID

import numpy as np

from . import numeric_util
from .data_type import BaseType
from .data_type import DataType
from .errors import UnsupportedFeatureError
from .errors import VelaError
from .numeric_util import full_shape
from .operation import Op
from .operation import Operation
from .shape4d import Shape4D

Shape = List


class MemType(enum.IntFlag):
    Unknown = 0
    Permanent_NPU = 1
    Permanent_CPU = 2
    Scratch = 3
    Scratch_fast = 4
    Size = Scratch_fast + 1

    def display_name(self) -> str:
        return ("Unknown", "Permanent_NPU", "Permanent_CPU", "Scratch", "Scratch_fast", "Size")[self.value]

    def identifier_name(self) -> str:
        return ("unknown", "permanent_npu", "permanent_cpu", "scratch", "scratch_fast", "size")[self.value]

    @staticmethod
    def all():
        return (MemType.Permanent_NPU, MemType.Permanent_CPU, MemType.Scratch, MemType.Scratch_fast)

    def __str__(self):
        return self.name


class BandwidthDirection(enum.IntEnum):
    Read = 0
    Write = auto()
    Size = auto()

    def display_name(self):
        return self.name

    def identifier_name(self):
        return self.name.lower()

    @staticmethod
    def all():
        return (BandwidthDirection.Read, BandwidthDirection.Write)


class MemArea(enum.IntFlag):
    Unknown = 0
    Sram = 1
    Dram = 2
    OnChipFlash = 3
    OffChipFlash = 4
    Shram = 5  # for LUT
    Size = Shram + 1

    def display_name(self) -> str:
        return ("Unknown", "SRAM", "DRAM", "On-chip Flash", "Off-chip Flash", "SHRAM", "Size")[self.value]

    def identifier_name(self) -> str:
        return ("unknown", "sram", "dram", "on_chip_flash", "off_chip_flash", "shram", "size")[self.value]

    @staticmethod
    def all():
        return (MemArea.Sram, MemArea.Dram, MemArea.OnChipFlash, MemArea.OffChipFlash, MemArea.Shram)

    def __str__(self):
        return self.name


class TensorPurpose(enum.IntFlag):
    Unknown = 0
    Weights = 1
    FeatureMap = 2
    Scratch = 3
    ScratchFast = 4
    LUT = 5
    FSBias = 6
    Size = 7

    def display_name(self) -> str:
        return ("Unknown", "Weights", "FeatureMap", "Scratch", "ScratchFast", "LUT", "FastStorageBias", "Size")[
            self.value
        ]

    def identifier_name(self) -> str:
        return ("unknown", "weights", "feature_map", "scratch", "scratch_fast", "lut", "fast_storage_bias", "size")[
            self.value
        ]

    @staticmethod
    def all():
        return (TensorPurpose.Weights, TensorPurpose.FeatureMap, TensorPurpose.FSBias)


class TensorSubPurpose(enum.Enum):
    Standard = 0
    DoubleBuffer = 1
    RollingBufferX = 2
    RollingBufferY = 3
    RollingBufferXY = 4

    def display_name(self) -> str:
        return ("Standard", "Double Buffer", "Rolling Buffer X", "Rolling Buffer Y", "Rolling Buffer XY")[self.value]

    def identifier_name(self) -> str:
        return ("standard", "double_buffer", "rolling_buffer_x", "rolling_buffer_y", "rolling_buffer_xy")[self.value]

    @staticmethod
    def all():
        return (
            TensorSubPurpose.Standard,
            TensorSubPurpose.DoubleBuffer,
            TensorSubPurpose.RollingBufferX,
            TensorSubPurpose.RollingBufferY,
            TensorSubPurpose.RollingBufferXY,
        )


class TensorFormat(enum.Flag):
    Unknown = 0
    WeightsCompressed = 1
    NHWC = 2
    NHCWB16 = 3

    def __str__(self):
        return self.name


class TensorBlockTraversal(enum.Enum):
    Default = 0
    DepthWise = 1
    DepthFirst = 2
    PartKernelFirst = 3


def shape_num_elements(shp: Shape) -> Optional[int]:
    elems = 1
    if shp is None:
        return None
    for d in shp:
        if d is None:
            return None
        elems *= d
    return elems


def shape_fully_defined(shp: Shape) -> bool:
    if shp is None:
        return False
    for d in shp:
        if d is None:
            return False
    return True


def shape_round_to_quantum(shp: Shape, quantum: Tuple) -> Shape:
    new_shp = list(shp)

    # Traverse backwards using length of shape since there may be more rounding quantums than shape elements
    for i in range(-1, -len(shp) - 1, -1):
        if new_shp[i] is not None:
            new_shp[i] = numeric_util.round_up(new_shp[i], quantum[i])
    return new_shp
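

# Example (illustrative): with a NHCWB16-style rounding quantum of (1, 1, 1, 16),
# shape_round_to_quantum([1, 7, 7, 20], (1, 1, 1, 16)) returns [1, 7, 7, 32];
# only the channel dimension needs rounding up.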


@lru_cache(maxsize=None)
def create_equivalence_id(key) -> UUID:
    # Generates equivalence_id based on the given key.
    return uuid.uuid4()
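

# Note (illustrative): because of the lru_cache, the generated UUID is memoised
# per key, so repeated calls with an equal (hashable) key return the same UUID:
#     create_equivalence_id(("scale", 0.5)) is create_equivalence_id(("scale", 0.5))  # True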


class QuantizationParameters:
    __slots__ = (
        "min",
        "max",
        "num_bits",
        "narrow_range",
        "next_after",
        "scale_f32",
        "zero_point",
        "quant_min",
        "quant_max",
        "quant_dim",
    )

    def __init__(
        self,
        min: Union[float, np.ndarray, None] = None,
        max: Union[float, np.ndarray, None] = None,
        num_bits=None,
        narrow_range=None,
    ):
        self.min = min
        self.max = max

        self.num_bits = num_bits
        self.narrow_range = narrow_range

        # Use the 'next after' float value of scale_f32 when converting to scale and shift. It can be combined with
        # natural rounding to perform rounding away from zero. This only affects the ofm scale and bias tensor; it has
        # no effect on global scaling, i.e. the ofm_scale register
        self.next_after = False
        self.scale_f32: Union[float, np.ndarray, None] = None
        self.zero_point: Union[int, np.ndarray, None] = None
        self.quant_min: Optional[float] = None
        self.quant_max: Optional[float] = None
        self.quant_dim: Optional[int] = None

    def __str__(self):
        return (
            f"<nng.QuantizationParameters min={self.min}, max={self.max}, num_bits={self.num_bits}, "
            f"scale={self.scale_f32}, zero_point={self.zero_point}, next={self.next_after}>"
        )

    __repr__ = __str__

    def clone(self) -> "QuantizationParameters":
        res = QuantizationParameters()
        res.min = self.min
        res.max = self.max

        res.num_bits = self.num_bits
        res.narrow_range = self.narrow_range

        res.next_after = self.next_after
        res.scale_f32 = self.scale_f32
        res.zero_point = self.zero_point
        res.quant_min = self.quant_min
        res.quant_max = self.quant_max
        res.quant_dim = self.quant_dim
        return res

    def dequantize(self, values) -> np.ndarray:
        return np.subtract(values, self.zero_point) * self.scale_f32
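
    # Illustrative example: with scale_f32 == 0.5 and zero_point == 128,
    # dequantize(np.array([128, 130], dtype=np.uint8)) gives array([0.0, 1.0]).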

    def is_scaling_equal(self, other: Optional["QuantizationParameters"]) -> bool:
        """
        Returns True if the scale and zero point of self and other are equal. If other is None then the scaling is
        not considered equal, because the tensor is assumed not to be quantised, and False will be returned
        """

        if not isinstance(other, QuantizationParameters):
            return False

        return self.scale_f32 == other.scale_f32 and self.zero_point == other.zero_point

    def is_valid(self) -> bool:
        """Return True if the quantisation parameters have a scale and zero point"""

        return self.scale_f32 is not None and self.zero_point is not None

    def is_per_axis(self) -> bool:
        """Returns True if any of the scale, zero point, minimum or maximum values have more than one value"""

        for attr in ("scale_f32", "zero_point", "min", "max"):
            if np.size(getattr(self, attr)) > 1:
                return True
        return False
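
    # Illustrative example of per-axis quantisation: a scale_f32 of
    # np.array([0.1, 0.2, 0.4]) (one scale per output channel) makes
    # is_per_axis() return True, whereas a scalar scale_f32 of 0.1 does not.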


def create_const_tensor(
    name: str,
    shape: Shape,
    dtype: DataType,  # datatype of the tensor
    values: Optional[Union[np.ndarray, list]],  # list-like data of some type, or scalar (skip mypy), or None
    purpose: TensorPurpose = TensorPurpose.Unknown,
    quantization: Optional[QuantizationParameters] = None,
):
    assert isinstance(dtype, DataType)

    # Tensor
    const_tensor = Tensor(shape, dtype, name + "_0")
    const_tensor.purpose = purpose
    const_tensor.quantization = quantization

    # if the tensor datatype does not match that of the values then np.array() will perform a cast operation. this
    # can result in undefined behaviour if casting from a numpy float to a numpy unsigned integer. therefore, we need
    # to avoid this undefined behaviour by converting the numpy floats to python floats as these give the desired
    # behaviour when casting to unsigned integers
    if (
        values is not None
        and shape != []  # values are not a scalar
        and isinstance(values[0], np.floating)
        and dtype.type == BaseType.Unsigned
    ):
        values = [float(v) for v in values]

    const_tensor.values = np.array(values, dtype=dtype.as_numpy_type())
    # Operator
    const_op = Operation(Op.Const, name)
    const_op.set_output_tensor(const_tensor)
    const_op.set_ifm_ofm_shapes()
    return const_tensor
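

# Example usage (illustrative names and values only):
#     q = QuantizationParameters(min=0.0, max=25.5)
#     q.scale_f32, q.zero_point = 0.1, 0
#     t = create_const_tensor("bias_fixup", [4], DataType.uint8, [1, 2, 3, 4], quantization=q)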


# class that keeps track of all tensor addresses in the different memory types
class TensorAddressMap:
    address_map: Dict = defaultdict(dict)  # dict (tens.equivalence_id -> dict (mem_type -> address))

    @classmethod
    def get_address_for_tens(cls, tens_id: UUID, mem_type: MemType) -> Optional[int]:
        return cls.address_map[tens_id].get(mem_type)

    @classmethod
    def set_address_for_tens(cls, tens_id: UUID, mem_type: MemType, address: int):
        # Check previous address if there is one
        previous_address = cls.address_map[tens_id].get(mem_type)
        if address is not None and previous_address is not None:
            assert previous_address == address, "Two different addresses cannot be assigned to the same tensor."

        # Set tensor's address for memory type
        cls.address_map[tens_id][mem_type] = address
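
    # Note (illustrative): addresses are keyed on equivalence_id, so two tensors
    # that share an equivalence_id (e.g. a clone created without set_unique)
    # resolve to the same address within a given memory type.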


@total_ordering
class Tensor:
    __slots__ = (
        "shape",
        "_original_shape",
        "storage_shape",
        "bandwidth_shape",
        "dtype",
        "name",
        "is_variable",
        "pre_buffer",
        "ops",
        "consumer_list",
        "values",
        "compressed_values",
        "compressed_values_substream_offsets",
        "mem_area",
        "mem_type",
        "format",
        "purpose",
        "sub_purpose",
        "alignment",
        "weight_transpose_depthwise",
        "storage_compression_scale",
        "bandwidth_compression_scale",
        "compression_scale_for_worst_weight_stream",
        "weight_compression_scales",
        "weight_compression_config",
        "value_id",
        "storage_rounding_quantum",
        "brick_size",
        "quantization",
        "weight_compressed_offsets",
        "element_size_bytes",
        "block_traversal",
        "equivalence_id",
        "src_tensor",
        "needs_linear_format",
        "ifm_write_protected",
    )
    AllocationQuantum = 16

    def __init__(self, shape: Shape, dtype: DataType, name: str):
        self.shape = shape
        self._original_shape = shape
        self.storage_shape = shape
        self.bandwidth_shape = shape
        self.dtype = dtype
        self.name = name
        self.is_variable = False
        self.pre_buffer = False
        self.equivalence_id: UUID = uuid.uuid4()

        self.ops: List[Operation] = []
        self.consumer_list: List[Operation] = []

        self.values: Optional[np.ndarray] = None  # elements are of type self.dtype
        self.compressed_values: Optional[np.ndarray] = None
        self.compressed_values_substream_offsets: Optional[List] = None
        self.mem_area: MemArea = MemArea.Unknown
        self.mem_type: MemType = MemType.Unknown
        self.format: TensorFormat = TensorFormat.Unknown
        self.purpose: TensorPurpose = TensorPurpose.Unknown
        self.sub_purpose: TensorSubPurpose = TensorSubPurpose.Standard
        self.alignment: int = Tensor.AllocationQuantum
        self.weight_transpose_depthwise: bool = False

        self.storage_compression_scale: float = 1.0
        self.bandwidth_compression_scale: float = 1.0
        self.compression_scale_for_worst_weight_stream: float = 1.0
        self.weight_compression_scales: Optional[np.ndarray] = None
        # if two tensors have the same weight_compression_config, then they have the same compressed values
        self.weight_compression_config = None
        # if two tensors have the same value_id, then they have the same values
        self.value_id: UUID = uuid.uuid4()
        self.weight_compressed_offsets: List = []
        self.storage_rounding_quantum: Tuple = (1, 1, 1, 1)
        self.brick_size: Tuple = (1, 1, 1, 1)
        self.element_size_bytes: int = 0

        # quantization parameters
        self.quantization: Optional[QuantizationParameters] = None
        self.block_traversal: TensorBlockTraversal = TensorBlockTraversal.Default

        self.needs_linear_format = True
        self.ifm_write_protected = False

        # Reference to parent-tensor if this tensor is a clone
        self.src_tensor: Optional[Tensor] = None

    @property
    def original_shape(self):
        return self._original_shape

    @property
    def address(self) -> Optional[int]:
        return TensorAddressMap.get_address_for_tens(self.equivalence_id, self.mem_type)

    @address.setter
    def address(self, address: int):
        TensorAddressMap.set_address_for_tens(self.equivalence_id, self.mem_type, address)

    @property
    def is_standard_fm(self) -> bool:
        return self.sub_purpose == TensorSubPurpose.Standard and self.purpose == TensorPurpose.FeatureMap

    @property
    def is_const(self) -> bool:
        return self.ops != [] and self.ops[0].type == Op.Const

    @property
    def is_scalar(self) -> bool:
        return self.shape == [] and self.elements() == 1

    def is_broadcast(self, ofm) -> bool:
        return self.shape != ofm.shape

    def element_size(self) -> int:
        if self.element_size_bytes == 0:
            return self.dtype.size_in_bits() // 8
        return self.element_size_bytes
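
    # Illustrative example: for an int8 tensor element_size() returns 1 and for
    # an int32 tensor it returns 4, unless element_size_bytes has been set
    # explicitly (e.g. for compressed weights).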

    # Returns a copy, renamed to self.name + suffix
    # The references to Operators will be empty when returned
    # The copy is shallow, but shape lists and quantization parameters are copied
    # For set_unique==True, a new equivalence_id will be set
    def clone(self, suffix="_clone", set_unique: bool = False) -> "Tensor":
        res = copy.copy(self)
        if set_unique:
            res.equivalence_id = uuid.uuid4()
        res.storage_shape = list(self.storage_shape)
        res.bandwidth_shape = list(self.bandwidth_shape)
        if self.quantization is not None:
            res.quantization = self.quantization.clone()

        res.name = res.name + suffix
        res.ops = []
        res.consumer_list = []

        return res

    def clone_into_fast_storage(self, arch) -> "Tensor":
        res = self.clone(suffix="_fast_storage")
        res.mem_area = arch.fast_storage_mem_area
        res.mem_type = MemType.Scratch_fast
        res.src_tensor = self
        return res

    def as_1D(self):
        self.shape = [np.prod(self.shape)]
        if self.values is not None:
            self.values = self.values.reshape(self.shape)

    def transpose(self, reorder):
        self.shape = [self.shape[idx] for idx in reorder]
        self._original_shape = [self._original_shape[idx] for idx in reorder]
        if self.values is not None:
            self.values = self.values.transpose(reorder)

    def copy_compressed_weight_info(self, src_tens: "Tensor"):
        # Copies compressed values + all related weight compression info from the given tensor
        self.equivalence_id = src_tens.equivalence_id
        self.compressed_values = src_tens.compressed_values
        self.compressed_values_substream_offsets = src_tens.compressed_values_substream_offsets
        self.storage_shape = src_tens.storage_shape
        self.brick_size = src_tens.brick_size
        self.weight_compression_scales = src_tens.weight_compression_scales
        self.weight_compressed_offsets = src_tens.weight_compressed_offsets
        self.weight_transpose_depthwise = src_tens.weight_transpose_depthwise
        self.compression_scale_for_worst_weight_stream = src_tens.compression_scale_for_worst_weight_stream
        self.storage_compression_scale = src_tens.storage_compression_scale
        self.bandwidth_compression_scale = src_tens.bandwidth_compression_scale
        self.block_traversal = src_tens.block_traversal
        self.weight_compression_config = src_tens.weight_compression_config
        self.value_id = src_tens.value_id

    def set_format(self, fmt: TensorFormat, arch):
        self.format = fmt
        shape_len = 0
        try:
            shape_len = len(self.shape)
        except TypeError:
            pass

        if shape_len > 4:
            return
        assert not (self.needs_linear_format and fmt == TensorFormat.NHCWB16)
        self.storage_rounding_quantum = arch.storage_rounding_quantums[self.format]
        self.storage_rounding_quantum = tuple(self.storage_rounding_quantum[-shape_len:])
        self.brick_size = arch.brick_sizes[self.format]
        self.brick_size = tuple(self.brick_size[-shape_len:])
        if self.shape is None:
            return

        self.bandwidth_shape = shape_round_to_quantum(self.shape, self.brick_size)
        self.storage_shape = shape_round_to_quantum(self.shape, self.storage_rounding_quantum)

        if fmt == TensorFormat.WeightsCompressed:
            compression_ratio = 5 / 8
            self.storage_compression_scale = compression_ratio
            self.bandwidth_compression_scale = compression_ratio
            self.compression_scale_for_worst_weight_stream = compression_ratio

    def storage_elements(self) -> int:
        elems = shape_num_elements(self.storage_shape)
        if elems is None:
            return 0
        return elems

    def elements(self) -> int:
        elems = shape_num_elements(self.shape)
        if elems is None:
            return 0
        return elems

    def has_fully_defined_shape(self) -> bool:
        return shape_fully_defined(self.shape)

    def storage_size(self, scale: float = 1.0) -> int:
        raw_size = self.storage_elements() * self.element_size() * scale
        if raw_size == 0:
            raw_size = 1  # force it to take up space
        rounded_size = numeric_util.round_up(numeric_util.round_up_to_int(raw_size), self.alignment)
        return rounded_size
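
    # Illustrative example: a tensor with 100 storage elements of 1 byte each and
    # the default alignment of 16 occupies round_up(100, 16) == 112 bytes.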

    def storage_size_for_shape(self, op_storage_shape: Shape) -> int:
        elems = shape_num_elements(op_storage_shape)
        elems = elems if elems else 0
        raw_size = elems * self.element_size()
        if raw_size == 0:
            raw_size = 1  # force it to take up space
        rounded_size = numeric_util.round_up(numeric_util.round_up_to_int(raw_size), self.alignment)
        return rounded_size

    def storage_shape_for_sub_purpose(
        self, sub_purpose: TensorSubPurpose, param_a: Optional[int], param_b: Optional[int]
    ) -> Shape:
        if sub_purpose == TensorSubPurpose.DoubleBuffer:
            shp = list(self.shape)
            assert len(shp) >= 2
            assert param_a is not None
            shp[-1] = min(shp[-1], param_a * 2)
        else:
            shp = full_shape(4, self.storage_shape, 1)
            if sub_purpose == TensorSubPurpose.RollingBufferX:
                assert len(shp) == 4
                assert param_a is not None
                shp[0] = 1
                shp[2] = min(shp[2], param_a)
            elif sub_purpose == TensorSubPurpose.RollingBufferY:
                assert len(shp) == 4
                assert param_a is not None
                shp[0] = 1
                shp[1] = min(shp[1], param_a)
            elif sub_purpose == TensorSubPurpose.RollingBufferXY:
                assert len(shp) == 4
                assert param_a is not None
                assert param_b is not None
                shp[0] = 1
                shp[2] = min(shp[2], param_a)
                shp[1] = min(shp[1], param_b)
            elif sub_purpose == TensorSubPurpose.Standard:
                pass
            else:
                assert 0, "did not expect new sub purpose %s" % (sub_purpose,)

        return shp

    def set_new_sub_purpose(self, sub_purpose: TensorSubPurpose, param_a=None, param_b=None):
        self.storage_shape = self.storage_shape_for_sub_purpose(sub_purpose, param_a, param_b)
        self.sub_purpose = sub_purpose
        if sub_purpose == TensorSubPurpose.DoubleBuffer:
            self.storage_compression_scale = self.compression_scale_for_worst_weight_stream

    def bandwidth(self) -> float:
        elems = shape_num_elements(self.bandwidth_shape)
        if elems is None:
            return 0
        return elems * self.element_size() * self.bandwidth_compression_scale

    def consumers(self) -> List[Operation]:
        return self.consumer_list

    def get_4D_storage_shape_for_shape(self, op_shape4D: Shape4D) -> Shape4D:
        rounding_quantum = full_shape(4, list(self.storage_rounding_quantum), 1)
        return Shape4D(shape_round_to_quantum(op_shape4D.as_list(), rounding_quantum))

    def addresses_for_rolling_buffer(
        self, start_coord: Shape, end_coord: Shape, strides: List[int], op_shape4D: Shape4D
    ) -> Tuple:
        # returns ( box_height0, box_height1, box_width, [address_tl, address_tr, address_bl, address_br] )

        if self.storage_shape == []:
            return (
                1,
                1,
                1,
                [self.address_for_coordinate(start_coord, strides, op_shape4D), 0, 0, 0],
            )

        if self.is_standard_fm:
            storage_shape_4D = self.get_4D_storage_shape_for_shape(op_shape4D)
        else:
            storage_shape_4D = Shape4D(self.storage_shape)

        crossing_y = numeric_util.round_up(start_coord[1] + 1, storage_shape_4D.height)
        crossing_x = numeric_util.round_up(start_coord[2] + 1, storage_shape_4D.width)

        crossing_y = min(crossing_y, end_coord[1])
        crossing_x = min(crossing_x, end_coord[2])

        box_height0 = crossing_y - start_coord[1]
        box_width = crossing_x - start_coord[2]

        addresses: List = [0] * 4
        addresses[0] = self.address_for_coordinate(start_coord, strides, op_shape4D)

        if end_coord[2] > crossing_x:
            addresses[1] = self.address_for_coordinate(
                [start_coord[0], start_coord[1], crossing_x, start_coord[3]], strides, op_shape4D
            )
            raise UnsupportedFeatureError("Striping in vertical direction is not supported")
        if end_coord[1] > crossing_y:
            addresses[2] = self.address_for_coordinate(
                [start_coord[0], crossing_y, start_coord[2], start_coord[3]], strides, op_shape4D
            )
        if end_coord[1] > crossing_y and end_coord[2] > crossing_x:
            addresses[3] = self.address_for_coordinate(
                [start_coord[0], crossing_y, crossing_x, start_coord[3]], strides, op_shape4D
            )

        # box_height1 equals box_height0 here, as vertical striping is not supported
        return box_height0, box_height0, box_width, addresses

    def get_strides(self, shape4D: Optional[Shape4D]) -> List[int]:

        augmented_shape = self.get_augmented_shape(shape4D)
        assert len(augmented_shape) == 5
        strides: List = [0] * len(augmented_shape)
        stride = self.element_size() * self.storage_compression_scale

        if self.format != TensorFormat.NHCWB16:
            stride_order = [4, 1, 3, 2, 0]
            for i in stride_order:
                strides[i] = stride
                stride *= augmented_shape[i]
        else:
            strides[4] = stride
            strides[3] = 16 * stride  # STRIDE_X
            strides[1] = strides[3] * augmented_shape[2]  # STRIDE_C
            strides[2] = augmented_shape[2] * augmented_shape[3] * stride  # STRIDE_Y
            strides[0] = strides[2] * augmented_shape[1]  # STRIDE_N

        return strides
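
    # Illustrative example: for an NHWC feature map of shape [1, 8, 8, 16] with
    # 1-byte elements, the augmented shape is [N, C, H, W, 1] = [1, 16, 8, 8, 1]
    # and the returned strides are [1024, 1, 128, 16, 1]; stepping one channel
    # moves 1 byte, one column 16 bytes and one row 128 bytes.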

    def get_augmented_shape(self, shape4D: Optional[Shape4D] = None) -> Optional[Shape]:

        if shape4D and self.is_standard_fm:
            augmented_shape = self.get_4D_storage_shape_for_shape(shape4D).as_list()
        else:
            augmented_shape = full_shape(4, self.storage_shape, 1)

        if self.format == TensorFormat.NHWC:
            augmented_shape = [augmented_shape[0], augmented_shape[3]] + augmented_shape[1:3] + [1]

        elif self.format == TensorFormat.NHCWB16:
            augmented_shape = augmented_shape[0:4] + [1]

            if augmented_shape[1] == 0:
                augmented_shape[1] = 1

        else:
            assert self.format in (TensorFormat.Unknown, TensorFormat.WeightsCompressed)
            return None

        return augmented_shape

    def get_augmented_coord(self, coord: Optional[Shape] = None) -> Optional[Shape]:
        if coord is None:
            coord = [0] * min(len(self.storage_shape), 4)

        missing_len = 4 - len(coord)
        augmented_coord = ([0] * missing_len) + coord

        if self.format == TensorFormat.NHWC:
            augmented_coord = [augmented_coord[0], augmented_coord[3]] + augmented_coord[1:3] + [0]

        elif self.format == TensorFormat.NHCWB16:
            channel_divisor = 16
            augmented_coord = (
                [augmented_coord[0], augmented_coord[3] // channel_divisor]
                + augmented_coord[1:3]
                + [augmented_coord[3] % channel_divisor]
            )
        else:
            assert self.format in (TensorFormat.Unknown, TensorFormat.WeightsCompressed)
            return None

        return augmented_coord
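
    # Illustrative example: in NHCWB16 format the channel index is split into a
    # 16-wide brick index and a remainder, so get_augmented_coord([0, 2, 3, 21])
    # returns [0, 21 // 16, 2, 3, 21 % 16] == [0, 1, 2, 3, 5].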

    def find_npu_op(self) -> Optional[Operation]:
        # Returns the first NPU operator that consumes this tensor, or None if there is none
        for op in self.consumers():
            if op.run_on_npu:
                return op
        return None

    def compressed_stream_index_from_coord(self, coord: Shape) -> int:
        assert self.format == TensorFormat.WeightsCompressed
        assert self.compressed_values is not None
        assert len(self.compressed_values) > 0
        assert len(self.compressed_values) + 1 == len(self.weight_compressed_offsets)

        depth = coord[-1]
        brick_depth = self.brick_size[-1]
        # Clamp position at final element index
        if depth > self.shape[-1]:
            depth = self.shape[-1]

        # Always round up to next boundary
        index = numeric_util.round_up_divide(depth, brick_depth)

        # Check boundaries on all but last weight set (which may be shorter
        # than the brick we divided it up into)
        if index < len(self.weight_compressed_offsets) - 1:
            # There are no half-way points in the weights
            if (depth % brick_depth) != 0:
                raise UnsupportedFeatureError("Offset into weights must be aligned to a brick")

        return index

    def size_of_compressed_stream(self, index: int) -> int:
        assert self.compressed_values is not None
        assert 0 <= index < len(self.compressed_values)
        return len(self.compressed_values[index])

    def is_last_index_in_compressed_stream(self, index: int) -> bool:
        assert self.compressed_values is not None
        assert 0 <= index < len(self.compressed_values)
        return index == len(self.compressed_values) - 1

    def address_for_coordinate(
        self,
        orig_coord: Shape,
        strides: Optional[List[int]] = None,
        op_shape4D: Optional[Shape4D] = None,
        is_top_box: bool = False,
    ) -> Optional[int]:

        address_offset = 0
        assert self.purpose != TensorPurpose.Weights

        # Strides may be passed as an argument, for example when creating feature maps as the strides may be modified
        # by the "ofm_stride_multiplier" operation attribute. If not, they are calculated here.
        if not strides:
            strides = self.get_strides(op_shape4D)

        coord = orig_coord
        if is_top_box:
            coord = [c - 1 for c in orig_coord]
            address_offset += 1 * strides[-1]  # one element

        if self.sub_purpose == TensorSubPurpose.Standard:
            shape = op_shape4D.as_list() if op_shape4D else self.shape
            for _coord, _shape in zip(coord, shape):
                assert _coord >= 0 and _coord < _shape

        if op_shape4D and self.is_standard_fm:
            storage_shape = self.get_4D_storage_shape_for_shape(op_shape4D).as_list()
            storage_size = self.storage_size_for_shape(storage_shape)
        else:
            storage_shape = self.storage_shape
            coord = coord[-len(storage_shape) :]
            storage_size = self.storage_size()

        # Handle wraparound for partial buffers. Make sure to do this after subtracting top box
        coord = [_coord % _shape for _coord, _shape in zip(coord, storage_shape)]

        augmented_coord = self.get_augmented_coord(coord)
        assert augmented_coord is not None

        address_offset += np.dot(augmented_coord, strides)

        assert address_offset >= 0 and address_offset <= storage_size
        return self.address + address_offset

    def is_allocated_in_tensor_arena(self, scratch_tensor_mem_area: MemArea) -> bool:
        return (self.mem_area == scratch_tensor_mem_area) and (self.mem_type in (MemType.Scratch, MemType.Scratch_fast))

    def equivalent(self, tens: "Tensor") -> bool:
        return self.equivalence_id == tens.equivalence_id

    def set_all_shapes(self, shape: Shape):
        self.shape = shape
        self.storage_shape = shape
        self.bandwidth_shape = shape

    def get_full_shape(self) -> Shape:
        d = len(self.shape)
        if d in (1, 3):
            return full_shape(4, self.shape, 1)
        elif d == 2:
            return [self.shape[0], 1, 1, self.shape[1]]
        else:
            return self.shape.copy()
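
    # Illustrative examples: a 3D shape [2, 2, 8] becomes [1, 2, 2, 8] and a 2D
    # shape [2, 8] becomes [2, 1, 1, 8]; 4D shapes are returned unchanged.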

    def is_quantized(self) -> bool:
        # a tensor is quantized if it has an integral type and it contains valid quantization params

        if not isinstance(self.quantization, QuantizationParameters):
            return False

        return (self.dtype.type & BaseType.Int) != 0 and self.quantization.is_valid()

    def get_scalar(self):
        """
        :return: Unquantized or dequantized scalar value
        :rtype: self.dtype (if unquantized) or float (if dequantized)
        """
        assert self.values.size == 1, "get_scalar called on non-scalar tensor"
        if self.is_quantized():
            return self.quantization.dequantize(self.values).item(0)
        else:
            return self.values.item(0)

    def get_shape_as_2d(self, dimension_2_size: int) -> Optional[Shape4D]:

        elms = self.elements()
        dimension_1_size = elms // dimension_2_size
        # Checks that the reduction works and that the shape is not 1D
        is_reducible = dimension_1_size * dimension_2_size == elms and not (len(self.shape) == 1)

        new_shape = None
        if is_reducible:
            new_shape = Shape4D([dimension_1_size, 1, 1, dimension_2_size])

        return new_shape
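
    # Illustrative example: a [2, 3, 4] tensor (24 elements) reshaped with
    # dimension_2_size == 4 yields Shape4D([6, 1, 1, 4]); if the element count
    # is not divisible by dimension_2_size, None is returned.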

    def __lt__(self, other: "Tensor") -> bool:
        return self.equivalence_id < other.equivalence_id

    def __str__(self):
        return "<nng.Tensor '%s' shape=%s dtype=%s>" % (self.name, self.shape, self.dtype)

    __repr__ = __str__

    def error(self, msg):
        """
        Raises a VelaError exception for errors encountered when parsing a Tensor

        :param self: Tensor object that resulted in the error
        :param msg: str object that contains a description of the specific error encountered
        """

        def _print_operators(ops):
            lines = []
            for idx, op in enumerate(ops):
                op_type = getattr(op, "type", "Not an Operation")
                op_id = getattr(op, "op_index", "-")
                lines.append(f"        {idx} = {op_type} ({op_id})")
            return lines

        lines = [f"Invalid {self.name} tensor. {msg}"]

        lines += ["    Driving operators:"]
        lines += _print_operators(self.ops)

        lines += ["    Consuming operators:"]
        lines += _print_operators(self.consumer_list)

        raise VelaError("\n".join(lines))


def check_quantized_tens_scaling_equal(tens_a: Tensor, tens_b: Tensor) -> bool:
    # checks that the scaling of two quantized tensors is equal
    return tens_a.is_quantized() and tens_b.is_quantized() and tens_a.quantization.is_scaling_equal(tens_b.quantization)
Tim Hall89567612020-10-27 11:57:57 +0000929 return tens_a.is_quantized() and tens_b.is_quantized() and tens_a.quantization.is_scaling_equal(tens_b.quantization)