# SPDX-FileCopyrightText: Copyright 2020-2023 Arm Limited and/or its affiliates <open-source-office@arm.com>
#
# SPDX-License-Identifier: Apache-2.0
#
# Licensed under the Apache License, Version 2.0 (the License); you may
# not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an AS IS BASIS, WITHOUT
# WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#
# Description:
# Internal representation of a Neural Network Tensor.
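# Also defines QuantizationParameters plus the enums that describe a tensor's
# memory placement (MemArea, MemType), purpose (TensorPurpose) and data layout
# (TensorFormat).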
import copy
import enum
import uuid
from collections import defaultdict
from enum import auto
from functools import lru_cache
from functools import total_ordering
from typing import Dict
from typing import List
from typing import Optional
from typing import Tuple
from typing import Union
from uuid import UUID

import numpy as np

from . import numeric_util
from .data_type import BaseType
from .data_type import DataType
from .errors import UnsupportedFeatureError
from .errors import VelaError
from .numeric_util import full_shape
from .operation import Op
from .operation import Operation
from .shape4d import Shape4D

Shape = List


class MemType(enum.IntFlag):
    Unknown = 0
    Permanent_NPU = 1
    Permanent_CPU = 2
    Scratch = 3
    Scratch_fast = 4
    Size = Scratch_fast + 1

    def display_name(self) -> str:
        return ("Unknown", "Permanent_NPU", "Permanent_CPU", "Scratch", "Scratch_fast", "Size")[self.value]

    def identifier_name(self) -> str:
        return ("unknown", "permanent_npu", "permanent_cpu", "scratch", "scratch_fast", "size")[self.value]

    @staticmethod
    def all():
        return (MemType.Permanent_NPU, MemType.Permanent_CPU, MemType.Scratch, MemType.Scratch_fast)

    def __str__(self):
        return self.name


class BandwidthDirection(enum.IntEnum):
    Read = 0
    Write = auto()
    Size = auto()

    def display_name(self):
        return self.name

    def identifier_name(self):
        return self.name.lower()

    @staticmethod
    def all():
        return (BandwidthDirection.Read, BandwidthDirection.Write)


class MemArea(enum.IntFlag):
    Unknown = 0
    Sram = 1
    Dram = 2
    OnChipFlash = 3
    OffChipFlash = 4
    Shram = 5  # for LUT
    Size = Shram + 1

    def display_name(self) -> str:
        return ("Unknown", "SRAM", "DRAM", "On-chip Flash", "Off-chip Flash", "SHRAM", "Size")[self.value]

    def identifier_name(self) -> str:
        return ("unknown", "sram", "dram", "on_chip_flash", "off_chip_flash", "shram", "size")[self.value]

    @staticmethod
    def all():
        return (MemArea.Sram, MemArea.Dram, MemArea.OnChipFlash, MemArea.OffChipFlash, MemArea.Shram)

    def __str__(self):
        return self.name


class TensorPurpose(enum.IntFlag):
    Unknown = 0
    Weights = 1
    FeatureMap = 2
    Scratch = 3
    ScratchFast = 4
    LUT = 5
    FSBias = 6
    Virtual = 7
    Size = 8

    def display_name(self) -> str:
        # Note: "Virtual" was missing here even though TensorPurpose.Virtual exists, which
        # made Virtual display as "Size" and Size raise an IndexError
        return (
            "Unknown", "Weights", "FeatureMap", "Scratch", "ScratchFast", "LUT", "FastStorageBias", "Virtual", "Size"
        )[self.value]

    def identifier_name(self) -> str:
        return (
            "unknown", "weights", "feature_map", "scratch", "scratch_fast", "lut", "fast_storage_bias", "virtual", "size"
        )[self.value]

    @staticmethod
    def all():
        return (TensorPurpose.Weights, TensorPurpose.FeatureMap, TensorPurpose.FSBias)


class TensorSubPurpose(enum.Enum):
    Standard = 0
    DoubleBuffer = 1
    RollingBufferX = 2
    RollingBufferY = 3
    RollingBufferXY = 4

    def display_name(self) -> str:
        return ("Standard", "Double Buffer", "Rolling Buffer X", "Rolling Buffer Y", "Rolling Buffer XY")[self.value]

    def identifier_name(self) -> str:
        return ("standard", "double_buffer", "rolling_buffer_x", "rolling_buffer_y", "rolling_buffer_xy")[self.value]

    @staticmethod
    def all():
        return (
            TensorSubPurpose.Standard,
            TensorSubPurpose.DoubleBuffer,
            TensorSubPurpose.RollingBufferX,
            TensorSubPurpose.RollingBufferY,
            TensorSubPurpose.RollingBufferXY,
        )


class TensorFormat(enum.Flag):
    Unknown = 0
    WeightsCompressed = 1
    NHWC = 2
    NHCWB16 = 3

    def __str__(self):
        return self.name


class TensorBlockTraversal(enum.Enum):
    Default = 0
    DepthWise = 1
    DepthFirst = 2
    PartKernelFirst = 3


def shape_num_elements(shp: Shape) -> Optional[int]:
    elems = 1
    if shp is None:
        return None
    for d in shp:
        if d is None:
            return None
        elems *= d
    return elems


def shape_fully_defined(shp: Shape) -> bool:
    if shp is None:
        return False
    for d in shp:
        if d is None:
            return False
    return True


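# Example (illustrative): shape_round_to_quantum([1, 7, 7, 31], (1, 1, 1, 16)) -> [1, 7, 7, 32]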
def shape_round_to_quantum(shp: Shape, quantum: Tuple) -> Shape:
    new_shp = list(shp)

    # Traverse backwards using length of shape since there may be more rounding quantums than shape elements
    for i in range(-1, -len(shp) - 1, -1):
        if new_shp[i] is not None:
            new_shp[i] = numeric_util.round_up(new_shp[i], quantum[i])
    return new_shp


@lru_cache(maxsize=None)
def create_equivalence_id(key) -> UUID:
    # Generates equivalence_id based on the given key.
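    # The unbounded lru_cache memoises the result per key: repeated calls with
    # the same key return the same UUID, while different keys get fresh random
    # ids. Tensors created independently from identical source data can
    # therefore end up sharing an equivalence id.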
209 return uuid.uuid4()
210
211
class QuantizationParameters:
    __slots__ = (
        "min",
        "max",
        "num_bits",
        "narrow_range",
        "scale_f32",
        "zero_point",
        "quant_min",
        "quant_max",
        "quant_dim",
    )

    def __init__(
        self,
        min: Union[float, np.ndarray, None] = None,
        max: Union[float, np.ndarray, None] = None,
        num_bits=None,
        narrow_range=None,
        scale_f32: Union[float, np.ndarray, None] = None,
        zero_point: Union[int, np.ndarray, None] = None,
    ):
        self.min = min
        self.max = max

        self.num_bits = num_bits
        self.narrow_range = narrow_range

        self.scale_f32: Union[float, np.ndarray, None] = scale_f32
        self.zero_point: Union[int, np.ndarray, None] = zero_point
        self.quant_min: Optional[float] = None
        self.quant_max: Optional[float] = None
        self.quant_dim: Optional[int] = None

    def __str__(self):
        return (
            f"<nng.QuantizationParameters min={self.min}, max={self.max}, num_bits={self.num_bits}, "
            f"scale={self.scale_f32}, zero_point={self.zero_point}>"
        )

    __repr__ = __str__

    def clone(self) -> "QuantizationParameters":
        res = QuantizationParameters()
        res.min = self.min
        res.max = self.max

        res.num_bits = self.num_bits
        res.narrow_range = self.narrow_range

        res.scale_f32 = self.scale_f32
        res.zero_point = self.zero_point
        res.quant_min = self.quant_min
        res.quant_max = self.quant_max
        res.quant_dim = self.quant_dim
        return res

    def dequantize(self, values) -> np.ndarray:
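        # Affine dequantisation: real_value = (quantized_value - zero_point) * scale_f32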
        return np.subtract(values, self.zero_point) * self.scale_f32

    def is_scaling_equal(self, other: Optional["QuantizationParameters"]) -> bool:
        """
        Returns True if the scale and zero point of self and other are equal. If other is None then the scaling is
        not considered equal because the tensor is assumed to not be quantised and False will be returned
        """

        if not isinstance(other, QuantizationParameters):
            return False

        return self.scale_f32 == other.scale_f32 and self.zero_point == other.zero_point

    def is_valid(self) -> bool:
        """Return True if the quantisation parameters have a scale and zero point"""

        return self.scale_f32 is not None and self.zero_point is not None

    def is_per_axis(self) -> bool:
        """Returns True if either the scale, zero point, minimum or maximum values have more than one value"""

        for attr in ("scale_f32", "zero_point", "min", "max"):
            if np.size(getattr(self, attr)) > 1:
                return True
        return False

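# Example (illustrative, values are hypothetical): per-tensor int8 affine quantisation
#   q = QuantizationParameters(scale_f32=0.05, zero_point=-128)
#   q.dequantize(np.array([-128, 0, 127]))  # -> array([0., 6.4, 12.75])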


def create_virtual_tensor(
    name: str,
):
    virtual_tensor = Tensor([], DataType.int8, name)
    virtual_tensor.purpose = TensorPurpose.Virtual
    return virtual_tensor


def create_const_tensor(
    name: str,
    shape: Shape,
    dtype: DataType,  # datatype of the tensor
    values: Optional[Union[np.ndarray, list]],  # list-like data of some type, or scalar (skip mypy), or None
    purpose: TensorPurpose = TensorPurpose.Unknown,
    quantization: Optional[QuantizationParameters] = None,
):
    assert isinstance(dtype, DataType)

    # Tensor
    const_tensor = Tensor(shape, dtype, name + "_0")
    const_tensor.purpose = purpose
    const_tensor.quantization = quantization

    # if the tensor datatype does not match that of the values then np.array() will perform a cast operation. this can
    # result in undefined behaviour if casting from a numpy float to a numpy unsigned integer. therefore, we need to
    # avoid this undefined behaviour by converting the numpy floats to python floats as these give the desired
    # behaviour when casting to unsigned integers
    if (
        values is not None
        and shape != []  # values are not a scalar
        and isinstance(values[0], np.floating)
        and dtype.type == BaseType.Unsigned
    ):
        values = [float(v) for v in values]

    const_tensor.values = np.array(values).astype(dtype.as_numpy_type())
    # Operator
    const_op = Operation(Op.Const, name)
    const_op.set_output_tensor(const_tensor)
    const_op.set_ifm_ofm_shapes()
    return const_tensor

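# Example (illustrative, names are hypothetical): a small quantised int8 constant
#   quant = QuantizationParameters(scale_f32=0.1, zero_point=0)
#   tens = create_const_tensor("offsets", [1, 1, 1, 4], DataType.int8, [1, 2, 3, 4], quantization=quant)
#   tens.is_const  # -> True: a Const operation now drives the tensor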

# class that keeps track of all tensor addresses in the different memory types
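# Addresses are keyed on equivalence_id rather than on the tensor object itself,
# so equivalent tensors (e.g. clones that keep their equivalence_id) resolve to
# the same address within a given memory type.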
341class TensorAddressMap:
Louis Verhaard93719a92020-12-08 10:02:31 +0100342 address_map: Dict = defaultdict(dict) # dict (tens.equivalence_id -> dict (mem_type -> address))
Jacob Bohlin1a666972020-09-11 10:04:15 +0200343
344 @classmethod
Louis Verhaard93719a92020-12-08 10:02:31 +0100345 def get_address_for_tens(cls, tens_id: UUID, mem_type: MemType) -> int:
Jacob Bohlin1a666972020-09-11 10:04:15 +0200346 return cls.address_map[tens_id].get(mem_type)
347
348 @classmethod
Louis Verhaard93719a92020-12-08 10:02:31 +0100349 def set_address_for_tens(cls, tens_id: UUID, mem_type: MemType, address: int):
Jacob Bohlin1a666972020-09-11 10:04:15 +0200350 # Check previous address if there is one
351 previous_address = cls.address_map[tens_id].get(mem_type)
Louis Verhaard0b9c9a32020-09-15 14:05:38 +0200352 if address is not None and previous_address is not None:
Jacob Bohlin1a666972020-09-11 10:04:15 +0200353 assert previous_address == address, "Two different addresses cannot be assigned to the same tensor."
354
355 # Set tensor's address for memory type
356 cls.address_map[tens_id][mem_type] = address
357
358
@total_ordering
class Tensor:
    __slots__ = (
        "shape",
        "_original_shape",
        "storage_shape",
        "bandwidth_shape",
        "dtype",
        "name",
        "is_variable",
        "pre_buffer",
        "ops",
        "consumer_list",
        "values",
        "compressed_values",
        "compressed_values_substream_offsets",
        "mem_area",
        "mem_type",
        "format",
        "purpose",
        "sub_purpose",
        "alignment",
        "weight_transpose_depthwise",
        "storage_compression_scale",
        "bandwidth_compression_scale",
        "compression_scale_for_worst_weight_stream",
        "weight_compression_scales",
        "weight_compression_config",
        "value_id",
        "storage_rounding_quantum",
        "brick_size",
        "quantization",
        "weight_compressed_offsets",
        "element_size_bytes",
        "block_traversal",
        "equivalence_id",
        "src_tensor",
        "force_linear_format",
        "ifm_write_protected",
    )
    AllocationQuantum = 16

    def __init__(self, shape: Shape, dtype: DataType, name: str):
        self.shape = shape
        self._original_shape = shape
        self.storage_shape = shape
        self.bandwidth_shape = shape
        self.dtype = dtype
        self.name = name
        self.is_variable = False
        self.pre_buffer = False
        self.equivalence_id: UUID = uuid.uuid4()

        self.ops: List[Operation] = []
        self.consumer_list: List[Operation] = []

        self.values: Optional[np.ndarray] = None  # elements are of type self.dtype
        self.compressed_values: Optional[np.ndarray] = None
        self.compressed_values_substream_offsets: Optional[List] = None
        self.mem_area: MemArea = MemArea.Unknown
        self.mem_type: MemType = MemType.Unknown
        self.format: TensorFormat = TensorFormat.Unknown
        self.purpose: TensorPurpose = TensorPurpose.Unknown
        self.sub_purpose: TensorSubPurpose = TensorSubPurpose.Standard
        self.alignment: int = Tensor.AllocationQuantum
        self.weight_transpose_depthwise: bool = False

        self.storage_compression_scale: float = 1.0
        self.bandwidth_compression_scale: float = 1.0
        self.compression_scale_for_worst_weight_stream: float = 1.0
        self.weight_compression_scales: Optional[np.ndarray] = None
        # if two tensors have the same weight_compression_config, then they have the same compressed values
        self.weight_compression_config = None
        # if two tensors have the same value_id, then they have the same values
        self.value_id: UUID = uuid.uuid4()
        self.weight_compressed_offsets: List = []
        self.storage_rounding_quantum: Tuple = (1, 1, 1, 1)
        self.brick_size: Tuple = (1, 1, 1, 1)
        self.element_size_bytes: int = 0

        # quantization parameters
        self.quantization: Optional[QuantizationParameters] = None
        self.block_traversal: TensorBlockTraversal = TensorBlockTraversal.Default

        # Keep track of whether the linear format should be enforced
        self.force_linear_format: Optional[bool] = None
        self.ifm_write_protected = False

        # Reference to parent-tensor if this tensor is a clone
        self.src_tensor: Optional[Tensor] = None

    @property
    def use_linear_format(self) -> bool:
        """Return whether the tensor should use linear format or not."""
        return self.force_linear_format in (True, None)

    @property
    def original_shape(self):
        return self._original_shape

    @property
    def address(self) -> int:
        return TensorAddressMap.get_address_for_tens(self.equivalence_id, self.mem_type)

    @address.setter
    def address(self, address: int):
        TensorAddressMap.set_address_for_tens(self.equivalence_id, self.mem_type, address)

    @property
    def is_standard_fm(self) -> bool:
        return self.sub_purpose == TensorSubPurpose.Standard and self.purpose == TensorPurpose.FeatureMap

    @property
    def is_const(self) -> bool:
        return self.ops != [] and self.ops[0].type == Op.Const

    @property
    def is_scalar(self) -> bool:
        return self.shape == [] and self.elements() == 1

    def is_broadcast(self, ofm) -> bool:
        return self.shape != ofm.shape

    def element_size(self) -> int:
        if self.element_size_bytes == 0:
            return self.dtype.size_in_bits() // 8
        return self.element_size_bytes

    # Returns a copy, renamed to self.name + suffix
    # The references to Operators will be empty when returned
    # The copy is shallow, but storage/bandwidth shapes and quantization are copied
    # For set_unique==True, a new equivalence_id will be set
    def clone(self, suffix="_clone", set_unique: bool = False) -> "Tensor":
        res = copy.copy(self)
        if set_unique:
            res.equivalence_id = uuid.uuid4()
        res.storage_shape = list(self.storage_shape)
        res.bandwidth_shape = list(self.bandwidth_shape)
        if self.quantization is not None:
            res.quantization = self.quantization.clone()

        res.name = res.name + suffix
        res.ops = []
        res.consumer_list = []
        res.src_tensor = self

        return res

    def clone_into_shram(self, arch) -> "Tensor":
        res = self.clone(suffix="_shram")
        res.mem_area = MemArea.Shram
        res.src_tensor = self
        return res

    def as_1D(self):
        self.shape = [np.prod(self.shape)]
        if self.values is not None:
            self.values = self.values.reshape(self.shape)

    def transpose(self, reorder):
        self.shape = [self.shape[idx] for idx in reorder]
        self._original_shape = [self._original_shape[idx] for idx in reorder]
        if self.values is not None:
            self.values = self.values.transpose(reorder)

    def copy_compressed_weight_info(self, src_tens: "Tensor"):
        # Copies compressed values + all related weight compression info from the given tensor
        self.equivalence_id = src_tens.equivalence_id
        self.compressed_values = src_tens.compressed_values
        self.compressed_values_substream_offsets = src_tens.compressed_values_substream_offsets
        self.storage_shape = src_tens.storage_shape
        self.brick_size = src_tens.brick_size
        self.weight_compression_scales = src_tens.weight_compression_scales
        self.weight_compressed_offsets = src_tens.weight_compressed_offsets
        self.weight_transpose_depthwise = src_tens.weight_transpose_depthwise
        self.compression_scale_for_worst_weight_stream = src_tens.compression_scale_for_worst_weight_stream
        self.storage_compression_scale = src_tens.storage_compression_scale
        self.bandwidth_compression_scale = src_tens.bandwidth_compression_scale
        self.block_traversal = src_tens.block_traversal
        self.weight_compression_config = src_tens.weight_compression_config
        self.value_id = src_tens.value_id

    def set_format(self, fmt: TensorFormat, arch):
        self.format = fmt
        shape_len = 0
        try:
            shape_len = len(self.shape)
        except TypeError:
            pass

        if shape_len > 4:
            return
        assert not (self.use_linear_format and fmt == TensorFormat.NHCWB16)
        self.storage_rounding_quantum = arch.storage_rounding_quantums[self.format]
        self.storage_rounding_quantum = tuple(self.storage_rounding_quantum[-shape_len:])
        self.brick_size = arch.brick_sizes[self.format]
        self.brick_size = tuple(self.brick_size[-shape_len:])
        if self.shape is None:
            return

        self.bandwidth_shape = shape_round_to_quantum(self.shape, self.brick_size)
        self.storage_shape = shape_round_to_quantum(self.shape, self.storage_rounding_quantum)

        if fmt == TensorFormat.WeightsCompressed:
            compression_ratio = 5 / 8
            self.storage_compression_scale = compression_ratio
            self.bandwidth_compression_scale = compression_ratio
            self.compression_scale_for_worst_weight_stream = compression_ratio

    def storage_elements(self) -> int:
        elems = shape_num_elements(self.storage_shape)
        if elems is None:
            return 0
        return elems

    def elements(self) -> int:
        elems = shape_num_elements(self.shape)
        if elems is None:
            return 0
        return elems

    def has_fully_defined_shape(self) -> bool:
        return shape_fully_defined(self.shape)

    def storage_size(self, scale: float = 1.0) -> int:
        raw_size = self.storage_elements() * self.element_size() * scale
        if raw_size == 0:
            raw_size = 1  # force it to take up space
        rounded_size = numeric_util.round_up(numeric_util.round_up_to_int(raw_size), self.alignment)
        return rounded_size

    def storage_size_for_shape(self, op_storage_shape: Shape) -> int:
        elems = shape_num_elements(op_storage_shape)
        elems = elems if elems else 0
        raw_size = elems * self.element_size()
        if raw_size == 0:
            raw_size = 1  # force it to take up space
        rounded_size = numeric_util.round_up(numeric_util.round_up_to_int(raw_size), self.alignment)
        return rounded_size

    def storage_shape_for_sub_purpose(
        self, sub_purpose: TensorSubPurpose, param_a: Optional[int], param_b: Optional[int]
    ) -> Shape:
        if sub_purpose == TensorSubPurpose.DoubleBuffer:
            shp = list(self.shape)
            assert len(shp) >= 2
            assert param_a is not None
            shp[-1] = min(shp[-1], param_a * 2)
        else:
            shp = full_shape(4, self.storage_shape, 1)
            if sub_purpose == TensorSubPurpose.RollingBufferX:
                assert len(shp) == 4
                assert param_a is not None
                shp[0] = 1
                shp[2] = min(shp[2], param_a)
            elif sub_purpose == TensorSubPurpose.RollingBufferY:
                assert len(shp) == 4
                assert param_a is not None
                shp[0] = 1
                shp[1] = min(shp[1], param_a)
            elif sub_purpose == TensorSubPurpose.RollingBufferXY:
                assert len(shp) == 4
                assert param_a is not None
                assert param_b is not None
                shp[0] = 1
                shp[2] = min(shp[2], param_a)
                shp[1] = min(shp[1], param_b)
            elif sub_purpose == TensorSubPurpose.Standard:
                pass
            else:
                assert 0, "did not expect new sub purpose %s" % (sub_purpose,)

        return shp

    def set_new_sub_purpose(self, sub_purpose: TensorSubPurpose, param_a=None, param_b=None):
        self.storage_shape = self.storage_shape_for_sub_purpose(sub_purpose, param_a, param_b)
        self.sub_purpose = sub_purpose
        if sub_purpose == TensorSubPurpose.DoubleBuffer:
            self.storage_compression_scale = self.compression_scale_for_worst_weight_stream

    def bandwidth(self) -> float:
        elems = shape_num_elements(self.bandwidth_shape)
        if elems is None:
            return 0
        return elems * self.element_size() * self.bandwidth_compression_scale

    def consumers(self) -> List[Operation]:
        return self.consumer_list

    def get_4D_storage_shape_for_shape(self, op_shape4D: Shape4D) -> Shape4D:
        rounding_quantum = full_shape(4, list(self.storage_rounding_quantum), 1)
        return Shape4D(shape_round_to_quantum(op_shape4D.as_list(), rounding_quantum))

    def addresses_for_rolling_buffer(
        self, start_coord: Shape, end_coord: Shape, strides: List[int], op_shape4D: Shape4D
    ) -> Tuple:
        # returns ( box_height0, box_height1, box_width, [address_tl, address_tr, address_bl, address_br] )

        if self.storage_shape == []:
            return (
                1,
                1,
                1,
                [self.address_for_coordinate(start_coord, strides, op_shape4D), 0, 0, 0],
            )

        if self.is_standard_fm:
            storage_shape_4D = self.get_4D_storage_shape_for_shape(op_shape4D)
        else:
            storage_shape_4D = Shape4D(self.storage_shape)

        crossing_y = numeric_util.round_up(start_coord[1] + 1, storage_shape_4D.height)
        crossing_x = numeric_util.round_up(start_coord[2] + 1, storage_shape_4D.width)

        crossing_y = min(crossing_y, end_coord[1])
        crossing_x = min(crossing_x, end_coord[2])

        box_height0 = crossing_y - start_coord[1]
        box_width = crossing_x - start_coord[2]

        addresses: List = [0] * 4
        addresses[0] = self.address_for_coordinate(start_coord, strides, op_shape4D)

        if end_coord[2] > crossing_x:
            addresses[1] = self.address_for_coordinate(
                [start_coord[0], start_coord[1], crossing_x, start_coord[3]], strides, op_shape4D
            )
            raise UnsupportedFeatureError("Striping in vertical direction is not supported")
        if end_coord[1] > crossing_y:
            addresses[2] = self.address_for_coordinate(
                [start_coord[0], crossing_y, start_coord[2], start_coord[3]], strides, op_shape4D
            )
        if end_coord[1] > crossing_y and end_coord[2] > crossing_x:
            addresses[3] = self.address_for_coordinate(
                [start_coord[0], crossing_y, crossing_x, start_coord[3]], strides, op_shape4D
            )

        return box_height0, box_height0, box_width, addresses

    def get_strides(self, shape4D: Optional[Shape4D]) -> List[int]:

        augmented_shape = self.get_augmented_shape(shape4D)
        assert len(augmented_shape) == 5
        strides: List = [0] * len(augmented_shape)
        stride = self.element_size() * self.storage_compression_scale

        if self.format != TensorFormat.NHCWB16:
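            # Linear (NHWC) case: the augmented shape is [N, C, H, W, 1] (see
            # get_augmented_shape), so accumulating strides innermost-first
            # yields an N, H, W, C element order in memory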
            stride_order = [4, 1, 3, 2, 0]
            for i in stride_order:
                strides[i] = stride
                stride *= augmented_shape[i]
        else:
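            # Brick (NHCWB16) case: channels are stored in bricks of 16, and an
            # augmented coordinate is [N, C // 16, H, W, C % 16] (see
            # get_augmented_coord), hence the 16-element X stride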
            strides[4] = stride
            strides[3] = 16 * stride  # STRIDE_X
            strides[1] = strides[3] * augmented_shape[2]  # STRIDE_C
            strides[2] = augmented_shape[2] * augmented_shape[3] * stride  # STRIDE_Y
            strides[0] = strides[2] * augmented_shape[1]  # STRIDE_N

        return strides

    def get_augmented_shape(self, shape4D: Optional[Shape4D] = None) -> Optional[Shape]:

        if shape4D and self.is_standard_fm:
            augmented_shape = self.get_4D_storage_shape_for_shape(shape4D).as_list()
        else:
            augmented_shape = full_shape(4, self.storage_shape, 1)

        if self.format == TensorFormat.NHWC:
            augmented_shape = [augmented_shape[0], augmented_shape[3]] + augmented_shape[1:3] + [1]

        elif self.format == TensorFormat.NHCWB16:
            augmented_shape = augmented_shape[0:4] + [1]

            if augmented_shape[1] == 0:
                augmented_shape[1] = 1

        else:
            assert self.format in (TensorFormat.Unknown, TensorFormat.WeightsCompressed)
            return None

        return augmented_shape

    def get_augmented_coord(self, coord: Optional[Shape] = None) -> Optional[Shape]:
        if coord is None:
            coord = [0] * min(len(self.storage_shape), 4)

        missing_len = 4 - len(coord)
        augmented_coord = ([0] * missing_len) + coord

        if self.format == TensorFormat.NHWC:
            augmented_coord = [augmented_coord[0], augmented_coord[3]] + augmented_coord[1:3] + [0]

        elif self.format == TensorFormat.NHCWB16:
            channel_divisor = 16
            augmented_coord = (
                [augmented_coord[0], augmented_coord[3] // channel_divisor]
                + augmented_coord[1:3]
                + [augmented_coord[3] % channel_divisor]
            )
        else:
            assert self.format in (TensorFormat.Unknown, TensorFormat.WeightsCompressed)
            return None

        return augmented_coord

    def find_npu_op(self) -> Optional[Operation]:
        # Returns the NPU operator that uses this tensor
        for op in self.consumers():
            if op.run_on_npu:
                return op
        return None

    def compressed_stream_index_from_coord(self, coord: Shape) -> int:
        assert self.format == TensorFormat.WeightsCompressed
        assert self.compressed_values is not None
        assert len(self.compressed_values) > 0
        assert len(self.compressed_values) + 1 == len(self.weight_compressed_offsets)

        depth = coord[-1]
        brick_depth = self.brick_size[-1]
        # Clamp position at final element index
        if depth > self.shape[-1]:
            depth = self.shape[-1]

        # Always round up to next boundary
        index = numeric_util.round_up_divide(depth, brick_depth)

        # Check boundaries on all but last weight set (which may be shorter
        # than the brick we divided it up into)
        if index < len(self.weight_compressed_offsets) - 1:
            # There are no half-way points in the weights
            if (depth % brick_depth) != 0:
                raise UnsupportedFeatureError("Offset into weights must be aligned to a brick")

        return index

    def size_of_compressed_stream(self, index: int) -> int:
        assert self.compressed_values is not None
        assert 0 <= index < len(self.compressed_values)
        return len(self.compressed_values[index])

    def is_last_index_in_compressed_stream(self, index: int) -> bool:
        assert self.compressed_values is not None
        assert 0 <= index < len(self.compressed_values)
        return index == len(self.compressed_values) - 1

    def address_for_coordinate(
        self,
        orig_coord: Shape,
        strides: Optional[List[int]] = None,
        op_shape4D: Optional[Shape4D] = None,
        is_top_box: bool = False,
    ) -> Optional[int]:

        address_offset = 0
        assert self.purpose != TensorPurpose.Weights

        # Strides may be passed as an argument, for example when creating feature maps as the strides may be modified
        # by the "ofm_stride_multiplier" operation attribute. If not, they are calculated here.
        if not strides:
            strides = self.get_strides(op_shape4D)

        coord = orig_coord
        if is_top_box:
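            # A top box coordinate is exclusive: address the last element inside
            # the box, then add one element size back onto the offset below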
            coord = [c - 1 for c in orig_coord]
            address_offset += 1 * strides[-1]  # one element

        if self.sub_purpose == TensorSubPurpose.Standard:
            shape = op_shape4D.as_list() if op_shape4D else self.shape
            for _coord, _shape in zip(coord, shape):
                assert _coord >= 0 and _coord < _shape

        if op_shape4D and self.is_standard_fm:
            storage_shape = self.get_4D_storage_shape_for_shape(op_shape4D).as_list()
            storage_size = self.storage_size_for_shape(storage_shape)
        else:
            storage_shape = self.storage_shape
            coord = coord[-len(storage_shape) :]
            storage_size = self.storage_size()

        # Handle wraparound for partial buffers. Make sure to do this after subtracting top box
        coord = [_coord % _shape for _coord, _shape in zip(coord, storage_shape)]

        augmented_coord = self.get_augmented_coord(coord)
        assert augmented_coord is not None

        address_offset += np.dot(augmented_coord, strides)

        assert address_offset >= 0 and address_offset <= storage_size
        return self.address + address_offset

    def is_allocated_in_tensor_arena(self, scratch_tensor_mem_area: MemArea) -> bool:
        return (self.mem_area == scratch_tensor_mem_area) and (self.mem_type in (MemType.Scratch, MemType.Scratch_fast))

    def equivalent(self, tens: "Tensor") -> bool:
        return self.equivalence_id == tens.equivalence_id

    def set_all_shapes(self, shape: Shape):
        self.shape = shape
        self.storage_shape = shape
        self.bandwidth_shape = shape

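    # Pads the shape out to 4D: 1D and 3D shapes are left-padded with ones, a
    # 2D shape [A, B] becomes [A, 1, 1, B], and 4D shapes are returned as a copy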
    def get_full_shape(self) -> Shape:
        d = len(self.shape)
        if d in (1, 3):
            return full_shape(4, self.shape, 1)
        elif d == 2:
            return [self.shape[0], 1, 1, self.shape[1]]
        else:
            return self.shape.copy()

    def is_quantized(self) -> bool:
        # a tensor is quantized if it has an integral type and it contains valid quantization params

        if not isinstance(self.quantization, QuantizationParameters):
            return False

        return (self.dtype.type & BaseType.Int) != 0 and self.quantization.is_valid()

    def get_scalar(self):
        """
        return: Unquantized or dequantized scalar value
        rtype: self.dtype (if unquantized) or float (if dequantized)
        """
        assert self.values.size == 1, "get_scalar called on non-scalar tensor"
        if self.is_quantized():
            return self.quantization.dequantize(self.values).item(0)
        else:
            return self.values.item(0)

    def get_shape_as_2d(self, dimension_2_size: int) -> Optional[Shape4D]:

        elms = self.elements()
        dimension_1_size = elms // dimension_2_size
        # Checks if the reduction works and shape is not 1D
        is_reducible = dimension_1_size * dimension_2_size == elms and not (len(self.shape) == 1)

        new_shape = None
        if is_reducible:
            new_shape = Shape4D([dimension_1_size, 1, 1, dimension_2_size])

        return new_shape

    def __lt__(self, other: "Tensor") -> bool:
        return self.equivalence_id < other.equivalence_id

    def __str__(self):
        return "<nng.Tensor '%s' shape=%s dtype=%s>" % (self.name, self.shape, self.dtype)

    __repr__ = __str__

    def error(self, msg):
        """
        Raises a VelaError exception for errors encountered when parsing a Tensor

        :param self: Tensor object that resulted in the error
        :param msg: str object that contains a description of the specific error encountered
        """

        def _print_operators(ops):
            lines = []
            for idx, op in enumerate(ops):
                op_type = getattr(op, "type", "Not an Operation")
                op_id = getattr(op, "op_index", "-")
                lines.append(f"        {idx} = {op_type} ({op_id})")
            return lines

        lines = [f"Invalid {self.name} tensor. {msg}"]

        lines += ["    Driving operators:"]
        lines += _print_operators(self.ops)

        lines += ["    Consuming operators:"]
        lines += _print_operators(self.consumer_list)

        raise VelaError("\n".join(lines))


def check_quantized_tens_scaling_equal(tens_a: Tensor, tens_b: Tensor) -> bool:
    # checks that the scaling of two quantized tensors are equal

    return tens_a.is_quantized() and tens_b.is_quantized() and tens_a.quantization.is_scaling_equal(tens_b.quantization)