Blame - ethosu/vela/architecture_features.py - ml/ethos-u/ethos-u-vela

2020-04-27 18:20:16 +0100

[diff] [blame]

2

#

3

# SPDX-License-Identifier: Apache-2.0

4

#

5

# Licensed under the Apache License, Version 2.0 (the License); you may

6

# not use this file except in compliance with the License.

7

# You may obtain a copy of the License at

8

#

9

# www.apache.org/licenses/LICENSE-2.0

10

#

11

# Unless required by applicable law or agreed to in writing, software

12

# distributed under the License is distributed on an AS IS BASIS, WITHOUT

13

# WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.

14

# See the License for the specific language governing permissions and

15

# limitations under the License.

Rickard Bolin

bc6ee58

2022-11-04 08:24:29 +0000

[diff] [blame^]

16

#

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

17

# Description:

Tim Hall

2020-10-27 12:43:14 +0000

[diff] [blame]

18

# Holds a container for Ethos-U and System architecture parameters.

Diego Russo

2020-04-14 18:41:58 +0100

[diff] [blame]

19

import enum

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

20

from collections import namedtuple

21

from configparser import ConfigParser

Diego Russo

2020-04-14 18:41:58 +0100

[diff] [blame]

22

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

23

import numpy as np

Diego Russo

2020-04-14 18:41:58 +0100

[diff] [blame]

24

Louis Verhaard

aeae567

2020-11-02 18:04:27 +0100

[diff] [blame]

25

from .api import NpuAccelerator

Tim Hall

2020-11-01 20:59:36 +0000

[diff] [blame]

26

from .errors import CliOptionError

27

from .errors import ConfigOptionError

Dwight Lidman

a9390f7

2020-05-13 12:00:08 +0200

[diff] [blame]

28

from .ethos_u55_regs.ethos_u55_regs import resampling_mode

Louis Verhaard

69b3176

2020-11-17 09:45:20 +0100

[diff] [blame]

29

from .numeric_util import full_shape

Diego Russo

e8a1045

2020-04-21 17:39:10 +0100

[diff] [blame]

30

from .numeric_util import round_up

31

from .numeric_util import round_up_divide

erik.andersson@arm.com

1d6d5c4

2021-04-14 13:31:05 +0200

[diff] [blame]

32

from .numeric_util import round_up_to_int

Tim Hall

4ed38bc

2020-10-20 18:54:20 +0100

[diff] [blame]

33

from .operation import Kernel

Diego Russo

2020-04-14 18:41:58 +0100

[diff] [blame]

34

from .operation import NpuBlockType

Tim Hall

4ed38bc

2020-10-20 18:54:20 +0100

[diff] [blame]

35

from .operation import PointXYZ

Diqing Zhong

2020-12-11 13:07:37 +0100

[diff] [blame]

36

from .tensor import BandwidthDirection

Diego Russo

e8a1045

2020-04-21 17:39:10 +0100

[diff] [blame]

37

from .tensor import MemArea

Patrik Gustavsson

2020-05-27 09:15:11 +0200

[diff] [blame]

38

from .tensor import MemType

Diego Russo

e8a1045

2020-04-21 17:39:10 +0100

[diff] [blame]

39

from .tensor import TensorFormat

40

from .tensor import TensorPurpose

Jonas Ohlsson

45e653d

2021-07-26 16:13:12 +0200

[diff] [blame]

41

from .tflite_supported_operators import TFLiteSupportedOperators

Patrik Gustavsson

8f1f9aa

2021-06-28 07:41:58 +0200

[diff] [blame]

42

from .tosa_supported_operators import TosaSupportedOperators

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

43

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

44

45

class Block:
    """A width x height x depth triple with helpers for element-wise block arithmetic."""

    def __init__(self, w=0, h=0, d=0):
        self.width = w
        self.height = h
        self.depth = d

    def elements(self):
        """Return width * height * depth."""
        return self.width * self.height * self.depth

    def elements_wh(self):
        """Return width * height (depth is ignored)."""
        return self.width * self.height

    def clone(self):
        """Return a new Block carrying the same three dimensions."""
        return Block(self.width, self.height, self.depth)

    def as_list(self):
        """Return the dimensions as a ``[height, width, depth]`` list."""
        return [self.height, self.width, self.depth]

    def __eq__(self, other):
        # Compare by attribute so any object exposing width/height/depth still works, but hand the
        # comparison back to Python (instead of raising AttributeError) for unrelated objects such as None
        try:
            return bool(self.width == other.width and self.height == other.height and self.depth == other.depth)
        except AttributeError:
            return NotImplemented

    # Defining __eq__ already makes the class unhashable; spelled out because instances are mutable
    __hash__ = None

    def __repr__(self):
        return "<Block: {0},{1},{2}>".format(self.width, self.height, self.depth)

    def to_hwc(self):
        """Return the dimensions in height, width, depth order (same result as as_list)."""
        return self.as_list()

    @classmethod
    def from_string(cls, s):
        """Build a block from a ``"WxHxC"`` string of three integers separated by ``x``."""
        w, h, c = (int(v) for v in s.split("x"))
        return cls(w, h, c)

    @classmethod
    def from_shape(cls, shape) -> "Block":
        """Converts the shape to a Block"""
        # presumably pads the shape to at least 3 entries using 1 - confirm against numeric_util.full_shape
        shp = full_shape(3, shape, 1)
        # Note: index from end, as len(shp) may be > 3
        return cls(shp[-2], shp[-3], shp[-1])

    @classmethod
    def min(cls, a, b):
        """Return the per-dimension minimum of blocks a and b."""
        return cls(min(a.width, b.width), min(a.height, b.height), min(a.depth, b.depth))

    @classmethod
    def max(cls, a, b):
        """Return the per-dimension maximum of blocks a and b."""
        return cls(max(a.width, b.width), max(a.height, b.height), max(a.depth, b.depth))

    @classmethod
    def round(cls, a, b):
        """Apply numeric_util.round_up to each dimension of a, using the matching dimension of b."""
        return cls(round_up(a.width, b.width), round_up(a.height, b.height), round_up(a.depth, b.depth))

    @classmethod
    def div_round_up(cls, a, b):
        """Apply numeric_util.round_up_divide to each dimension of a, using the matching dimension of b."""
        return cls(
            round_up_divide(a.width, b.width), round_up_divide(a.height, b.height), round_up_divide(a.depth, b.depth)
        )

104

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

105

106

class Rect:
    """A 3D box described by a start corner (x, y, z) and an inclusive end corner (x2, y2, z2)."""

    def __init__(self, x, y, z, x2, y2, z2):
        self.x, self.y, self.z = x, y, z
        self.x2, self.y2, self.z2 = x2, y2, z2

    def start(self):
        """Return the start corner as a PointXYZ."""
        return PointXYZ(self.x, self.y, self.z)

    def end(self):
        """Return the end corner as a PointXYZ."""
        return PointXYZ(self.x2, self.y2, self.z2)

    def size(self):
        """Return the extent along each axis as a Block; both corners count, hence the +1."""
        extent_x = self.x2 - self.x + 1
        extent_y = self.y2 - self.y + 1
        extent_z = self.z2 - self.z + 1
        return Block(extent_x, extent_y, extent_z)

    def __repr__(self):
        corners = (self.x, self.y, self.z, self.x2, self.y2, self.z2)
        return "<Rect: ({0},{1},{2}) ({3},{4},{5})>".format(*corners)

126

127

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

class SHRAMElements:
    """Indices of the SHRAM element kinds plus per-kind tables indexed by those values."""

    (
        IFM8,  # 0
        IFM16,  # 1
        IFM8_Elementwise,  # 2
        IFM16_Elementwise,  # 3
        IFM32,  # 4
        Acc16,  # 5
        Acc32,  # 6
        Acc40,  # 7
    ) = range(8)
    Last = Acc40

    # One entry per element kind, in index order
    BitSizes = np.array([8, 16, 8, 16, 32, 16, 32, 40], dtype=np.int32)
    ByteSizes = BitSizes // 8
    PostAlign = np.array([8, 8, 8, 8, 8, 1, 1, 1], dtype=np.int32)
    PreAlign = np.array([1, 1, 1, 1, 1, 8, 8, 8], dtype=np.int32)

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

142

143

144

class SHRAMBlockConfig:
    """Pairs the per-element sizes of a block with its per-element bank requirements."""

    def __init__(self, sizes, banks):
        # banks must carry one entry for every SHRAMElements index (0..Last)
        expected_entries = SHRAMElements.Last + 1
        assert len(banks) == expected_entries
        self.sizes, self.banks = sizes, banks

Tim Hall

2020-10-27 12:43:14 +0000

[diff] [blame]

151

# Area indices must match Ethos-U SHRAM layout spec

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

152

class SharedBufferArea(enum.IntEnum):
    """Integer indices of the shared buffer areas; Size is the number of areas."""

    OFM = 0
    Weights = 1
    IFM = 2
    Accumulators = 3
    # One past the last real area
    Size = Accumulators + 1

158

159

Manupa Karunaratne

2020-07-20 12:05:32 +0100

[diff] [blame]

160

class Accelerator(enum.Enum):
    """Accelerator configurations; each value is the lower-case configuration string."""

    Ethos_U55_32 = "ethos-u55-32"
    Ethos_U55_64 = "ethos-u55-64"
    Ethos_U55_128 = "ethos-u55-128"
    Ethos_U55_256 = "ethos-u55-256"
    Ethos_U65_256 = "ethos-u65-256"
    Ethos_U65_512 = "ethos-u65-512"

    @classmethod
    def member_list(cls):
        """Return the configuration strings of all members, in definition order."""
        return [member.value for member in cls]

    @classmethod
    def from_npu_accelerator(cls, npu_accelerator: "NpuAccelerator") -> "Accelerator":
        """Converts the given public API object to Accelerator (used internally)"""
        public_to_internal = {
            NpuAccelerator.Ethos_U55_32: cls.Ethos_U55_32,
            NpuAccelerator.Ethos_U55_64: cls.Ethos_U55_64,
            NpuAccelerator.Ethos_U55_128: cls.Ethos_U55_128,
            NpuAccelerator.Ethos_U55_256: cls.Ethos_U55_256,
            NpuAccelerator.Ethos_U65_256: cls.Ethos_U65_256,
            NpuAccelerator.Ethos_U65_512: cls.Ethos_U65_512,
        }
        assert npu_accelerator in public_to_internal, f"Unsupported accelerator {npu_accelerator}"
        return public_to_internal[npu_accelerator]

185

Manupa Karunaratne

2020-07-20 12:05:32 +0100

[diff] [blame]

186

Tim Hall

2020-11-01 20:59:36 +0000

[diff] [blame]

187

@enum.unique
class MemPort(enum.Enum):
    """The two AXI memory ports; values are auto-assigned and checked for uniqueness."""

    Axi0 = enum.auto()
    Axi1 = enum.auto()

Tim Hall

2021-05-27 18:49:40 +0100

[diff] [blame]

193

# Immutable record describing how the SHRAM banks are laid out
SHRAMConfig = namedtuple(
    "SHRAMConfig",
    (
        "reserved_output_banks",
        "bank_size_bytes",
        "total_banks",
        "reserved_end_banks",
    ),
)

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

198

class ArchitectureFeatures:

Tim Hall

2020-10-27 12:43:14 +0000

[diff] [blame]

199

"""This class is a container for various parameters of the Ethos-U core

Diqing Zhong

2020-09-24 09:53:48 +0200

[diff] [blame]

200

and system configuration that can be tuned, either by command line

Tim Hall

2020-10-27 12:43:14 +0000

[diff] [blame]

201

parameters or by the Ethos-U architects. The class is often passed

Diqing Zhong

2020-09-24 09:53:48 +0200

[diff] [blame]

202

around to passes that need to do architecture-dependent actions.

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

203

Diqing Zhong

2020-09-24 09:53:48 +0200

[diff] [blame]

204

Note the difference between ArchitectureFeatures and CompilerOptions

Tim Hall

2020-10-27 12:43:14 +0000

[diff] [blame]

205

- ArchitectureFeatures is for changing the Ethos-U and system architecture

Diqing Zhong

2020-09-24 09:53:48 +0200

[diff] [blame]

206

- CompilerOptions is for changing the behaviour of the compiler

207

"""

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

208

209

# Per-accelerator hardware parameters; shram_granules holds one entry per SHRAMElements index
ArchitectureConfig = namedtuple(
    "ArchitectureConfig", "macs cores ofm_ublock ifm_ublock shram_banks shram_granules elem_units"
)
accelerator_configs = {
    Accelerator.Ethos_U65_512: ArchitectureConfig(
        macs=256,
        cores=2,
        ofm_ublock=Block(2, 2, 8),
        ifm_ublock=Block(2, 2, 8),
        shram_banks=48,
        shram_granules=[8, 8, 8, 8, 16, 8, 16, 20],
        elem_units=8,
    ),
    Accelerator.Ethos_U65_256: ArchitectureConfig(
        macs=256,
        cores=1,
        ofm_ublock=Block(2, 2, 8),
        ifm_ublock=Block(2, 2, 8),
        shram_banks=48,
        shram_granules=[8, 8, 8, 8, 16, 8, 16, 20],
        elem_units=8,
    ),
    Accelerator.Ethos_U55_256: ArchitectureConfig(
        macs=256,
        cores=1,
        ofm_ublock=Block(2, 2, 8),
        ifm_ublock=Block(2, 2, 8),
        shram_banks=48,
        shram_granules=[8, 8, 8, 8, 16, 8, 16, 20],
        elem_units=8,
    ),
    Accelerator.Ethos_U55_128: ArchitectureConfig(
        macs=128,
        cores=1,
        ofm_ublock=Block(2, 1, 8),
        ifm_ublock=Block(2, 1, 8),
        shram_banks=24,
        shram_granules=[4, 4, 4, 4, 8, 4, 8, 12],
        elem_units=4,
    ),
    Accelerator.Ethos_U55_64: ArchitectureConfig(
        macs=64,
        cores=1,
        ofm_ublock=Block(1, 1, 8),
        ifm_ublock=Block(1, 1, 8),
        shram_banks=16,
        shram_granules=[2, 2, 2, 2, 4, 4, 4, 8],
        elem_units=2,
    ),
    Accelerator.Ethos_U55_32: ArchitectureConfig(
        macs=32,
        cores=1,
        ofm_ublock=Block(1, 1, 4),
        ifm_ublock=Block(1, 1, 8),
        shram_banks=16,
        shram_granules=[2, 2, 2, 2, 4, 4, 4, 4],
        elem_units=1,
    ),
}

OFMSplitDepth = 16
SubKernelMax = Block(8, 8, 65536)

DEFAULT_CONFIG = "internal-default"
MAX_BLOCKDEP = 3

Tim Hall

2020-11-01 20:59:36 +0000

[diff] [blame]

238

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

239

def __init__(
    self,
    vela_config_files,
    accelerator_config,
    system_config,
    memory_mode,
    max_blockdep,
    verbose_config,
    arena_cache_size,
):
    """Populate all architecture parameters for the selected accelerator.

    accelerator_config is matched case-insensitively against the Accelerator values.
    system_config, memory_mode and max_blockdep are stored on the instance as given.
    vela_config_files, verbose_config and arena_cache_size are forwarded to _get_vela_config().

    Raises CliOptionError when accelerator_config is not a known accelerator configuration.
    """
    accelerator_config = accelerator_config.lower()
    if accelerator_config not in Accelerator.member_list():
        # Report the local value: self.accelerator_config is not assigned yet at this point, so reading it
        # here would raise AttributeError and hide the intended error
        raise CliOptionError("--accelerator-config", accelerator_config, "Unknown accelerator configuration")
    self.accelerator_config = Accelerator(accelerator_config)
    accel_config = ArchitectureFeatures.accelerator_configs[self.accelerator_config]
    self.config = accel_config

    self.accumulator_granules = {
        SHRAMElements.Acc16: accel_config.shram_granules[SHRAMElements.Acc16],
        SHRAMElements.Acc32: accel_config.shram_granules[SHRAMElements.Acc32],
        SHRAMElements.Acc40: accel_config.shram_granules[SHRAMElements.Acc40],
    }

    # Keyed by IFM bit width
    self.ifm_bank_granules = {
        8: accel_config.shram_granules[SHRAMElements.IFM8],
        16: accel_config.shram_granules[SHRAMElements.IFM16],
        32: accel_config.shram_granules[SHRAMElements.IFM32],
    }

    # Keyed by IFM bit width; 32-bit shares the IFM32 entry
    self.ifm_ew_bank_granules = {
        8: accel_config.shram_granules[SHRAMElements.IFM8_Elementwise],
        16: accel_config.shram_granules[SHRAMElements.IFM16_Elementwise],
        32: accel_config.shram_granules[SHRAMElements.IFM32],
    }

    self.shram = SHRAMConfig(2, 1024, accel_config.shram_banks, 2 if accel_config.shram_banks > 16 else 0)

    self.system_config = system_config
    self.memory_mode = memory_mode
    self.is_ethos_u65_system = self.accelerator_config in (Accelerator.Ethos_U65_256, Accelerator.Ethos_U65_512)

    if self.is_ethos_u65_system:
        self.max_outstanding_dma = 2
        axi_port_address_width = 40
        axi_port_data_width = 128
    else:
        self.max_outstanding_dma = 1
        axi_port_address_width = 32
        axi_port_data_width = 64

    self.max_outstanding_kernels = 3

    self.ncores = accel_config.cores
    self.ofm_ublock = accel_config.ofm_ublock
    self.ifm_ublock = accel_config.ifm_ublock
    self.ofm_block_max = Block(64, 32, 128)

    self.max_blockdep = max_blockdep

    dpu_min_height = accel_config.ofm_ublock.height
    dpu_min_width = accel_config.ofm_ublock.width
    dpu_dot_product_width = 8
    dpu_min_ofm_channels = accel_config.ofm_ublock.depth

    self.num_elem_wise_units = accel_config.elem_units
    self.num_macs_per_cycle = dpu_min_height * dpu_min_width * dpu_dot_product_width * dpu_min_ofm_channels
    # Sanity check of the static table: the derived MAC count must match the configured one
    assert self.num_macs_per_cycle == accel_config.macs, f"{self.num_macs_per_cycle} != {accel_config.macs}"
    # Max value in address offsets
    self.max_address_offset = 1 << axi_port_address_width

    # Get system configuration and memory mode
    # NOTE(review): presumably this populates memory_clock_scales, core_clock and the *_storage_mem_area
    # attributes read below - its body is not visible here, confirm
    self._get_vela_config(vela_config_files, verbose_config, arena_cache_size)

    self.memory_bandwidths_per_cycle = axi_port_data_width * self.memory_clock_scales / 8

    self.memory_bandwidths_per_second = self.memory_bandwidths_per_cycle * self.core_clock

    # Get output/activation performance numbers
    self._generate_output_perf_tables(self.accelerator_config)

    # sizes as N x H x W x C. we need to round up to these when allocating storage
    self.storage_rounding_quantums = {
        TensorFormat.Unknown: (1, 1, 1, 1),
        TensorFormat.WeightsCompressed: (1, 1, 1, 1),
        TensorFormat.NHWC: (1, 1, 1, 1),
        TensorFormat.NHCWB16: (1, 1, 1, 16),
    }

    # brick sizes as N x H x W x C. We have to fetch whole bricks at a time
    self.brick_sizes = {
        TensorFormat.Unknown: (1, 1, 1, 1),
        TensorFormat.WeightsCompressed: (1, 1, 1, 1),
        TensorFormat.NHWC: (1, 1, 1, 1),
        TensorFormat.NHCWB16: (1, 1, 1, 16),
    }

    self.default_weight_format = TensorFormat.WeightsCompressed
    self.default_feature_map_format = TensorFormat.NHWC

    self.tensor_storage_mem_area = {
        # permanent mem_area
        TensorPurpose.Unknown: MemArea.Unknown,
        TensorPurpose.Weights: self.permanent_storage_mem_area,
        TensorPurpose.FeatureMap: self.feature_map_storage_mem_area,
        TensorPurpose.LUT: self.permanent_storage_mem_area,
        TensorPurpose.Scratch: self.feature_map_storage_mem_area,
        TensorPurpose.ScratchFast: self.fast_storage_mem_area,
    }

    self.tensor_storage_mem_type = {
        TensorPurpose.Unknown: MemType.Unknown,
        TensorPurpose.Weights: MemType.Permanent_NPU,
        TensorPurpose.FeatureMap: MemType.Scratch,
        TensorPurpose.LUT: MemType.Scratch,
        TensorPurpose.Scratch: MemType.Scratch,
        TensorPurpose.ScratchFast: MemType.Scratch_fast,
    }

    self.min_block_sizes = {
        NpuBlockType.Default: (dpu_min_height, dpu_min_width),
        NpuBlockType.VectorProduct: (1, 1),
        NpuBlockType.ConvolutionMxN: (dpu_min_height, dpu_min_width),
        NpuBlockType.Pooling: (dpu_min_height, dpu_min_width),
        NpuBlockType.ConvolutionDepthWise: (dpu_min_height, dpu_min_width),
        NpuBlockType.ElementWise: (1, 1),
        NpuBlockType.ReduceSum: (dpu_min_height, dpu_min_width),
    }

    self.sub_kernel_limits = {
        NpuBlockType.Default: (8, 8),
        NpuBlockType.VectorProduct: (1, 1),
        NpuBlockType.ConvolutionMxN: (8, 8),
        NpuBlockType.Pooling: (8, 8),
        NpuBlockType.ConvolutionDepthWise: (8, 8),
        NpuBlockType.ElementWise: (1, 1),
        NpuBlockType.ReduceSum: (8, 8),
    }

    # weights for scheduler search
    # (imported here rather than at module level, as in the original code)
    from .npu_performance import make_bandwidth_array

    self.bandwidth_weights = make_bandwidth_array()
    self.bandwidth_weights[MemArea.Sram] = 1.0
    self.bandwidth_weights[MemArea.Dram] = 10.0
    self.bandwidth_weights[MemArea.OnChipFlash] = 2.0
    self.bandwidth_weights[MemArea.OffChipFlash] = 20.0
    self.cycles_weight = 40
    self.max_sram_used_weight = 1000

    if self.is_spilling_enabled():
        self.max_sram_used_weight = 0

    # Shared Buffer Block allocations
    self.shram_bank_size = 1024  # bytes
    self.shram_size_bytes = accel_config.shram_banks * self.shram_bank_size
    self.shram_reserved_output_banks = 2
    self.shram_reserved_weight_banks = 0
    self.shram_reserved_unused_banks = 2 if accel_config.shram_banks > 16 else 0
    self.shram_total_banks = accel_config.shram_banks - self.shram_reserved_unused_banks
    self.shram_bank_granules = np.array(accel_config.shram_granules, np.int32)
    self.shram_lut_size = 2048
    # SHRAM base address of the activation lookup table
    self.shram_lut_address = self.shram_bank_size * self.available_shram_banks(True)

    # Build a map of acceptable IFM/OFM block configurations up to the maximum
    # IFM/OFM block size.
    ifm_block_max = self.get_ifm_block_size(32, self.ofm_block_max, Kernel(8, 8))
    self.block_config_map = {}
    self.generate_block_config_map(Block(ifm_block_max.width * 2, ifm_block_max.height, 128))

    # Setup supported operators and restriction checkers class
    self.tflite_supported_operators = TFLiteSupportedOperators()
    self.tosa_supported_operators = TosaSupportedOperators()

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

412

Louis Verhaard

0b8268a

2020-08-05 16:11:29 +0200

[diff] [blame]

413

def available_shram_banks(self, uses_activation_lut):
    """Return the number of usable SHRAM banks, depending on whether the activation lookup table is used.

    Two banks are subtracted only when the lookup table is in use and the configuration has no
    reserved unused banks.
    """
    lut_takes_banks = uses_activation_lut and self.shram_reserved_unused_banks == 0
    return self.shram_total_banks - 2 if lut_takes_banks else self.shram_total_banks

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

421

def generate_block_config(self, width, height, depth):
    """Calculate the block configuration for ALL known IFM operations and accumulator sizes.

    Consumers select their preferred operation and bit-width at read-time. The SHRAMElements tables
    are arrays, so every intermediate below carries one entry per element kind.
    """
    # Number of bytes required for any SHRAM element for a FM of given dimensions.
    # For IFM: size = H*W*Align(D*BYTE_WIDTH, 8)
    # For ACC: size = H*W*Align(D,8)*BYTE_WIDTH
    pre_aligned_depth = round_up(depth, SHRAMElements.PreAlign)
    depth_bytes = round_up(pre_aligned_depth * SHRAMElements.ByteSizes, SHRAMElements.PostAlign)
    size_bytes = (height * width) * depth_bytes

    # Convert byte size (rounded) to size in banks
    single_buffer_banks = round_up_divide(size_bytes, self.shram_bank_size)
    # Double buffer the IFM/Acc (need twice as many banks)
    double_buffer_banks = single_buffer_banks * 2
    # Round bank requirement to bank granularity
    return SHRAMBlockConfig(size_bytes, round_up(double_buffer_banks, self.shram_bank_granules))

438

439

@staticmethod

440

def make_block_config_key(width, height, depth):

441

return (int(height), int(width), int(depth))

442

443

def get_block_config(self, width, height, depth):

444

assert depth <= self.ofm_block_max.depth

445

key = ArchitectureFeatures.make_block_config_key(width, height, depth)

446

config = self.block_config_map.get(key, None)

447

return config

448

449

# Generate a key:value map of possible block configurations, where the

450

# key is compounded from the block dimensions: 0x00HHWWCC

451

def generate_block_config_map(self, block: Block):

452

for h in range(1, block.height + 1):

453

for w in range(1, block.width + 1):

454

# All possible IFM/OFM depth values

455

for c in [4, 8, 12, 16, 24, 32, 40, 48, 56, 64, 72, 80, 88, 96, 104, 112, 120, 128]:

456

key = ArchitectureFeatures.make_block_config_key(w, h, c)

457

self.block_config_map[key] = self.generate_block_config(w, h, c)

458

Diqing Zhong

2020-09-24 09:53:48 +0200

[diff] [blame]

459

def _generate_output_perf_tables(self, accel_config):
    """Set output_cycles_per_elem and activation_cycles_per_elem for the given Accelerator member."""
    if accel_config == Accelerator.Ethos_U55_32:
        output_cycles = (2.0, 3.0, 3.0, 3.0, 4.0, 6.0, 1.0, 2.0)
        activation_cycles = (1.0, 1.0, 0.0)
    elif accel_config == Accelerator.Ethos_U55_64:
        output_cycles = (1.0, 1.5, 1.5, 1.5, 2.0, 3.0, 0.5, 1.0)
        activation_cycles = (1.0, 1.0, 0.0)
    elif accel_config == Accelerator.Ethos_U55_128:
        output_cycles = (0.75, 1.25, 0.75, 0.75, 1.0, 1.5, 0.25, 0.5)
        activation_cycles = (1.0, 0.5, 0.0)
    elif accel_config in (Accelerator.Ethos_U55_256, Accelerator.Ethos_U65_256):
        output_cycles = (0.625, 1.125, 0.5, 0.375, 0.5, 0.75, 0.125, 0.25)
        activation_cycles = (1.0, 0.25, 0.0)
    else:
        # Only one configuration is left; anything else is a programming error
        assert accel_config == Accelerator.Ethos_U65_512
        output_cycles = (0.3125, 0.5625, 0.25, 0.1875, 0.25, 0.375, 0.0625, 0.125)
        activation_cycles = (0.5, 0.125, 0.0)

    self.output_cycles_per_elem = output_cycles
    self.activation_cycles_per_elem = activation_cycles

476

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

477

def calc_ifm_block_depth(self, ifm_depth, ifm_bits):
    """Return the IFM block depth for an IFM of the given depth and bit width.

    The depth is passed through round_up with the IFM micro-block depth and then capped at
    8 * 32 // ifm_bits. ifm_bits must be 8, 16 or 32 and ifm_depth must be positive.
    """
    assert ifm_bits in (8, 16, 32)
    assert ifm_depth > 0
    rounded_depth = round_up(ifm_depth, self.ifm_ublock.depth)
    depth_cap = 8 * 32 // ifm_bits
    return min(depth_cap, rounded_depth)

483

484

# Calculate the size of the IFM block given a depth, target OFM block and a kernel

Tim Hall

c30f495

2020-06-15 20:47:35 +0100

[diff] [blame]

485

def get_ifm_block_size(
    self,
    ifm_block_depth,
    ofm_block: Block,
    kernel: Kernel,
    subkernel: Block = Block(8, 8, 65536),
    ifm_resampling_mode=resampling_mode.NONE,
):
    """Return the IFM block (as a Block) needed to produce ofm_block with the given kernel.

    Along each axis the extent is (ofm - 1) * stride + min(subkernel, dilated kernel), divided by 2
    unless ifm_resampling_mode is NONE, then passed through round_up_to_int and round_up with the
    IFM micro-block size. ifm_block_depth is used as the depth unchanged.
    """
    if ifm_resampling_mode == resampling_mode.NONE:
        upscaling = 1
    else:
        upscaling = 2

    def axis_extent(ofm_len, stride, kernel_len, dilation, subkernel_len, ublock_len):
        dilated_kernel_len = ((kernel_len - 1) * dilation) + 1
        raw_extent = ((ofm_len - 1) * stride + min(subkernel_len, dilated_kernel_len)) / upscaling
        return round_up(round_up_to_int(raw_extent), ublock_len)

    # Height
    block_height = axis_extent(
        ofm_block.height, kernel.stride.y, kernel.height, kernel.dilation.y, subkernel.height, self.ifm_ublock.height
    )

    # Width
    block_width = axis_extent(
        ofm_block.width, kernel.stride.x, kernel.width, kernel.dilation.x, subkernel.width, self.ifm_ublock.width
    )

    return Block(block_width, block_height, ifm_block_depth)

512

Tim Hall

2020-11-01 20:59:36 +0000

[diff] [blame]

513

def is_spilling_enabled(self):
    """
    Spilling is a feature that allows the Ethos-U to use a dedicated SRAM as a cache for various types of data

    It is reported as enabled when the cache memory area maps to SRAM and differs from the arena memory area.
    """
    cache_maps_to_sram = self._mem_port_mapping(self.cache_mem_area) == MemArea.Sram
    if not cache_maps_to_sram:
        return cache_maps_to_sram
    return self.cache_mem_area != self.arena_mem_area

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

520

Louis Verhaard

024c355

2021-03-17 14:26:34 +0100

[diff] [blame]

521

def mem_type_size(self, mem_type: MemType) -> int:
    """Returns size in bytes available for the given memory type. This is a hard limit."""
    # when accessing the scratch fast memory type with memory spilling enabled the arena_cache_size refers to
    # the cache memory area which is a hard limit; for all other memory types and modes the hard limit is the
    # maximum possible address offset
    limited_by_cache = mem_type == MemType.Scratch_fast and self.is_spilling_enabled()
    return self.arena_cache_size if limited_by_cache else self.max_address_offset

Louis Verhaard

024c355

2021-03-17 14:26:34 +0100

[diff] [blame]

530

Tim Hall

2020-11-01 20:59:36 +0000

[diff] [blame]

531

def _mem_port_mapping(self, mem_port):
    """Return the memory area attached to the given MemPort (KeyError for any other value)."""
    area_by_port = {
        MemPort.Axi0: self.axi0_port,
        MemPort.Axi1: self.axi1_port,
    }
    return area_by_port[mem_port]

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

534

Tim Hall

2020-11-01 20:59:36 +0000

[diff] [blame]

535

def _set_default_sys_config(self):
    """
    Applies the ArchitectureFeatures.DEFAULT_CONFIG system configuration values.

    Sets the core clock, the memory areas attached to the two AXI ports and the clock scale, burst length
    and read/write latency of those two memory areas.
    """
    if self.is_ethos_u65_system:
        # Default Ethos-U65 system configuration
        # Ethos-U65 Client-Server: SRAM (16 GB/s) and DRAM (12 GB/s)
        core_clock = 1e9
        axi1_area = MemArea.Dram
        axi1_clock_scale = 0.75  # 3 / 4
        axi1_read_latency, axi1_write_latency = 500, 250
    else:
        # Default Ethos-U55 system configuration
        # Ethos-U55 High-End Embedded: SRAM (4 GB/s) and Flash (0.5 GB/s)
        core_clock = 500e6
        axi1_area = MemArea.OffChipFlash
        axi1_clock_scale = 0.125  # 1 / 8
        axi1_read_latency, axi1_write_latency = 64, 64

    self.core_clock = core_clock
    # Sram is always on the first port; only the memory on the second port differs between the systems
    self.axi0_port = MemArea.Sram
    self.axi1_port = axi1_area

    # one row per memory area: (area, clock scale, burst length, read latency, write latency)
    area_settings = (
        (MemArea.Sram, 1.0, 32, 32, 32),
        (axi1_area, axi1_clock_scale, 128, axi1_read_latency, axi1_write_latency),
    )
    for area, clock_scale, burst_length, read_latency, write_latency in area_settings:
        self.memory_clock_scales[area] = clock_scale
        self.memory_burst_length[area] = burst_length
        self.memory_latency[area][BandwidthDirection.Read] = read_latency
        self.memory_latency[area][BandwidthDirection.Write] = write_latency

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

565

Tim Hall

2020-11-01 20:59:36 +0000

[diff] [blame]

566

def _set_default_mem_mode(self):
    """
    Applies the ArchitectureFeatures.DEFAULT_CONFIG memory mode values.

    Sets the memory ports used for constant data, the arena and the cache, together with the arena cache size.
    """
    dedicated_sram = self.is_ethos_u65_system

    # both defaults keep the constant data on Axi1 and the cache on Axi0
    self.const_mem_area = MemPort.Axi1
    self.cache_mem_area = MemPort.Axi0

    if dedicated_sram:
        # Default Ethos-U65 memory mode
        # Dedicated SRAM: the SRAM is only for use by the Ethos-U
        # The non-SRAM memory is assumed to be read-writeable
        self.arena_mem_area = MemPort.Axi1
        self.arena_cache_size = 384 * 1024
    else:
        # Default Ethos-U55 memory mode
        # Shared SRAM: the SRAM is shared between the Ethos-U and the Cortex-M software
        # The non-SRAM memory is assumed to be read-only
        self.arena_mem_area = MemPort.Axi0
        self.arena_cache_size = self.max_address_offset

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

584

Tim Hall

2021-05-27 18:49:40 +0100

[diff] [blame]

585

def _get_vela_config(self, vela_config_files, verbose_config, arena_cache_size_from_cli):
    """
    Gets the system configuration and memory modes from one or more Vela configuration file(s) or uses some
    defaults.

    Parameters:
        vela_config_files: handed to ConfigParser.read(); None means that no configuration file was given
        verbose_config: when true the resulting configuration is printed
        arena_cache_size_from_cli: when not None this replaces the arena cache size obtained from the
            configuration file or the defaults

    Raises:
        CliOptionError: the requested system configuration or memory mode is neither a section of the
            configuration file(s) nor ArchitectureFeatures.DEFAULT_CONFIG
        ConfigOptionError: the resulting memory areas or arena cache size fail the checks below
    """
    # all properties are optional and are initialised to a value of 1 (or the equivalent)
    self.core_clock = 1
    self.axi0_port = MemArea(1)
    self.axi1_port = MemArea(1)
    self.memory_clock_scales = np.ones(MemArea.Size)
    # the builtin int is used because the np.int alias was deprecated in NumPy 1.20 and removed in NumPy 1.24
    self.memory_burst_length = np.ones(MemArea.Size, int)
    self.memory_latency = np.zeros((MemArea.Size, BandwidthDirection.Size), int)
    self.const_mem_area = MemPort(1)
    self.arena_mem_area = MemPort(1)
    self.cache_mem_area = MemPort(1)
    self.arena_cache_size = self.max_address_offset
    arena_cache_size_loc_text = "Default"

    # read configuration file(s)
    self.vela_config = None

    if vela_config_files is not None:
        self.vela_config = ConfigParser()
        self.vela_config.read(vela_config_files)

    # read system configuration
    sys_cfg_section = "System_Config." + self.system_config

    if self.vela_config is not None and self.vela_config.has_section(sys_cfg_section):
        self.core_clock = float(self._read_config(sys_cfg_section, "core_clock", self.core_clock))
        # the member name is passed as the default (as done for the memory mode below) so that the MemArea[...]
        # lookup also succeeds when the key is missing from the configuration file
        self.axi0_port = MemArea[self._read_config(sys_cfg_section, "axi0_port", self.axi0_port.name)]
        self.axi1_port = MemArea[self._read_config(sys_cfg_section, "axi1_port", self.axi1_port.name)]

        # only the memory areas attached to the two ports are read from the configuration file
        for mem_area in (self.axi0_port, self.axi1_port):
            self.memory_clock_scales[mem_area] = float(
                self._read_config(
                    sys_cfg_section, mem_area.name + "_clock_scale", self.memory_clock_scales[mem_area]
                )
            )
            self.memory_burst_length[mem_area] = int(
                self._read_config(
                    sys_cfg_section, mem_area.name + "_burst_length", self.memory_burst_length[mem_area]
                )
            )
            self.memory_latency[mem_area][BandwidthDirection.Read] = int(
                self._read_config(
                    sys_cfg_section,
                    mem_area.name + "_read_latency",
                    self.memory_latency[mem_area][BandwidthDirection.Read],
                )
            )
            self.memory_latency[mem_area][BandwidthDirection.Write] = int(
                self._read_config(
                    sys_cfg_section,
                    mem_area.name + "_write_latency",
                    self.memory_latency[mem_area][BandwidthDirection.Write],
                )
            )

    elif self.system_config == ArchitectureFeatures.DEFAULT_CONFIG:
        self._set_default_sys_config()

    elif vela_config_files is None:
        raise CliOptionError("--config", vela_config_files, "Vela config file not specified")

    else:
        raise CliOptionError(
            "--system-config",
            self.system_config,
            f"Section {sys_cfg_section} not found in Vela config file",
        )

    # read the memory mode
    mem_mode_section = "Memory_Mode." + self.memory_mode

    if self.vela_config is not None and self.vela_config.has_section(mem_mode_section):
        self.const_mem_area = MemPort[
            self._read_config(mem_mode_section, "const_mem_area", self.const_mem_area.name)
        ]
        self.arena_mem_area = MemPort[
            self._read_config(mem_mode_section, "arena_mem_area", self.arena_mem_area.name)
        ]
        self.cache_mem_area = MemPort[
            self._read_config(mem_mode_section, "cache_mem_area", self.cache_mem_area.name)
        ]
        # _read_config appends to this list; the last entry is True when the key was found in the file(s)
        found = []
        self.arena_cache_size = int(
            self._read_config(mem_mode_section, "arena_cache_size", self.arena_cache_size, found)
        )
        if found[-1]:
            arena_cache_size_loc_text = "Configuration file"

    elif self.memory_mode == ArchitectureFeatures.DEFAULT_CONFIG:
        self._set_default_mem_mode()

    elif vela_config_files is None:
        raise CliOptionError("--config", vela_config_files, "Vela config file not specified")

    else:
        raise CliOptionError(
            "--memory-mode",
            self.memory_mode,
            f"Section {mem_mode_section} not found in Vela config file",
        )

    # override sram to onchipflash
    if self._mem_port_mapping(self.const_mem_area) == MemArea.Sram:
        if self.const_mem_area == self.arena_mem_area == self.cache_mem_area:
            print(
                "Info: Changing const_mem_area from Sram to OnChipFlash. This will use the same characteristics as"
                " Sram."
            )
            # the constant data is moved to the other port and that port is re-labelled as OnChipFlash
            if self.const_mem_area == MemPort.Axi0:
                self.const_mem_area = MemPort.Axi1
                self.axi1_port = MemArea.OnChipFlash
            else:
                self.const_mem_area = MemPort.Axi0
                self.axi0_port = MemArea.OnChipFlash
            self.memory_clock_scales[MemArea.OnChipFlash] = self.memory_clock_scales[MemArea.Sram]
            self.memory_burst_length[MemArea.OnChipFlash] = self.memory_burst_length[MemArea.Sram]
            self.memory_latency[MemArea.OnChipFlash] = self.memory_latency[MemArea.Sram]

    # override sram usage
    if arena_cache_size_from_cli is not None:
        self.arena_cache_size = arena_cache_size_from_cli
        arena_cache_size_loc_text = "CLI option"

    # check configuration
    if self._mem_port_mapping(self.const_mem_area) not in (
        MemArea.Dram,
        MemArea.OnChipFlash,
        MemArea.OffChipFlash,
    ):
        raise ConfigOptionError(
            "const_mem_area",
            self._mem_port_mapping(self.const_mem_area).name,
            "Dram or OnChipFlash or OffChipFlash",
        )

    if self._mem_port_mapping(self.arena_mem_area) not in (MemArea.Sram, MemArea.Dram):
        raise ConfigOptionError("arena_mem_area", self._mem_port_mapping(self.arena_mem_area).name, "Sram or Dram")

    if self._mem_port_mapping(self.cache_mem_area) != MemArea.Sram:
        raise ConfigOptionError("cache_mem_area", self._mem_port_mapping(self.cache_mem_area).name, "Sram")

    if self.arena_cache_size < 0:
        raise ConfigOptionError("arena_cache_size", self.arena_cache_size, ">= 0")
    if self.arena_cache_size > self.max_address_offset:
        raise ConfigOptionError(
            "arena_cache_size",
            f"{self.arena_cache_size}. Size is out of bounds, maximum is: {self.max_address_offset}",
        )

    # assign existing memory areas
    self.permanent_storage_mem_area = self._mem_port_mapping(self.const_mem_area)
    self.feature_map_storage_mem_area = self._mem_port_mapping(self.arena_mem_area)
    self.fast_storage_mem_area = self._mem_port_mapping(self.cache_mem_area)

    # display the system configuration and memory mode
    if verbose_config:
        print("Configuration files:")
        print(f" {vela_config_files}")
        print(f"System Configuration ({self.system_config}):")
        print(f" core_clock = {self.core_clock}")
        print(f" axi0_port = {self.axi0_port.name}")
        print(f" axi1_port = {self.axi1_port.name}")
        for mem in (MemArea.Sram, MemArea.Dram, MemArea.OnChipFlash, MemArea.OffChipFlash):
            print(f" {mem.name}_clock_scales = {self.memory_clock_scales[mem]}")
            print(f" {mem.name}_burst_length = {self.memory_burst_length[mem]}")
            print(f" {mem.name}_read_latency = {self.memory_latency[mem][BandwidthDirection.Read]}")
            print(f" {mem.name}_write_latency = {self.memory_latency[mem][BandwidthDirection.Write]}")

        print(f"Memory Mode ({self.memory_mode}):")
        print(f" const_mem_area = {self.const_mem_area.name}")
        print(f" arena_mem_area = {self.arena_mem_area.name}")
        print(f" cache_mem_area = {self.cache_mem_area.name}")
        print(f" arena_cache_size = {self.arena_cache_size} from {arena_cache_size_loc_text}")

        print("Architecture Settings:")
        print(f" permanent_storage_mem_area = {self.permanent_storage_mem_area.name}")
        print(f" feature_map_storage_mem_area = {self.feature_map_storage_mem_area.name}")
        print(f" fast_storage_mem_area = {self.fast_storage_mem_area.name}")

Tim Hall

2020-11-01 20:59:36 +0000

[diff] [blame]

767

Tim Hall

2021-05-27 18:49:40 +0100

[diff] [blame]

768

def _read_config(self, section, key, current_value, found=None):

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

769

"""

Tim Hall

2020-11-01 20:59:36 +0000

[diff] [blame]

770

Reads a given key from a particular section in the Vela config file. If the section contains the 'inherit'

771

option then we recurse into the section specified. If inherited sections result in multiple keys for a

Tim Hall

2021-05-27 18:49:40 +0100

[diff] [blame]

772

particular option then the key from the parent section is used, regardless of the parsing order. if specified

773

found should be an empty list that this function will append a True or False to the end of the list indicating

774

whether the key was found or not.

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

775

"""

Tim Hall

2020-11-01 20:59:36 +0000

[diff] [blame]

776

if not self.vela_config.has_section(section):

Michael McGeagh

7a6f843

2020-12-02 15:29:22 +0000

[diff] [blame]

777

raise ConfigOptionError("section", f"{section}. The section was not found in the Vela config file(s)")

Tim Hall

2020-11-01 20:59:36 +0000

[diff] [blame]

778

Tim Hall

2021-05-27 18:49:40 +0100

[diff] [blame]

779

result = str(current_value) if current_value is not None else None

780

if found is not None:

781

found.append(False)

782

Tim Hall

2020-11-01 20:59:36 +0000

[diff] [blame]

783

if self.vela_config.has_option(section, "inherit"):

784

inheritance_section = self.vela_config.get(section, "inherit")

785

# check for recursion loop

786

if inheritance_section == section:

787

raise ConfigOptionError(

Jonas Ohlsson

d857507

2022-03-30 10:30:25 +0200

[diff] [blame]

788

"inherit",

789

f"{inheritance_section}. This references its own section and recursion is not allowed",

Tim Hall

2020-11-01 20:59:36 +0000

[diff] [blame]

790

)

Tim Hall

2021-05-27 18:49:40 +0100

[diff] [blame]

791

result = self._read_config(inheritance_section, key, result, found)

Tim Hall

2020-11-01 20:59:36 +0000

[diff] [blame]

792

793

if self.vela_config.has_option(section, key):

794

result = self.vela_config.get(section, key)

Tim Hall

2021-05-27 18:49:40 +0100

[diff] [blame]

795

if found is not None:

796

found.append(True)

Tim Hall

2020-11-01 20:59:36 +0000

[diff] [blame]

797

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

798

return result

Louis Verhaard

5207830

2020-11-18 13:35:06 +0100

[diff] [blame]

799

800

Louis Verhaard

2020-11-27 08:24:03 +0100

[diff] [blame]

801

# Default architecture instances are expensive to create, so the ones already built are kept here
default_arch_cache = {}

803

804

Louis Verhaard

5207830

2020-11-18 13:35:06 +0100

[diff] [blame]

805

def create_default_arch(accelerator: Accelerator) -> ArchitectureFeatures:

806

"""Creates architecture features object using default settings"""

Louis Verhaard

2020-11-27 08:24:03 +0100

[diff] [blame]

807

if accelerator not in default_arch_cache:

808

default_arch_cache[accelerator] = ArchitectureFeatures(

809

vela_config_files=None,

810

accelerator_config=accelerator.value,

811

system_config=ArchitectureFeatures.DEFAULT_CONFIG,

812

memory_mode=ArchitectureFeatures.DEFAULT_CONFIG,

Louis Verhaard

2020-11-27 08:24:03 +0100

[diff] [blame]

813

max_blockdep=ArchitectureFeatures.MAX_BLOCKDEP,

Louis Verhaard

2020-11-27 08:24:03 +0100

[diff] [blame]

814

verbose_config=False,

Tim Hall

2021-05-27 18:49:40 +0100

[diff] [blame]

815

arena_cache_size=None,

Louis Verhaard