Blame - ethosu/vela/vela.py - ml/ethos-u/ethos-u-vela

2020-04-27 18:20:16 +0100

[diff] [blame]

2

#

3

# SPDX-License-Identifier: Apache-2.0

4

#

5

# Licensed under the Apache License, Version 2.0 (the License); you may

6

# not use this file except in compliance with the License.

7

# You may obtain a copy of the License at

8

#

9

# www.apache.org/licenses/LICENSE-2.0

10

#

11

# Unless required by applicable law or agreed to in writing, software

12

# distributed under the License is distributed on an AS IS BASIS, WITHOUT

13

# WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.

14

# See the License for the specific language governing permissions and

15

# limitations under the License.

Rickard Bolin

bc6ee58

2022-11-04 08:24:29 +0000

[diff] [blame]

16

#

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

17

# Description:

18

# Main entry point for the Vela compiler.

19

#

20

# Provides the command line interface, options parsing and network loading before calling the compiler driver.

Diego Russo

2020-04-21 17:39:10 +0100

[diff] [blame]

21

import argparse

Alexander Hansson

2466d81

2023-05-17 12:38:46 +0000

[diff] [blame^]

22

import datetime

Rickard Bolin

2022-04-25 11:07:56 +0000

[diff] [blame]

23

import glob

Tim Hall

1bd531d

2020-11-01 20:59:36 +0000

[diff] [blame]

24

import os

Diego Russo

ea6111a

2020-04-14 18:41:58 +0100

[diff] [blame]

25

import sys

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

26

import time

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

27

erik.andersson@arm.com

2021-02-03 10:20:16 +0100

[diff] [blame]

28

import flatbuffers

29

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

30

from . import architecture_features

Diego Russo

2020-04-21 17:39:10 +0100

[diff] [blame]

31

from . import compiler_driver

32

from . import model_reader

Diqing Zhong

2021-08-16 17:24:09 +0200

[diff] [blame]

33

from . import rawdata_writer

Diego Russo

2020-04-21 17:39:10 +0100

[diff] [blame]

34

from . import scheduler

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

35

from . import stats_writer

36

from . import tflite_writer

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

37

from ._version import __version__

Louis Verhaard

11831ce

2020-11-18 18:53:24 +0100

[diff] [blame]

38

from .api import API_VERSION

Tim Hall

2020-11-09 16:46:37 +0000

[diff] [blame]

39

from .debug_database import DebugDatabase

Louis Verhaard

7db7896

2020-05-25 15:05:26 +0200

[diff] [blame]

40

from .errors import InputFileError

Henrik G Olsson

2021-03-23 17:34:49 +0100

[diff] [blame]

41

from .errors import VelaError

Tim Hall

cda4fcb

2022-05-19 12:36:58 +0100

[diff] [blame]

42

from .hillclimb_allocation import HillClimbAllocator

Jonas Ohlsson

2021-07-26 16:13:12 +0200

[diff] [blame]

43

from .nn_graph import NetworkType

Diego Russo

2020-04-21 17:39:10 +0100

[diff] [blame]

44

from .nn_graph import TensorAllocator

Diego Russo

ea6111a

2020-04-14 18:41:58 +0100

[diff] [blame]

45

from .tensor import MemArea

Jacob Bohlin

0628a8c

2020-08-28 13:25:14 +0200

[diff] [blame]

46

from .tensor import Tensor

erik.andersson@arm.com

2021-02-03 10:20:16 +0100

[diff] [blame]

47

from .tflite.Model import Model

Michael McGeagh

2020-11-10 12:38:25 +0000

[diff] [blame]

48

from .tflite_mapping import builtin_operator_map

Tim Hall

a3fe665

2022-03-03 17:43:16 +0000

[diff] [blame]

49

from .tflite_mapping import builtin_operator_name_map

Fredrik Svedberg

2022-09-16 16:24:55 +0200

[diff] [blame]

50

from .tflite_mapping import optype_to_builtintype

Jonas Ohlsson

2021-07-26 16:13:12 +0200

[diff] [blame]

51

from .tflite_model_semantic import TFLiteSemantic

52

from .tflite_supported_operators import TFLiteSupportedOperators

53

from .tosa_model_semantic import TosaSemantic

54

from .tosa_supported_operators import TosaSupportedOperators

Louis Verhaard

5207830

2020-11-18 13:35:06 +0100

[diff] [blame]

55

from ethosu.vela.architecture_features import ArchitectureFeatures

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

56

Rickard Bolin

7ce6b32

2022-06-02 09:30:33 +0000

[diff] [blame]

57

# Directory that is searched for Vela configuration (.ini) files.
# normpath resolves the path lexically: the first ".." cancels this file's own name and the second cancels the
# directory containing it, so the result is the "config_files" folder that sits beside this file's directory.
CONFIG_FILES_PATH = os.path.normpath(os.path.join(__file__, "..", "..", "config_files"))

Rickard Bolin

2022-04-25 11:07:56 +0000

[diff] [blame]

58

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

59

Tim Hall

2020-11-09 16:46:37 +0000

[diff] [blame]

60

def process(input_name, enable_debug_db, arch, model_reader_options, compiler_options, scheduler_options):
    """Compile one network file and write all of its output files.

    The steps run strictly in this order: create the output directory, read the
    model, run the compiler driver, write the summary CSV, print the performance
    metrics, write the compiled network and finally (optionally) the debug
    database.

    Args:
        input_name: path of the network file to compile. Its extension decides
            which writer is used (".tflite" or ".tosa").
        enable_debug_db: when true, DebugDatabase warnings are enabled and a
            "<basename>_debug.xml" file is written.
        arch: architecture description handed to the compiler driver and the
            writers; its `system_config` is part of the summary CSV file name.
        model_reader_options: passed through to `model_reader.read_model`.
        compiler_options: supplies `output_dir`, `timing`, `verbose_operators`,
            `show_cpu_operations` and `verbose_weights`, and is passed through
            to the compiler driver.
        scheduler_options: passed through to the compiler driver.

    Returns:
        The network graph produced by the model reader, after it has been
        handed to the compiler driver.

    Raises:
        InputFileError: if the model reader returns a falsy graph.
    """
    if compiler_options.timing:
        phase_begin = time.time()

    os.makedirs(compiler_options.output_dir, exist_ok=True)
    # Every output file name is derived from the input file name without its extension
    input_stem = os.path.splitext(os.path.basename(input_name))[0]
    output_basename = os.path.join(compiler_options.output_dir, input_stem)
    DebugDatabase.show_warnings = enable_debug_db

    nng, network_type = model_reader.read_model(input_name, model_reader_options)

    if not nng:
        raise InputFileError(input_name, "Input file could not be read")

    if compiler_options.verbose_operators:
        nng.print_operators()

    if compiler_options.timing:
        phase_end = time.time()
        print("Model reading took %f s" % (phase_end - phase_begin))
        # Restart the clock so that the second report only covers the work below
        phase_begin = time.time()

    compiler_driver.compiler_driver(nng, arch, compiler_options, scheduler_options, network_type, output_basename)

    stats_writer.write_summary_metrics_csv(
        nng,
        "{0}_summary_{1}.csv".format(output_basename, arch.system_config),
        arch,
    )

    stats_writer.print_performance_metrics(
        nng,
        show_cpu_operations=compiler_options.show_cpu_operations,
        verbose_weights=compiler_options.verbose_weights,
        arch=arch,
    )

    # The writer is selected from the input file extension
    output_tfl_filename = output_basename + "_vela.tflite"
    if input_name.endswith(".tflite"):
        tflite_writer.write_tflite(nng, output_tfl_filename)
    if input_name.endswith(".tosa"):
        rawdata_writer.write_rawdata_output(nng, arch, output_basename)

    if enable_debug_db:
        # NOTE(review): the offsets are read back from output_tfl_filename, which is only written above for
        # ".tflite" inputs - confirm the debug database is not expected to work for other input types
        ordered_offsets = sorted(calculate_operator_file_offsets(output_tfl_filename))
        # The n-th smallest offset is assigned to the subgraph whose generated_stream_id is n
        for stream_idx, stream_offset in enumerate(ordered_offsets):
            sg = find_subgraph_with_command_stream_order(nng, stream_idx)
            if sg is None:
                continue
            DebugDatabase.set_stream_offset(sg, stream_offset)
        DebugDatabase.write(output_basename + "_debug.xml", input_name, output_tfl_filename)

    if compiler_options.timing:
        phase_end = time.time()
        print("Compiler driver took %f s" % (phase_end - phase_begin))

    return nng

erik.andersson@arm.com

2021-02-03 10:20:16 +0100

[diff] [blame]

115

def find_subgraph_with_command_stream_order(nng, idx):
    """Return the first subgraph in `nng.subgraphs` whose `generated_stream_id` equals `idx`.

    Returns None when no subgraph matches.
    """
    candidates = (subgraph for subgraph in nng.subgraphs if subgraph.generated_stream_id == idx)
    return next(candidates, None)

def calculate_operator_file_offsets(name: str):
    """Collect one offset per custom operator found in a Vela optimised tflite file.

    For every operator whose operator code has a custom code, the buffer behind
    the operator's first input tensor is looked up and the value returned by the
    FlatBuffers table call `Vector()` for that buffer is recorded.

    Args:
        name: path of the tflite file to read.

    Returns:
        A list with one entry per custom operator, in subgraph and then operator
        order.
    """
    # Read the vela optimized tflite file
    with open(name, "rb") as tflite_file:
        raw_model = bytearray(tflite_file.read())
    model = Model.GetRootAsModel(raw_model, 0)

    # Calculate the file offsets for each custom operator
    file_offsets = []
    # However only one subgraph is supported as of now
    for sg_idx in range(model.SubgraphsLength()):
        sg = model.Subgraphs(sg_idx)
        for op_idx in range(sg.OperatorsLength()):
            operator = sg.Operators(op_idx)
            op_code = model.OperatorCodes(operator.OpcodeIndex())
            if op_code.CustomCode() is None:
                continue
            # Only the first input tensor of the custom operator is inspected
            tensor = sg.Tensors(operator.Inputs(0))
            buffer = model.Buffers(tensor.Buffer())
            table = buffer._tab
            # NOTE(review): 4 is presumably the vtable slot of the buffer's data field, which would make the
            # recorded value the position of that data within the file - confirm against the generated schema
            field_offset = flatbuffers.number_types.UOffsetTFlags.py_type(table.Offset(4))
            file_offsets.append(table.Vector(field_offset))
    return file_offsets

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

142

def print_subgraph_io_summary(nng):
    """Print the sizes of the input and output tensors of every subgraph.

    The subgraphs are visited in reverse order. For each one the size of every
    tensor, the sum of those sizes and the SRAM entry of `memory_used` are
    printed in KiB. The largest per-subgraph sum is printed last.
    """
    print("Subgraph IO Summary")
    print("-------------------")
    print(f"NNG: {nng.name}")

    largest_total = 0
    for sg in reversed(nng.subgraphs):
        print(f" NNG Subgraph: {sg.name} = {sg.placement}")

        # A scratch tensor, when the subgraph has one, is listed between the inputs and the outputs
        if getattr(sg, "scratch_tensor", None) is not None:
            sg_tensors = sg.input_tensors + [sg.scratch_tensor] + sg.output_tensors
        else:
            sg_tensors = sg.input_tensors + sg.output_tensors

        running_total = 0
        for tens in sg_tensors:
            # Anything that is neither an input nor an output (i.e. the scratch tensor) is labelled "In/Out"
            direction = "In" if tens in sg.input_tensors else ("Out" if tens in sg.output_tensors else "In/Out")

            size_kib = tens.elements() * tens.element_size() / 1024.0
            running_total = running_total + size_kib
            print(f" Tensor [{direction}]: {tens.name} = {size_kib} KiB")

        print(f" Total Size = {running_total} KiB")
        print(f" SRAM Memory Used = {sg.memory_used.get(MemArea.Sram, 0) / 1024.0} KiB")
        largest_total = max(running_total, largest_total)

    print(f" Maximum NNG Subgraph Size = {largest_total} KiB")

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

177

178

Alexander Hansson

2466d81

2023-05-17 12:38:46 +0000

[diff] [blame^]

179

def generate_license():
    """Return the Apache-2.0 licence notice as a new list of lines wrapped in an HTML comment.

    A fresh list is built on every call, so callers are free to extend it.
    """
    notice = (
        "Arm Limited and/or its affiliates <open-source-office@arm.com>",
        "",
        "SPDX-License-Identifier: Apache-2.0",
        "",
        "Licensed under the Apache License, Version 2.0 (the License); you may",
        "not use this file except in compliance with the License.",
        "You may obtain a copy of the License at",
        "",
        "www.apache.org/licenses/LICENSE-2.0",
        "",
        "Unless required by applicable law or agreed to in writing, software",
        "distributed under the License is distributed on an AS IS BASIS, WITHOUT",
        "WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.",
        "See the License for the specific language governing permissions and",
        "limitations under the License.",
    )
    # The "<!--" / "-->" pair keeps the notice out of the rendered document
    return ["<!--", *notice, "-->"]

Michael McGeagh

2020-11-10 12:38:25 +0000

[diff] [blame]

203

def generate_supported_ops():
    """Generate the SUPPORTED_OPS.md report in the current working directory.

    The report starts with the licence notice and a short header. For every
    network type that is not excluded it then contains a summary table of the
    supported operators, the generic constraints, and one section per operator
    that has specific constraints. The constraint text is taken from the
    docstring of each constraint function.

    The path of the written file is printed when done.

    Raises:
        ValueError: if a network type is neither TFLite nor TOSA.
    """
    # Exclude network type from generation by adding value to exclude list.
    # To easily exclude NetworkType from generated documentation.
    exclude_generation_network_type_value = [NetworkType.TOSA.value]

    def _exclude_list_names(constraint, exclude_list):
        # Sorted names of the operators exempted from `constraint`, as " - [A, B]", or "" when there are none
        constraints_excluded_names = [
            optype_to_builtintype(op) for op, exclude_constraint in exclude_list if constraint in exclude_constraint
        ]
        return f" - [{', '.join(sorted(constraints_excluded_names))}]" if constraints_excluded_names else ""

    def _constraint_reason(constraint):
        # Markdown needs two spaces at the end of a line to render it as a separate line
        return constraint.__doc__.replace("\n", "  \n")

    lines = generate_license()
    lines += [
        "# Supported Ops",
        "",
        "This file was automatically generated by Vela using the `--supported-ops-report` parameter. ",
        f"Vela version: `{__version__}`",
        "",
        "This file complies with",
        "[**Gitiles Markdown syntax**](https://github.com/google/gitiles/blob/master/Documentation/markdown.md)",
        "",
        "Summary table of constraints for:",
    ]

    # First pass: the list of links to the per network type summary tables
    for network_type in NetworkType:
        if network_type.value in exclude_generation_network_type_value:
            continue

        lines += [
            f"- [{network_type.name}](#{network_type.name.lower()}-summary-table)",
        ]

    # Second pass: the summary table and the constraint sections of each network type
    for network_type in NetworkType:
        if network_type.value in exclude_generation_network_type_value:
            continue

        lines += [
            "",
            f"## {network_type.name} Summary Table",
            "",
        ]
        if network_type == NetworkType.TFLite:
            lines += [
                "The table below contains TFLite operators that can be placed on the Ethos-U NPU. ",
                "If the constraints are not met, then that operator will be scheduled on the CPU instead. ",
                "For any other TFLite operator not listed, will be left untouched and scheduled on the CPU. ",
                "Please check the supported operator list for your chosen runtime for further information.",
                "",
                "| Operator | TFLite Constraints |",
                "| --- | --- |",
            ]
            semantic_checker = TFLiteSemantic()
            supported = TFLiteSupportedOperators()
        elif network_type == NetworkType.TOSA:
            lines += [
                "The table below contains TOSA operators that can be placed on the Ethos-U NPU. ",
                "Note: There is limited support for compiling a TOSA neural network (EXPERIMENTAL). ",
                "The related constraints have not yet been populated in the list.",
                "",
                "| Operator | TOSA Constraints |",
                "| --- | --- |",
            ]
            semantic_checker = TosaSemantic()
            supported = TosaSupportedOperators()
        else:
            raise ValueError(f"Unsupported network type: {network_type}")

        # Operators that have specific constraints and therefore get their own section further down
        op_constraint_links = []
        op_list = sorted(((op, builtin_operator_name_map[op]) for op in builtin_operator_map), key=lambda x: x[1])
        for op, name in op_list:
            internal_op = builtin_operator_map[op][0]
            # NOTE(review): the TFLite operator set is consulted for every network type - confirm this is
            # intended should TOSA ever be removed from the exclude list
            if internal_op in TFLiteSupportedOperators.supported_operators:
                links = f"[Generic](#{network_type.name.lower()}-generic-constraints)"
                if (
                    internal_op in supported.specific_constraints
                    or internal_op in semantic_checker.specific_constraints
                ):
                    links += f", [Specific](#{network_type.name.lower()}-{name.lower()}-constraints)"
                    op_constraint_links.append((internal_op, name))
                lines.append(f"| {name} | {links} |")
        lines += [
            "",
            f"### {network_type.name} Generic Constraints",
            "",
            "This is a list of constraints most NPU operators must satisfy in order to be scheduled on the NPU.",
            "(Operators excluded from certain constraints are shown in brackets [ ] )\n",
        ]
        for constraint in semantic_checker.generic_constraints:
            reason = _constraint_reason(constraint)
            exclude_list = TFLiteSemantic.get_generic_constraint_exclude_list().items()
            lines.append(f"- {reason}{_exclude_list_names(constraint, exclude_list)}")
        for constraint in supported.generic_constraints:
            reason = _constraint_reason(constraint)
            exclude_list = supported.generic_constraints_exceptions.items()
            lines.append(f"- {reason}{_exclude_list_names(constraint, exclude_list)}")
        for op, name in op_constraint_links:
            lines += [
                "",
                f"### {network_type.name} {name} Constraints",
                "",
                f"This is a list of constraints that the {name} operator must satisfy in order to be scheduled on the"
                " NPU.",
                "",
            ]
            # NOTE(review): an operator is listed when either container has an entry for it, yet both are
            # indexed here - presumably both return an empty list for a missing key; confirm
            for constraint in semantic_checker.specific_constraints[op]:
                lines.append(f"- {_constraint_reason(constraint)}")
            for constraint in supported.specific_constraints[op]:
                lines.append(f"- {_constraint_reason(constraint)}")

    # Note. this will generate the file in the CWD
    filepath = os.path.join(os.getcwd(), "SUPPORTED_OPS.md")
    with open(filepath, "wt") as md:
        md.writelines(line + "\n" for line in lines)
        print(f"Report file: {filepath}")

323

324

Rickard Bolin

2022-04-25 11:07:56 +0000

[diff] [blame]

325

def list_config_files():
    """Print every .ini file found exactly one folder below CONFIG_FILES_PATH.

    Each file is printed as a path relative to CONFIG_FILES_PATH.
    """
    print("Available config files:")
    # Number of leading characters to drop: the directory itself plus the separator that follows it
    prefix_length = len(CONFIG_FILES_PATH) + len(os.path.sep)
    ini_pattern = os.path.join(CONFIG_FILES_PATH, "*", "*.ini")
    for ini_file in glob.glob(ini_pattern):
        print(ini_file[prefix_length:])

Rickard Bolin

2022-04-25 11:07:56 +0000

[diff] [blame]

330

331

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

332

def main(args=None):

Henrik G Olsson

2021-03-23 17:34:49 +0100

[diff] [blame]

333

try:

334

if args is None:

335

args = sys.argv[1:]

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

336

Henrik G Olsson

2021-03-23 17:34:49 +0100

[diff] [blame]

337

parser = argparse.ArgumentParser(prog="vela", description="Neural network model compiler for Arm Ethos-U NPUs")

338

parser.add_argument("--version", action="version", version=__version__)

339

parser.add_argument(

340

"--api-version", action="version", version=API_VERSION, help="Displays the version of the external API."

341

)

342

parser.add_argument(

343

"--supported-ops-report",

344

action="store_true",

345

help="Generate the SUPPORTED_OPS.md file in the current working directory and exit",

Tim Hall

b9b515c

2020-11-01 21:27:19 +0000

[diff] [blame]

346

)

Jacob Bohlin

0628a8c

2020-08-28 13:25:14 +0200

[diff] [blame]

347

Rickard Bolin

2022-04-25 11:07:56 +0000

[diff] [blame]

348

parser.add_argument(

349

"--list-config-files",

350

action="store_true",

351

help=(

352

"Display all available configurations in the `config_files` folder and exit. To select config file, "

353

"use the --config argument with one of the listed config files (For example: --config Arm/vela.ini )"

),

)

Henrik G Olsson

2021-03-23 17:34:49 +0100

[diff] [blame]

357

# set network nargs to be optional to allow the support-ops-report CLI option to be used standalone

parser.add_argument(

"network",

metavar="NETWORK",

type=str,

default=None,

nargs="?",

help="Filename of the input TensorFlow Lite for Microcontrollers network",

365

)

366

parser.add_argument(

367

"--output-dir", type=str, default="output", help="Output directory to write files to (default: %(default)s)"

)

parser.add_argument(

"--enable-debug-db",

action="store_true",

default=None,

help="Enables the calculation and writing of a network debug database to output directory",

)

parser.add_argument(

"--config",

type=str,

action="append",

help="Vela configuration file(s) in Python ConfigParser .ini file format",

380

)

381

parser.add_argument("--verbose-all", action="store_true", help="Enable all verbose options")

382

parser.add_argument(

383

"--verbose-config", action="store_true", help="Verbose system configuration and memory mode"

384

)

385

parser.add_argument("--verbose-graph", action="store_true", help="Verbose graph rewriter")

386

parser.add_argument("--verbose-quantization", action="store_true", help="Verbose quantization")

387

parser.add_argument("--verbose-packing", action="store_true", help="Verbose pass packing")

388

parser.add_argument("--verbose-tensor-purpose", action="store_true", help="Verbose tensor purpose")

389

parser.add_argument("--verbose-tensor-format", action="store_true", help="Verbose tensor format")

390

parser.add_argument("--verbose-schedule", action="store_true", help="Verbose schedule")

Henrik G Olsson

2021-03-23 17:34:49 +0100

[diff] [blame]

391

parser.add_argument("--verbose-allocation", action="store_true", help="Verbose tensor allocation")

392

parser.add_argument(

393

"--verbose-high-level-command-stream", action="store_true", help="Verbose high level command stream"

394

)

395

parser.add_argument(

396

"--verbose-register-command-stream", action="store_true", help="Verbose register command stream"

397

)

398

parser.add_argument("--verbose-operators", action="store_true", help="Verbose operator list")

Fredrik Svedberg

f5c07c4

2021-04-23 14:36:42 +0200

[diff] [blame]

399

parser.add_argument("--verbose-weights", action="store_true", help="Verbose weights information")

Tim Hall

c1be087

2022-03-03 17:50:52 +0000

[diff] [blame]

400

parser.add_argument("--verbose-performance", action="store_true", help="Verbose performance information")

Raul Farkas

1c54ac1

2023-04-26 07:49:15 +0100

[diff] [blame]

401

parser.add_argument("--verbose-progress", action="store_true", help="Verbose progress information")

Henrik G Olsson

2021-03-23 17:34:49 +0100

[diff] [blame]

402

parser.add_argument(

403

"--show-cpu-operations", action="store_true", help="Show the operations that fall back to the CPU"

404

)

Henrik G Olsson

2021-03-23 17:34:49 +0100

[diff] [blame]

405

parser.add_argument("--timing", action="store_true", help="Time the compiler doing operations")

406

parser.add_argument(

wilisa01

46c9477

2023-02-08 09:56:14 +0000

[diff] [blame]

407

"--force-symmetric-int-weights",

408

action="store_true",

409

help="Forces all zero points to 0 for signed integer weights",

410

)

411

parser.add_argument(

Henrik G Olsson

2021-03-23 17:34:49 +0100

[diff] [blame]

412

"--accelerator-config",

413

type=str,

414

default="ethos-u55-256",

415

choices=list(architecture_features.Accelerator.member_list()),

416

help="Accelerator configuration to use (default: %(default)s)",

)

parser.add_argument(

"--system-config",

type=str,

default=architecture_features.ArchitectureFeatures.DEFAULT_CONFIG,

422

help="System configuration to select from the Vela configuration file (default: %(default)s)",

)

parser.add_argument(

"--memory-mode",

type=str,

default=architecture_features.ArchitectureFeatures.DEFAULT_CONFIG,

428

help="Memory mode to select from the Vela configuration file (default: %(default)s)",

429

)

430

parser.add_argument(

431

"--tensor-allocator",

432

default=TensorAllocator.HillClimb,

433

type=lambda s: TensorAllocator[s],

434

choices=list(TensorAllocator),

435

help="Tensor Allocator algorithm (default: %(default)s)",

436

)

437

parser.add_argument(

438

"--show-subgraph-io-summary",

439

action="store_true",

440

help="Shows a summary of all the subgraphs and their inputs and outputs",

441

)

442

parser.add_argument(

Henrik G Olsson

2021-03-23 17:34:49 +0100

[diff] [blame]

443

"--max-block-dependency",

444

type=int,

445

default=architecture_features.ArchitectureFeatures.MAX_BLOCKDEP,

446

choices=range(0, architecture_features.ArchitectureFeatures.MAX_BLOCKDEP + 1),

447

help=(

448

"Set the maximum value that can be used for the block dependency between npu kernel operations"

449

" (default: %(default)s)"

450

),

451

)

452

parser.add_argument(

Tim Hall

2021-05-27 18:49:40 +0100

[diff] [blame]

453

"--optimise",

454

type=lambda s: scheduler.OptimizationStrategy[s],

455

default=scheduler.OptimizationStrategy.Performance,

456

choices=list(scheduler.OptimizationStrategy),

457

help=(

458

"Set the optimisation strategy. The Size strategy results in minimal SRAM usage (does not use"

459

" arena-cache-size). The Performance strategy results in maximal performance (uses the arena-cache-size"

460

" if specified) (default: %(default)s)"

461

),

Henrik G Olsson

2021-03-23 17:34:49 +0100

[diff] [blame]

462

)

463

parser.add_argument(

Tim Hall

2021-05-27 18:49:40 +0100

[diff] [blame]

464

"--arena-cache-size",

465

type=int,

466

help=(

467

"Set the size of the arena cache memory area, in bytes. If specified, this option overrides the memory"

468

" mode attribute with the same name in a Vela configuration file"

469

),

Henrik G Olsson

2021-03-23 17:34:49 +0100

[diff] [blame]

470

)

471

parser.add_argument(

472

"--cpu-tensor-alignment",

473

type=int,

474

default=Tensor.AllocationQuantum,

475

help=(

476

"Controls the allocation byte alignment of cpu tensors including Ethos-U Custom"

477

" operator inputs and outputs (default: %(default)s)"

478

),

479

)

Dwight Lidman

b9c9542

2021-08-18 19:24:14 +0200

[diff] [blame]

parser.add_argument(

"--recursion-limit",

type=int,

default=1000,

help="Set the recursion depth limit, may result in RecursionError if too low (default: %(default)s)",

485

)

Tim Hall

cda4fcb

2022-05-19 12:36:58 +0100

[diff] [blame]

486

parser.add_argument(

487

"--hillclimb-max-iterations",

488

type=int,

489

default=HillClimbAllocator.MAX_ITERATIONS,

490

help=(

491

"Set the maximum number of iterations the Hill Climb tensor allocator will run (default: %(default)s)"

492

),

493

)

Henrik G Olsson

2021-03-23 17:34:49 +0100

[diff] [blame]

494

args = parser.parse_args(args=args)

Louis Verhaard

5207830

2020-11-18 13:35:06 +0100

[diff] [blame]

495

Henrik G Olsson

2021-03-23 17:34:49 +0100

[diff] [blame]

496

# Generate the supported ops report and exit

497

if args.supported_ops_report:

498

generate_supported_ops()

499

return 0

Louis Verhaard

5207830

2020-11-18 13:35:06 +0100

[diff] [blame]

500

Rickard Bolin

2022-04-25 11:07:56 +0000

[diff] [blame]

501

if args.list_config_files:

list_config_files()

return 0

Henrik G Olsson

2021-03-23 17:34:49 +0100

[diff] [blame]

505

if args.network is None:

506

parser.error("the following argument is required: NETWORK")

Michael McGeagh

2fa40ae

2020-12-02 10:55:04 +0000

[diff] [blame]

507

Rickard Bolin

2022-04-25 11:07:56 +0000

[diff] [blame]

508

def _parse_config(config):

Rickard Bolin

7ce6b32

2022-06-02 09:30:33 +0000

[diff] [blame]

509

# Make sure the correct separator is used depending on OS

510

config = os.path.normpath(config)

511

Rickard Bolin

2022-04-25 11:07:56 +0000

[diff] [blame]

512

if not config.endswith(".ini"):

513

raise InputFileError(config, "Configuration files must use the .ini extension")

514

Rickard Bolin

6d7a4f0

2022-05-24 14:17:58 +0000

[diff] [blame]

515

if (

516

len(config.split(os.path.sep)) == 2

517

and not config.startswith(os.path.sep)

518

and not config.startswith(".")

519

and not config.startswith("~")

520

):

Rickard Bolin

2022-04-25 11:07:56 +0000

[diff] [blame]

521

config_path = os.path.join(CONFIG_FILES_PATH, config)

522

else:

Rickard Bolin

6d7a4f0

2022-05-24 14:17:58 +0000

[diff] [blame]

523

# Check if the configuration file is correctly placed inside the config_files directory

524

if os.access(os.path.join(CONFIG_FILES_PATH, *config.split(os.path.sep)[-2:]), os.R_OK):

525

rel_path = os.path.join(*config.split(os.path.sep)[-2:])

526

print(

527

f"Warning: Consider accessing the configuration by --config {rel_path} since it is located "

528

"inside the config_files directory."

529

)

Rickard Bolin

2022-04-25 11:07:56 +0000

[diff] [blame]

530

config_path = config

531

532

if not os.access(config_path, os.R_OK):

Rickard Bolin

6d7a4f0

2022-05-24 14:17:58 +0000

[diff] [blame]

533

raise InputFileError(

534

config_path,

535

"File not found or is not readable. The configuration file is either not located in a folder "

536

"directly under the `config_files` directory or its path has not been provided correctly.",

537

)

Rickard Bolin

2022-04-25 11:07:56 +0000

[diff] [blame]

return config_path

Henrik G Olsson

2021-03-23 17:34:49 +0100

[diff] [blame]

541

# check all config files exist because they will be read as a group

Rickard Bolin

2022-04-25 11:07:56 +0000

[diff] [blame]

542

config_files = [_parse_config(cfg) for cfg in args.config] if args.config else None

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

543

Henrik G Olsson

2021-03-23 17:34:49 +0100

[diff] [blame]

544

if args.cpu_tensor_alignment < 16 or args.cpu_tensor_alignment & (args.cpu_tensor_alignment - 1) != 0:

545

parser.error(

546

"Invalid argument to --cpu-tensor-alignment = {} (must be greater than or equal to 16 and a power of 2)"

547

"".format(args.cpu_tensor_alignment)

548

)

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

549

Henrik G Olsson

2021-03-23 17:34:49 +0100

[diff] [blame]

550

if args.system_config == ArchitectureFeatures.DEFAULT_CONFIG:

551

print(f"Warning: Using {ArchitectureFeatures.DEFAULT_CONFIG} values for system configuration")

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

552

Henrik G Olsson

2021-03-23 17:34:49 +0100

[diff] [blame]

553

if args.memory_mode == ArchitectureFeatures.DEFAULT_CONFIG:

554

print(f"Warning: Using {ArchitectureFeatures.DEFAULT_CONFIG} values for memory mode")

Tim Hall

2020-04-27 18:20:16 +0100

[diff] [blame]

555

Henrik G Olsson

2021-03-23 17:34:49 +0100

[diff] [blame]

556

if args.verbose_all:

557

for v in vars(args):

558

if v.startswith("verbose") and v != "verbose_all":

559

setattr(args, v, True)

560

Dwight Lidman

b9c9542

2021-08-18 19:24:14 +0200

[diff] [blame]

561

sys.setrecursionlimit(args.recursion_limit)

562

Henrik G Olsson

2021-03-23 17:34:49 +0100

[diff] [blame]

563

arch = architecture_features.ArchitectureFeatures(

Rickard Bolin

2022-04-25 11:07:56 +0000

[diff] [blame]

564

vela_config_files=config_files,

Henrik G Olsson

2021-03-23 17:34:49 +0100

[diff] [blame]

565

system_config=args.system_config,

566

memory_mode=args.memory_mode,

567

accelerator_config=args.accelerator_config,

Henrik G Olsson

2021-03-23 17:34:49 +0100

[diff] [blame]

568

max_blockdep=args.max_block_dependency,

Henrik G Olsson

2021-03-23 17:34:49 +0100

[diff] [blame]

569

verbose_config=args.verbose_config,

Tim Hall

2021-05-27 18:49:40 +0100

[diff] [blame]

570

arena_cache_size=args.arena_cache_size,

Henrik G Olsson

2021-03-23 17:34:49 +0100

[diff] [blame]

571

)

572

573

compiler_options = compiler_driver.CompilerOptions(

574

verbose_graph=args.verbose_graph,

575

verbose_quantization=args.verbose_quantization,

576

verbose_packing=args.verbose_packing,

577

verbose_tensor_purpose=args.verbose_tensor_purpose,

578

verbose_tensor_format=args.verbose_tensor_format,

579

verbose_allocation=args.verbose_allocation,

580

verbose_high_level_command_stream=args.verbose_high_level_command_stream,

581

verbose_register_command_stream=args.verbose_register_command_stream,

582

verbose_operators=args.verbose_operators,

Fredrik Svedberg

f5c07c4

2021-04-23 14:36:42 +0200

[diff] [blame]

583

verbose_weights=args.verbose_weights,

Tim Hall

c1be087

2022-03-03 17:50:52 +0000

[diff] [blame]

584

verbose_performance=args.verbose_performance,

Raul Farkas

1c54ac1

2023-04-26 07:49:15 +0100

[diff] [blame]

585

verbose_progress=args.verbose_progress,

Henrik G Olsson

2021-03-23 17:34:49 +0100

[diff] [blame]

586

show_cpu_operations=args.show_cpu_operations,

587

tensor_allocator=args.tensor_allocator,

588

timing=args.timing,

wilisa01

46c9477

2023-02-08 09:56:14 +0000

[diff] [blame]

589

force_symmetric_int_weights=args.force_symmetric_int_weights,

Henrik G Olsson

2021-03-23 17:34:49 +0100

[diff] [blame]

590

output_dir=args.output_dir,

591

cpu_tensor_alignment=args.cpu_tensor_alignment,

Tim Hall

cda4fcb

2022-05-19 12:36:58 +0100

[diff] [blame]

592

hillclimb_max_iterations=args.hillclimb_max_iterations,

Henrik G Olsson

2021-03-23 17:34:49 +0100

[diff] [blame]

593

)

594

595

scheduler_options = scheduler.SchedulerOptions(

Tim Hall

2021-05-27 18:49:40 +0100

[diff] [blame]

596

optimization_strategy=args.optimise,

597

sram_target=arch.arena_cache_size,

Henrik G Olsson

2021-03-23 17:34:49 +0100

[diff] [blame]

598

verbose_schedule=args.verbose_schedule,

Raul Farkas

1c54ac1

2023-04-26 07:49:15 +0100

[diff] [blame]

599

verbose_progress=args.verbose_progress,

Henrik G Olsson