blob: c0ee8222d319e0c6eeaa57f5141615a999cb0a4f [file] [log] [blame]
Jonathan Strandbergd2afc512021-03-19 10:31:18 +01001#!/usr/bin/env python3
2
3#
4# Copyright (c) 2021 Arm Limited. All rights reserved.
5#
6# SPDX-License-Identifier: Apache-2.0
7#
8# Licensed under the Apache License, Version 2.0 (the License); you may
9# not use this file except in compliance with the License.
10# You may obtain a copy of the License at
11#
12# www.apache.org/licenses/LICENSE-2.0
13#
14# Unless required by applicable law or agreed to in writing, software
15# distributed under the License is distributed on an AS IS BASIS, WITHOUT
16# WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
17# See the License for the specific language governing permissions and
18# limitations under the License.
19#
20
21import argparse
22import multiprocessing
23import numpy
24import os
25import pathlib
26import re
27import shutil
28import subprocess
29import sys
30
31os.environ['TF_CPP_MIN_LOG_LEVEL'] = '3'
Kristofer Jonssonffbd8e72021-06-15 17:51:58 +020032from tensorflow.lite.python.interpreter import Interpreter, OpResolverType
Jonathan Strandbergd2afc512021-03-19 10:31:18 +010033
# Directory one level above the folder that contains this script (resolved to
# an absolute path); used as the base for the targets/ and cmake/toolchain/
# lookups when configuring the build.
CORE_PLATFORM_PATH = pathlib.Path(__file__).resolve().parents[1]
35
def run_cmd(cmd, **kwargs):
    """Echo a command line and execute it, failing on a non-zero exit.

    Args:
        cmd: Sequence of command arguments; entries may be strings or
            pathlib.Path objects.
        **kwargs: Extra keyword arguments forwarded to subprocess.run.

    Returns:
        The subprocess.CompletedProcess produced by subprocess.run.

    Raises:
        subprocess.CalledProcessError: If the command exits with a non-zero
            status (check=True is always passed).
    """
    # Arguments may be pathlib.Path objects, so stringify them for display
    printable = " ".join(map(str, cmd))
    print(f"Running command: {printable}")
    return subprocess.run(cmd, check=True, **kwargs)
41
Nir Ekhauz4756bf12021-06-27 11:20:24 +030042
def build_core_platform(output_folder, target, toolchain, pmu):
    """Configure the target with CMake and build ``baremetal_custom`` with make.

    Args:
        output_folder: pathlib.Path of the folder holding the generated files.
            The build tree is placed in ``<output_folder>/model/build`` and the
            folder itself is passed to CMake as ``BAREMETAL_PATH``.
        target: Name of a directory below ``CORE_PLATFORM_PATH/targets``.
        toolchain: Base name (without ``.cmake``) of a toolchain file below
            ``CORE_PLATFORM_PATH/cmake/toolchain``.
        pmu: Up to four PMU event numbers, or None when none were requested.
            Slots that are not supplied are passed to CMake as 0.

    Raises:
        ValueError: If more than four PMU events are supplied.
        subprocess.CalledProcessError: If cmake or make fails.
    """
    max_events = 4

    # argparse's "append" action leaves the value as None when the option is
    # never given, so treat None the same as an empty list.
    events = list(pmu) if pmu is not None else []
    if len(events) > max_events:
        raise ValueError(
            f"At most {max_events} PMU events are supported, got {len(events)}")
    # Pad the unused event slots with 0
    events += [0] * (max_events - len(events))

    build_folder = output_folder/"model"/"build"
    toolchain_file = CORE_PLATFORM_PATH/"cmake"/"toolchain"/(toolchain + ".cmake")
    cmake_cmd = ["cmake",
                 CORE_PLATFORM_PATH/"targets"/target,
                 f"-B{build_folder}",
                 f"-DCMAKE_TOOLCHAIN_FILE={toolchain_file}",
                 f"-DBAREMETAL_PATH={output_folder}"]
    cmake_cmd += [f"-DETHOSU_PMU_EVENT_{idx}={event}"
                  for idx, event in enumerate(events)]
    run_cmd(cmake_cmd)

    make_cmd = ["make", "-C", build_folder, f"-j{multiprocessing.cpu_count()}", "baremetal_custom"]
    run_cmd(make_cmd)
62
def generate_reference_data(output_folder, non_optimized_model_path, input_path, expected_output_path):
    """Produce reference input/output data for the network as .bin and .h files.

    Only the first input tensor and the first output tensor of the model are
    considered.

    Args:
        output_folder: Folder (str or pathlib.Path) that receives
            ``ref_input.bin``, ``ref_output.bin``, ``input.h`` and ``output.h``.
        non_optimized_model_path: pathlib.Path to the .tflite model that is
            loaded into the reference interpreter.
        input_path: Path to a file loadable with numpy.load holding the input
            data, or None to generate random input matching the dtype and
            shape of the model's first input.
        expected_output_path: Path to a file loadable with numpy.load holding
            the expected output, or None to compute it by invoking the
            interpreter on the input data.
    """
    # Normalise up front so that every path join below also works when the
    # caller hands in a plain string.
    output_folder = pathlib.Path(output_folder)

    interpreter = Interpreter(model_path=str(non_optimized_model_path.resolve()),
                              experimental_op_resolver_type=OpResolverType.BUILTIN_REF)
    interpreter.allocate_tensors()
    input_detail = interpreter.get_input_details()[0]
    output_detail = interpreter.get_output_details()[0]

    if input_path is None:
        # Randomly generate input data
        dtype = input_detail["dtype"]
        shape = tuple(int(dim) for dim in input_detail["shape"])
        rng = numpy.random.default_rng()
        # Compare by equality: an identity check would miss an equivalent
        # numpy.dtype instance.
        if dtype == numpy.float32:
            input_data = rng.random(size=shape, dtype=numpy.float32)
        else:
            limits = numpy.iinfo(dtype)
            # endpoint=True makes the upper bound inclusive, so the largest
            # representable value can be drawn as well.
            input_data = rng.integers(low=limits.min, high=limits.max, size=shape,
                                      dtype=dtype, endpoint=True)
    else:
        # Load user provided input data
        input_data = numpy.load(input_path)

    if expected_output_path is None:
        # Run the network with input_data to get reference output
        interpreter.set_tensor(input_detail["index"], input_data)
        interpreter.invoke()
        output_data = interpreter.get_tensor(output_detail["index"])
    else:
        # Load user provided output data
        output_data = numpy.load(expected_output_path)

    network_input_path = output_folder/"ref_input.bin"
    network_output_path = output_folder/"ref_output.bin"
    network_input_path.write_bytes(input_data.tobytes())
    network_output_path.write_bytes(output_data.tobytes())

    dump_c_header(network_input_path, output_folder/"input.h", "inputData", "input_data_sec", 4)
    dump_c_header(network_output_path, output_folder/"output.h", "expectedOutputData", "expected_output_data_sec", 4)
104
def dump_c_header(input_path, output_path, array_name, section, alignment, extra_data=""):
    """Write the bytes of a binary file as a ``uint8_t`` C array definition.

    The array is emitted with 12 byte literals per row and carries a GCC-style
    ``section``/``aligned`` attribute.

    Args:
        input_path: Path of the binary file to convert.
        output_path: Path of the C header to write (overwritten if present).
        array_name: Identifier of the generated array.
        section: Linker section name placed in the ``section`` attribute.
        alignment: Value placed in the ``aligned`` attribute.
        extra_data: Text written verbatim before the array definition.

    Raises:
        ValueError: If the input file is empty; no output file is written.
    """
    with open(input_path, "rb") as fp:
        payload = fp.read()

    # An empty file would yield an array without elements; fail with a clear
    # message instead of an IndexError further down.
    if not payload:
        raise ValueError(f"Cannot generate C array '{array_name}': '{input_path}' is empty")

    bytes_per_row = 12
    final_idx = len(payload) - 1

    def render(idx, value):
        # Rows start with a space, every element but the last is followed by a
        # comma, and a row is closed with a newline after 12 elements.
        indent = " " if idx % bytes_per_row == 0 else ""
        comma = "," if idx != final_idx else ""
        ending = "\n" if (idx + 1) % bytes_per_row == 0 else " "
        return f"{indent}0x{value:02x}{comma}{ending}"

    body = "".join(render(idx, value) for idx, value in enumerate(payload))
    header = f"uint8_t {array_name}[] __attribute__((section(\"{section}\"), aligned({alignment}))) = {{\n"

    with open(output_path, "w") as carray:
        carray.write(extra_data)
        carray.write(header)
        carray.write(body)
        carray.write("\n};\n")
126
def optimize_network(output_folder, network_path, accelerator_conf):
    """Run vela on the network and dump the optimized model as ``model.h``.

    Args:
        output_folder: pathlib.Path passed to vela as ``--output-dir``; also
            the folder where ``model.h`` is written.
        network_path: pathlib.Path of the .tflite file to optimize.
        accelerator_conf: Value passed to vela as ``--accelerator-config``.

    Raises:
        subprocess.CalledProcessError: If the vela command fails.
    """
    run_cmd(["vela",
             network_path,
             "--output-dir", output_folder,
             "--accelerator-config", accelerator_conf])

    # The optimized model is read from "<stem>_vela.tflite" in the output folder
    model_name = network_path.stem
    vela_model = output_folder/f"{model_name}_vela.tflite"
    name_decl = f"const char *modelName=\"{model_name}\";\n"
    dump_c_header(vela_model,
                  output_folder/"model.h",
                  "networkModelData",
                  "network_model_sec",
                  16,
                  extra_data=name_decl)
136
def run_model(output_folder):
    """Run the ``baremetal_custom`` test verbosely with ctest.

    Args:
        output_folder: pathlib.Path whose ``model/build`` subfolder is used as
            the working directory for ctest.

    Raises:
        subprocess.CalledProcessError: If ctest exits with a non-zero status.
    """
    ctest_cmd = ["ctest", "-V", "-R", "^baremetal_custom$"]
    run_cmd(ctest_cmd, cwd=output_folder/"model"/"build")
141
def main():
    """Parse the command line, then optimize, build and run the network.

    The steps are: optimize the network with vela, generate reference
    input/output data, build the platform and run the resulting test.

    Returns:
        0 on success, 1 if any of the external commands failed.
    """
    # Maps a target name to the accelerator configuration handed to vela
    target_mapping = {
        "corstone-300": "ethos-u55-128"
    }
    max_pmu_events = 4

    parser = argparse.ArgumentParser()
    parser.add_argument("-o", "--output-folder", type=pathlib.Path, default="output", help="Output folder for build and generated files")
    parser.add_argument("--pmu", type=int, action='append', help="PMU Event Counters")
    parser.add_argument("--network-path", type=pathlib.Path, required=True, help="Path to .tflite file")
    parser.add_argument("--target", choices=target_mapping, default="corstone-300", help="Configure target")
    parser.add_argument("--toolchain", choices=["armclang", "arm-none-eabi-gcc"], default="armclang", help="Configure toolchain")
    parser.add_argument("--custom-input", type=pathlib.Path, help="Custom input to network")
    parser.add_argument("--custom-output", type=pathlib.Path, help="Custom expected output data for network")

    args = parser.parse_args()

    # The "append" action yields None when --pmu is never given
    pmu_events = args.pmu or []
    if len(pmu_events) > max_pmu_events:
        # Reject this before any of the long-running steps are started
        parser.error(f"--pmu may be given at most {max_pmu_events} times")

    # parents=True lets the user point at a nested folder that does not exist yet
    args.output_folder.mkdir(parents=True, exist_ok=True)

    try:
        optimize_network(args.output_folder, args.network_path, target_mapping[args.target])
        generate_reference_data(args.output_folder, args.network_path, args.custom_input, args.custom_output)
        build_core_platform(args.output_folder, args.target, args.toolchain, pmu_events)
        run_model(args.output_folder)
    except subprocess.CalledProcessError as err:
        print(f"Command: '{err.cmd}' failed", file=sys.stderr)
        return 1
    return 0
167
# Script entry point: the return value of main() becomes the process exit status
if __name__ == "__main__":
    raise SystemExit(main())