blob: 7edd1822aecbe89ab3c6e64e6a0a2bc38dec8e02 [file] [log] [blame]
Giorgio Arenaa66eaa22017-12-21 19:50:06 +00001/*
2 * Copyright (c) 2017-2018 ARM Limited.
3 *
4 * SPDX-License-Identifier: MIT
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a copy
7 * of this software and associated documentation files (the "Software"), to
8 * deal in the Software without restriction, including without limitation the
9 * rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
10 * sell copies of the Software, and to permit persons to whom the Software is
11 * furnished to do so, subject to the following conditions:
12 *
13 * The above copyright notice and this permission notice shall be included in all
14 * copies or substantial portions of the Software.
15 *
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
19 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
21 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
22 * SOFTWARE.
23 */
Georgios Pinitasd9eb2752018-04-03 13:44:29 +010024#include "arm_compute/graph.h"
Giorgio Arenaa66eaa22017-12-21 19:50:06 +000025#include "support/ToolchainSupport.h"
26#include "utils/GraphUtils.h"
27#include "utils/Utils.h"
28
Georgios Pinitasd9eb2752018-04-03 13:44:29 +010029#include <cstdlib>
30
Giorgio Arenabb54e4e2018-04-05 17:20:34 +010031using namespace arm_compute;
Georgios Pinitasd9eb2752018-04-03 13:44:29 +010032using namespace arm_compute::utils;
33using namespace arm_compute::graph::frontend;
Giorgio Arenaa66eaa22017-12-21 19:50:06 +000034using namespace arm_compute::graph_utils;
35
36/** Example demonstrating how to implement QASYMM8 MobileNet's network using the Compute Library's graph API
37 *
38 * @param[in] argc Number of arguments
Michele Di Giorgioe3fba0a2018-02-14 14:18:01 +000039 * @param[in] argv Arguments ( [optional] Target (0 = NEON, 1 = OpenCL, 2 = OpenCL with Tuner), [optional] Path to the weights folder, [optional] npy_input, [optional] labels )
Giorgio Arenaa66eaa22017-12-21 19:50:06 +000040 */
Georgios Pinitasd9eb2752018-04-03 13:44:29 +010041class GraphMobileNetQASYMM8Example : public Example
Giorgio Arenaa66eaa22017-12-21 19:50:06 +000042{
43public:
44 void do_setup(int argc, char **argv) override
45 {
46 std::string data_path; /* Path to the trainable data */
47 std::string input; /* Image data */
48 std::string label; /* Label data */
49
50 // Quantization info taken from the AndroidNN QASYMM8 MobileNet example
51 const QuantizationInfo in_quant_info = QuantizationInfo(0.0078125f, 128);
52 const QuantizationInfo mid_quant_info = QuantizationInfo(0.0784313753247f, 128);
53
54 const std::vector<QuantizationInfo> conv_weights_quant_info =
55 {
56 QuantizationInfo(0.031778190285f, 156), // conv0
57 QuantizationInfo(0.00604454148561f, 66) // conv14
58 };
59
60 const std::vector<QuantizationInfo> depth_weights_quant_info =
61 {
62 QuantizationInfo(0.254282623529f, 129), // dwsc1
63 QuantizationInfo(0.12828284502f, 172), // dwsc2
64 QuantizationInfo(0.265911251307f, 83), // dwsc3
65 QuantizationInfo(0.0985597148538f, 30), // dwsc4
66 QuantizationInfo(0.0631204470992f, 54), // dwsc5
67 QuantizationInfo(0.0137207424268f, 141), // dwsc6
68 QuantizationInfo(0.0817828401923f, 125), // dwsc7
69 QuantizationInfo(0.0393880493939f, 164), // dwsc8
70 QuantizationInfo(0.211694166064f, 129), // dwsc9
71 QuantizationInfo(0.158015936613f, 103), // dwsc10
72 QuantizationInfo(0.0182712618262f, 137), // dwsc11
73 QuantizationInfo(0.0127998134121f, 134), // dwsc12
74 QuantizationInfo(0.299285322428f, 161) // dwsc13
75 };
76
77 const std::vector<QuantizationInfo> point_weights_quant_info =
78 {
79 QuantizationInfo(0.0425766184926f, 129), // dwsc1
80 QuantizationInfo(0.0250773020089f, 94), // dwsc2
81 QuantizationInfo(0.015851572156f, 93), // dwsc3
82 QuantizationInfo(0.0167811904103f, 98), // dwsc4
83 QuantizationInfo(0.00951790809631f, 135), // dwsc5
84 QuantizationInfo(0.00999817531556f, 128), // dwsc6
85 QuantizationInfo(0.00590536883101f, 126), // dwsc7
86 QuantizationInfo(0.00576109671965f, 133), // dwsc8
87 QuantizationInfo(0.00830461271107f, 142), // dwsc9
88 QuantizationInfo(0.0152327232063f, 72), // dwsc10
89 QuantizationInfo(0.00741417845711f, 125), // dwsc11
90 QuantizationInfo(0.0135628981516f, 142), // dwsc12
91 QuantizationInfo(0.0338749065995f, 140) // dwsc13
92 };
93
Michele Di Giorgioe3fba0a2018-02-14 14:18:01 +000094 // Set target. 0 (NEON), 1 (OpenCL), 2 (OpenCL with Tuner). By default it is NEON
Giorgio Arenabb54e4e2018-04-05 17:20:34 +010095 const int target = argc > 1 ? std::strtol(argv[1], nullptr, 10) : 0;
96 Target target_hint = set_target_hint(target);
Michele Di Giorgioe3fba0a2018-02-14 14:18:01 +000097
Giorgio Arenaa66eaa22017-12-21 19:50:06 +000098 // Parse arguments
99 if(argc < 2)
100 {
101 // Print help
Michele Di Giorgioe3fba0a2018-02-14 14:18:01 +0000102 std::cout << "Usage: " << argv[0] << " [target] [path_to_data] [npy_input] [labels]\n\n";
Giorgio Arenaa66eaa22017-12-21 19:50:06 +0000103 std::cout << "No data folder provided: using random values\n\n";
104 }
105 else if(argc == 2)
106 {
Michele Di Giorgioe3fba0a2018-02-14 14:18:01 +0000107 std::cout << "Usage: " << argv[0] << " " << argv[1] << " [path_to_data] [npy_input] [labels]\n\n";
Giorgio Arenaa66eaa22017-12-21 19:50:06 +0000108 std::cout << "No input provided: using random values\n\n";
109 }
Michele Di Giorgioe3fba0a2018-02-14 14:18:01 +0000110 else if(argc == 4)
Giorgio Arenaa66eaa22017-12-21 19:50:06 +0000111 {
Michele Di Giorgioe3fba0a2018-02-14 14:18:01 +0000112 data_path = argv[2];
113 input = argv[3];
114 std::cout << "Usage: " << argv[0] << " " << argv[1] << " " << argv[2] << " " << argv[3] << " [labels]\n\n";
Giorgio Arenaa66eaa22017-12-21 19:50:06 +0000115 std::cout << "No text file with labels provided: skipping output accessor\n\n";
116 }
117 else
118 {
Michele Di Giorgioe3fba0a2018-02-14 14:18:01 +0000119 data_path = argv[2];
120 input = argv[3];
121 label = argv[4];
Giorgio Arenaa66eaa22017-12-21 19:50:06 +0000122 }
123
Michele Di Giorgioe3fba0a2018-02-14 14:18:01 +0000124 graph << target_hint
Giorgio Arenabb54e4e2018-04-05 17:20:34 +0100125 << DepthwiseConvolutionMethod::OPTIMIZED_3x3 // FIXME(COMPMID-1073): Add heuristics to automatically call the optimized 3x3 method
126 << InputLayer(TensorDescriptor(TensorShape(224U, 224U, 3U, 1U), DataType::QASYMM8, in_quant_info),
127 get_weights_accessor(data_path, "/cnn_data/mobilenet_qasymm8_model/" + input))
Giorgio Arenaa66eaa22017-12-21 19:50:06 +0000128 << ConvolutionLayer(
129 3U, 3U, 32U,
130 get_weights_accessor(data_path, "/cnn_data/mobilenet_qasymm8_model/Conv2d_0_weights.npy"),
131 get_weights_accessor(data_path, "/cnn_data/mobilenet_qasymm8_model/Conv2d_0_bias.npy"),
132 PadStrideInfo(2U, 2U, 0U, 1U, 0U, 1U, DimensionRoundingType::FLOOR),
Giorgio Arenabb54e4e2018-04-05 17:20:34 +0100133 1, conv_weights_quant_info.at(0), mid_quant_info)
134 << ActivationLayer(ActivationLayerInfo(ActivationLayerInfo::ActivationFunction::LU_BOUNDED_RELU, 6.f));
135 graph << get_dwsc_node(data_path, "Conv2d_1", 64U, PadStrideInfo(1U, 1U, 1U, 1U), PadStrideInfo(1U, 1U, 0U, 0U), depth_weights_quant_info.at(0), point_weights_quant_info.at(0));
136 graph << get_dwsc_node(data_path, "Conv2d_2", 128U, PadStrideInfo(2U, 2U, 0U, 1U, 0U, 1U, DimensionRoundingType::FLOOR), PadStrideInfo(1U, 1U, 0U, 0U), depth_weights_quant_info.at(1),
137 point_weights_quant_info.at(1));
138 graph << get_dwsc_node(data_path, "Conv2d_3", 128U, PadStrideInfo(1U, 1U, 1U, 1U, 1U, 1U, DimensionRoundingType::FLOOR), PadStrideInfo(1U, 1U, 0U, 0U), depth_weights_quant_info.at(2),
139 point_weights_quant_info.at(2));
140 graph << get_dwsc_node(data_path, "Conv2d_4", 256U, PadStrideInfo(2U, 2U, 0U, 1U, 0U, 1U, DimensionRoundingType::FLOOR), PadStrideInfo(1U, 1U, 0U, 0U), depth_weights_quant_info.at(3),
141 point_weights_quant_info.at(3));
142 graph << get_dwsc_node(data_path, "Conv2d_5", 256U, PadStrideInfo(1U, 1U, 1U, 1U, 1U, 1U, DimensionRoundingType::FLOOR), PadStrideInfo(1U, 1U, 0U, 0U), depth_weights_quant_info.at(4),
143 point_weights_quant_info.at(4));
144 graph << get_dwsc_node(data_path, "Conv2d_6", 512U, PadStrideInfo(2U, 2U, 0U, 1U, 0U, 1U, DimensionRoundingType::FLOOR), PadStrideInfo(1U, 1U, 0U, 0U), depth_weights_quant_info.at(5),
145 point_weights_quant_info.at(5));
146 graph << get_dwsc_node(data_path, "Conv2d_7", 512U, PadStrideInfo(1U, 1U, 1U, 1U, 1U, 1U, DimensionRoundingType::FLOOR), PadStrideInfo(1U, 1U, 0U, 0U), depth_weights_quant_info.at(6),
147 point_weights_quant_info.at(6));
148 graph << get_dwsc_node(data_path, "Conv2d_8", 512U, PadStrideInfo(1U, 1U, 1U, 1U, 1U, 1U, DimensionRoundingType::FLOOR), PadStrideInfo(1U, 1U, 0U, 0U), depth_weights_quant_info.at(7),
149 point_weights_quant_info.at(7));
150 graph << get_dwsc_node(data_path, "Conv2d_9", 512U, PadStrideInfo(1U, 1U, 1U, 1U, 1U, 1U, DimensionRoundingType::FLOOR), PadStrideInfo(1U, 1U, 0U, 0U), depth_weights_quant_info.at(8),
151 point_weights_quant_info.at(8));
152 graph << get_dwsc_node(data_path, "Conv2d_10", 512U, PadStrideInfo(1U, 1U, 1U, 1U, 1U, 1U, DimensionRoundingType::FLOOR), PadStrideInfo(1U, 1U, 0U, 0U), depth_weights_quant_info.at(9),
153 point_weights_quant_info.at(9));
154 graph << get_dwsc_node(data_path, "Conv2d_11", 512U, PadStrideInfo(1U, 1U, 1U, 1U, 1U, 1U, DimensionRoundingType::FLOOR), PadStrideInfo(1U, 1U, 0U, 0U), depth_weights_quant_info.at(10),
155 point_weights_quant_info.at(10));
156 graph << get_dwsc_node(data_path, "Conv2d_12", 1024U, PadStrideInfo(2U, 2U, 0U, 1U, 0U, 1U, DimensionRoundingType::FLOOR), PadStrideInfo(1U, 1U, 0U, 0U), depth_weights_quant_info.at(11),
157 point_weights_quant_info.at(11));
158 graph << get_dwsc_node(data_path, "Conv2d_13", 1024U, PadStrideInfo(1U, 1U, 1U, 1U, 1U, 1U, DimensionRoundingType::FLOOR), PadStrideInfo(1U, 1U, 0U, 0U), depth_weights_quant_info.at(12),
Giorgio Arenaa66eaa22017-12-21 19:50:06 +0000159 point_weights_quant_info.at(12))
160 << PoolingLayer(PoolingLayerInfo(PoolingType::AVG))
161 << ConvolutionLayer(
162 1U, 1U, 1001U,
163 get_weights_accessor(data_path, "/cnn_data/mobilenet_qasymm8_model/Logits_Conv2d_1c_1x1_weights.npy"),
164 get_weights_accessor(data_path, "/cnn_data/mobilenet_qasymm8_model/Logits_Conv2d_1c_1x1_bias.npy"),
Giorgio Arenabb54e4e2018-04-05 17:20:34 +0100165 PadStrideInfo(1U, 1U, 0U, 0U), 1, conv_weights_quant_info.at(1))
Giorgio Arenaa66eaa22017-12-21 19:50:06 +0000166 << ReshapeLayer(TensorShape(1001U))
167 << SoftmaxLayer()
Giorgio Arenabb54e4e2018-04-05 17:20:34 +0100168 << OutputLayer(get_output_accessor(label, 5));
Gian Marcoc1b6e372018-02-21 18:03:26 +0000169
Giorgio Arenabb54e4e2018-04-05 17:20:34 +0100170 // Finalize graph
171 GraphConfig config;
Georgios Pinitas3d1489d2018-05-03 20:47:16 +0100172 config.use_tuner = (target == 2);
Giorgio Arenabb54e4e2018-04-05 17:20:34 +0100173 graph.finalize(target_hint, config);
Giorgio Arenaa66eaa22017-12-21 19:50:06 +0000174 }
175 void do_run() override
176 {
177 // Run graph
178 graph.run();
179 }
180
181private:
Giorgio Arenabb54e4e2018-04-05 17:20:34 +0100182 Stream graph{ 0, "MobileNetV1_QASYMM8" };
Giorgio Arenaa66eaa22017-12-21 19:50:06 +0000183
184 /** This function produces a depthwise separable convolution node (i.e. depthwise + pointwise layers) with ReLU6 activation after each layer.
185 *
186 * @param[in] data_path Path to trainable data folder
187 * @param[in] param_path Prefix of specific set of weights/biases data
188 * @param[in] conv_filt Filters depths for pointwise convolution
189 * @param[in] dwc_pad_stride_info PadStrideInfo for depthwise convolution
190 * @param[in] conv_pad_stride_info PadStrideInfo for pointwise convolution
191 * @param[in] depth_weights_quant_info QuantizationInfo for depthwise convolution's weights
192 * @param[in] point_weights_quant_info QuantizationInfo for pointwise convolution's weights
193 *
194 * @return The complete dwsc node
195 */
196 BranchLayer get_dwsc_node(const std::string &data_path, std::string &&param_path,
197 const unsigned int conv_filt,
198 PadStrideInfo dwc_pad_stride_info, PadStrideInfo conv_pad_stride_info,
199 QuantizationInfo depth_weights_quant_info, QuantizationInfo point_weights_quant_info)
200 {
201 std::string total_path = "/cnn_data/mobilenet_qasymm8_model/" + param_path + "_";
Giorgio Arenabb54e4e2018-04-05 17:20:34 +0100202 SubStream sg(graph);
Giorgio Arenaa66eaa22017-12-21 19:50:06 +0000203
204 sg << DepthwiseConvolutionLayer(
205 3U, 3U,
206 get_weights_accessor(data_path, total_path + "depthwise_weights.npy"),
207 get_weights_accessor(data_path, total_path + "depthwise_bias.npy"),
Giorgio Arenabb54e4e2018-04-05 17:20:34 +0100208 dwc_pad_stride_info, depth_weights_quant_info)
Giorgio Arenaa66eaa22017-12-21 19:50:06 +0000209 << ActivationLayer(ActivationLayerInfo(ActivationLayerInfo::ActivationFunction::LU_BOUNDED_RELU, 6.f))
210 << ConvolutionLayer(
211 1U, 1U, conv_filt,
212 get_weights_accessor(data_path, total_path + "pointwise_weights.npy"),
213 get_weights_accessor(data_path, total_path + "pointwise_bias.npy"),
Giorgio Arenabb54e4e2018-04-05 17:20:34 +0100214 conv_pad_stride_info, 1, point_weights_quant_info)
Giorgio Arenaa66eaa22017-12-21 19:50:06 +0000215 << ActivationLayer(ActivationLayerInfo(ActivationLayerInfo::ActivationFunction::LU_BOUNDED_RELU, 6.f));
216
217 return BranchLayer(std::move(sg));
218 }
219};
220/** Main program for MobileNetQASYMM8
221 *
222 * @param[in] argc Number of arguments
223 * @param[in] argv Arguments ( [optional] Path to the weights folder, [optional] npy_input, [optional] labels )
224 */
225int main(int argc, char **argv)
226{
Georgios Pinitasd9eb2752018-04-03 13:44:29 +0100227 return arm_compute::utils::run_example<GraphMobileNetQASYMM8Example>(argc, argv);
Giorgio Arenaa66eaa22017-12-21 19:50:06 +0000228}