// Source blob: 5645503ca36a86592c06e0644f0fb0b59aad8d05
//
// Copyright © 2017 Arm Ltd. All rights reserved.
// SPDX-License-Identifier: MIT
//
#pragma once

#include "armnn/INetwork.hpp"
#include "armnnTfLiteParser/ITfLiteParser.hpp"
#include "armnn/Types.hpp"

#include <schema_generated.h>

#include <cstddef>
#include <cstdint>
#include <functional>
#include <memory>
#include <string>
#include <unordered_map>
#include <utility>
#include <vector>

16namespace armnnTfLiteParser
17{
18
Kevin May7d96b162021-02-03 17:38:41 +000019class TfLiteParserImpl
telsoa01c577f2c2018-08-31 09:22:23 +010020{
21public:
22 // Shorthands for TfLite types
23 using ModelPtr = std::unique_ptr<tflite::ModelT>;
Derek Lambertiff05cc52019-04-26 13:05:17 +010024 using SubgraphPtr = std::unique_ptr<tflite::SubGraphT>;
telsoa01c577f2c2018-08-31 09:22:23 +010025 using OperatorPtr = std::unique_ptr<tflite::OperatorT>;
26 using OperatorCodePtr = std::unique_ptr<tflite::OperatorCodeT>;
27 using TensorPtr = std::unique_ptr<tflite::TensorT>;
28 using TensorRawPtr = const tflite::TensorT *;
29 using TensorRawPtrVector = std::vector<TensorRawPtr>;
30 using TensorIdRawPtr = std::pair<size_t, TensorRawPtr>;
31 using TensorIdRawPtrVector = std::vector<TensorIdRawPtr>;
32 using BufferPtr = std::unique_ptr<tflite::BufferT>;
33 using BufferRawPtr = const tflite::BufferT *;
34
35public:
36 /// Create the network from a flatbuffers binary file on disk
Kevin May7d96b162021-02-03 17:38:41 +000037 armnn::INetworkPtr CreateNetworkFromBinaryFile(const char* graphFile);
telsoa01c577f2c2018-08-31 09:22:23 +010038
39 /// Create the network from a flatbuffers binary
Kevin May7d96b162021-02-03 17:38:41 +000040 armnn::INetworkPtr CreateNetworkFromBinary(const std::vector<uint8_t> & binaryContent);
telsoa01c577f2c2018-08-31 09:22:23 +010041
42
43 /// Retrieve binding info (layer id and tensor info) for the network input identified by
44 /// the given layer name and subgraph id
Kevin May7d96b162021-02-03 17:38:41 +000045 BindingPointInfo GetNetworkInputBindingInfo(size_t subgraphId,
46 const std::string& name) const;
telsoa01c577f2c2018-08-31 09:22:23 +010047
48 /// Retrieve binding info (layer id and tensor info) for the network output identified by
49 /// the given layer name and subgraph id
Kevin May7d96b162021-02-03 17:38:41 +000050 BindingPointInfo GetNetworkOutputBindingInfo(size_t subgraphId,
51 const std::string& name) const;
telsoa01c577f2c2018-08-31 09:22:23 +010052
53 /// Return the number of subgraphs in the parsed model
Kevin May7d96b162021-02-03 17:38:41 +000054 size_t GetSubgraphCount() const;
telsoa01c577f2c2018-08-31 09:22:23 +010055
56 /// Return the input tensor names for a given subgraph
Kevin May7d96b162021-02-03 17:38:41 +000057 std::vector<std::string> GetSubgraphInputTensorNames(size_t subgraphId) const;
telsoa01c577f2c2018-08-31 09:22:23 +010058
59 /// Return the output tensor names for a given subgraph
Kevin May7d96b162021-02-03 17:38:41 +000060 std::vector<std::string> GetSubgraphOutputTensorNames(size_t subgraphId) const;
telsoa01c577f2c2018-08-31 09:22:23 +010061
Kevin May7d96b162021-02-03 17:38:41 +000062 TfLiteParserImpl(const armnn::Optional<ITfLiteParser::TfLiteParserOptions>& options = armnn::EmptyOptional());
63 ~TfLiteParserImpl() = default;
telsoa01c577f2c2018-08-31 09:22:23 +010064
65public:
66 // testable helpers
Finn Williamsb49ed182021-06-29 15:50:08 +010067 armnn::INetworkPtr CreateNetworkFromBinaryAsDynamic(const std::vector<uint8_t>& binaryContent);
68
69 armnn::INetworkPtr LoadModel(std::unique_ptr<tflite::ModelT> model);
70
Teresa Charlin3ab85482021-06-08 16:59:29 +010071 static ModelPtr LoadModelFromFile(const char* fileName);
72 static ModelPtr LoadModelFromBinary(const uint8_t* binaryContent, size_t len);
73 static TensorRawPtrVector GetInputs(const ModelPtr& model, size_t subgraphIndex, size_t operatorIndex);
74 static TensorRawPtrVector GetOutputs(const ModelPtr& model, size_t subgraphIndex, size_t operatorIndex);
75 static TensorIdRawPtrVector GetSubgraphInputs(const ModelPtr& model, size_t subgraphIndex);
76 static TensorIdRawPtrVector GetSubgraphOutputs(const ModelPtr& model, size_t subgraphIndex);
telsoa01c577f2c2018-08-31 09:22:23 +010077 static std::vector<int32_t>& GetInputTensorIds(const ModelPtr& model, size_t subgraphIndex, size_t operatorIndex);
78 static std::vector<int32_t>& GetOutputTensorIds(const ModelPtr& model, size_t subgraphIndex, size_t operatorIndex);
79
80 static BufferRawPtr GetBuffer(const ModelPtr& model, size_t bufferIndex);
Teresa Charlin3ab85482021-06-08 16:59:29 +010081 static armnn::TensorInfo OutputShapeOfSqueeze(std::vector<uint32_t> squeezeDims,
82 const armnn::TensorInfo& inputTensorInfo);
83 static armnn::TensorInfo OutputShapeOfReshape(const armnn::TensorInfo& inputTensorInfo,
84 const std::vector<int32_t>& targetDimsIn);
telsoa01c577f2c2018-08-31 09:22:23 +010085
Matthew Sloyanac001ee2021-02-03 10:43:04 +000086 /// Retrieve version in X.Y.Z form
87 static const std::string GetVersion();
88
telsoa01c577f2c2018-08-31 09:22:23 +010089private:
Finn Williamsd4fa5452021-03-01 12:31:41 +000090
telsoa01c577f2c2018-08-31 09:22:23 +010091 // No copying allowed until it is wanted and properly implemented
Kevin May7d96b162021-02-03 17:38:41 +000092 TfLiteParserImpl(const TfLiteParserImpl &) = delete;
93 TfLiteParserImpl & operator=(const TfLiteParserImpl &) = delete;
telsoa01c577f2c2018-08-31 09:22:23 +010094
95 /// Create the network from an already loaded flatbuffers model
96 armnn::INetworkPtr CreateNetworkFromModel();
97
98 // signature for the parser functions
Kevin May7d96b162021-02-03 17:38:41 +000099 using OperatorParsingFunction = void(TfLiteParserImpl::*)(size_t subgraphIndex, size_t operatorIndex);
telsoa01c577f2c2018-08-31 09:22:23 +0100100
Aron Virginas-Tarc975f922019-10-23 17:38:17 +0100101 void ParseCustomOperator(size_t subgraphIndex, size_t operatorIndex);
telsoa01c577f2c2018-08-31 09:22:23 +0100102 void ParseUnsupportedOperator(size_t subgraphIndex, size_t operatorIndex);
Aron Virginas-Tarc975f922019-10-23 17:38:17 +0100103
Matthew Sloyaned7fce42021-04-15 20:46:24 +0100104 void ParseAbs(size_t subgraphIndex, size_t operatorIndex);
Finn Williamsc42c3842019-01-22 14:18:11 +0000105 void ParseActivation(size_t subgraphIndex, size_t operatorIndex, armnn::ActivationFunction activationType);
Nina Drozd200e3802019-04-15 09:47:39 +0100106 void ParseAdd(size_t subgraphIndex, size_t operatorIndex);
Matthew Sloyan28f177c2021-04-09 14:38:52 +0100107 void ParseArgMinMax(size_t subgraphIndex, size_t operatorIndex, armnn::ArgMinMaxFunction argMinMaxFunction);
108 void ParseArgMin(size_t subgraphIndex, size_t operatorIndex);
109 void ParseArgMax(size_t subgraphIndex, size_t operatorIndex);
telsoa01c577f2c2018-08-31 09:22:23 +0100110 void ParseAveragePool2D(size_t subgraphIndex, size_t operatorIndex);
Bruno Goncalvesdb947e22019-02-08 18:52:21 -0200111 void ParseBatchToSpaceND(size_t subgraphIndex, size_t operatorIndex);
mathad01b392e982021-04-07 12:07:30 +0100112 void ParseCast(size_t subgraphIndex, size_t operatorIndex);
Bruno Goncalves2d0eb862021-07-11 14:10:15 -0300113 void ParseComparison(size_t subgraphIndex, size_t operatorIndex, armnn::ComparisonOperation comparisonOperation);
Sadik Armagan479045b2018-10-01 11:51:37 +0100114 void ParseConcatenation(size_t subgraphIndex, size_t operatorIndex);
telsoa01c577f2c2018-08-31 09:22:23 +0100115 void ParseConv2D(size_t subgraphIndex, size_t operatorIndex);
Sadik Armagan26868492021-01-22 14:25:31 +0000116 void ParseDepthToSpace(size_t subgraphIndex, size_t operatorIndex);
telsoa01c577f2c2018-08-31 09:22:23 +0100117 void ParseDepthwiseConv2D(size_t subgraphIndex, size_t operatorIndex);
Finn Williamsed66d142019-12-06 09:55:55 +0000118 void ParseDequantize(size_t subgraphIndex, size_t operatorIndex);
keidav011b3e2ea2019-02-21 10:07:37 +0000119 void ParseDetectionPostProcess(size_t subgraphIndex, size_t operatorIndex);
Matthew Sloyan28f177c2021-04-09 14:38:52 +0100120 void ParseDiv(size_t subgraphIndex, size_t operatorIndex);
Matthew Sloyaned7fce42021-04-15 20:46:24 +0100121 void ParseElementwiseUnary(size_t subgraphIndex, size_t operatorIndex, armnn::UnaryOperation unaryOperation);
Matthew Sloyan7515d072020-12-16 12:50:01 +0000122 void ParseElu(size_t subgraphIndex, size_t operatorIndex);
Bruno Goncalves2d0eb862021-07-11 14:10:15 -0300123 void ParseEqual(size_t subgraphIndex, size_t operatorIndex);
Derek Lambertif0176992020-04-28 13:37:49 +0100124 void ParseExp(size_t subgraphIndex, size_t operatorIndex);
Teresa Charlin3ab85482021-06-08 16:59:29 +0100125 void ParseExpandDims(size_t subgraphIndex, size_t operatorIndex);
Sadik Armagan8853c1f2018-10-22 09:04:18 +0100126 void ParseFullyConnected(size_t subgraphIndex, size_t operatorIndex);
Sadik Armagan26868492021-01-22 14:25:31 +0000127 void ParseGather(size_t subgraphIndex, size_t operatorIndex);
Bruno Goncalves2d0eb862021-07-11 14:10:15 -0300128 void ParseGreater(size_t subgraphIndex, size_t operatorIndex);
129 void ParseGreaterOrEqual(size_t subgraphIndex, size_t operatorIndex);
Jan Eilers2f746b32020-07-28 14:00:06 +0100130 void ParseHardSwish(size_t subgraphIndex, size_t operatorIndex);
Sadik Armagan12239e72020-05-27 11:06:17 +0100131 void ParseLeakyRelu(size_t subgraphIndex, size_t operatorIndex);
Bruno Goncalves2d0eb862021-07-11 14:10:15 -0300132 void ParseLess(size_t subgraphIndex, size_t operatorIndex);
133 void ParseLessOrEqual(size_t subgraphIndex, size_t operatorIndex);
Mike Kelly31dce2b2021-09-01 21:22:37 +0100134 void ParseLocalResponseNormalization(size_t subgraphIndex, size_t operatorIndex);
Matthew Sloyaned7fce42021-04-15 20:46:24 +0100135 void ParseLogicalNot(size_t subgraphIndex, size_t operatorIndex);
Finn Williamsc42c3842019-01-22 14:18:11 +0000136 void ParseLogistic(size_t subgraphIndex, size_t operatorIndex);
Matthew Jackson28c94572019-07-18 10:47:03 +0100137 void ParseL2Normalization(size_t subgraphIndex, size_t operatorIndex);
Nattapat Chaimanowongb66504b2018-10-17 15:19:14 +0100138 void ParseMaxPool2D(size_t subgraphIndex, size_t operatorIndex);
Bruno Goncalvesb8d805e2019-02-12 22:57:13 -0200139 void ParseMaximum(size_t subgraphIndex, size_t operatorIndex);
Nina Drozd200e3802019-04-15 09:47:39 +0100140 void ParseMean(size_t subgraphIndex, size_t operatorIndex);
Bruno Goncalves8f6d7a72019-02-12 22:58:18 -0200141 void ParseMinimum(size_t subgraphIndex, size_t operatorIndex);
Nina Drozd200e3802019-04-15 09:47:39 +0100142 void ParseMul(size_t subgraphIndex, size_t operatorIndex);
Darshan Patel83fcf982020-05-26 22:22:42 +0530143 void ParseNeg(size_t subgraphIndex, size_t operatorIndex);
Bruno Goncalves2d0eb862021-07-11 14:10:15 -0300144 void ParseNotEqual(size_t subgraphIndex, size_t operatorIndex);
Matthew Jacksonbcca1f42019-07-16 11:39:21 +0100145 void ParsePack(size_t subgraphIndex, size_t operatorIndex);
Nina Drozd200e3802019-04-15 09:47:39 +0100146 void ParsePad(size_t subgraphIndex, size_t operatorIndex);
147 void ParsePool(size_t subgraphIndex, size_t operatorIndex, armnn::PoolingAlgorithm algorithm);
Narumol Prangnawaratbfaee6b2021-05-24 18:50:24 +0100148 void ParsePrelu(size_t subgraphIndex, size_t operatorIndex);
Sadik Armagan66dedc72019-12-10 16:32:07 +0000149 void ParseQuantize(size_t subgraphIndex, size_t operatorIndex);
Sadik Armagana2747482021-02-09 10:28:54 +0000150 void ParseReduce(size_t subgraphIndex, size_t operatorIndex, armnn::ReduceOperation reduceOperation);
151 void ParseReduceMax(size_t subgraphIndex, size_t operatorIndex);
152 void ParseReduceMin(size_t subgraphIndex, size_t operatorIndex);
Teresa Charlin4e3e8312021-08-05 12:34:37 +0100153 void ParseReduceProd(size_t subgraphIndex, size_t operatorIndex);
Sadik Armagan58f39192018-09-17 14:14:39 +0100154 void ParseRelu(size_t subgraphIndex, size_t operatorIndex);
155 void ParseRelu6(size_t subgraphIndex, size_t operatorIndex);
Sadikb94967b2018-09-19 15:30:00 +0100156 void ParseReshape(size_t subgraphIndex, size_t operatorIndex);
Sadik Armagana3b31f02019-12-05 09:08:53 +0000157 void ParseResize(size_t subgraphIndex, size_t operatorIndex, armnn::ResizeMethod resizeMethod);
Bruno Goncalves3f58ddb2019-02-07 18:40:11 -0200158 void ParseResizeBilinear(size_t subgraphIndex, size_t operatorIndex);
Sadik Armagana3b31f02019-12-05 09:08:53 +0000159 void ParseResizeNearestNeighbor(size_t subgraphIndex, size_t operatorIndex);
Matthew Sloyaned7fce42021-04-15 20:46:24 +0100160 void ParseRsqrt(size_t subgraphIndex, size_t operatorIndex);
Keith Davis0176fd82021-06-01 17:36:32 +0100161 void ParseShape(size_t subgraphIndex, size_t operatorIndex);
josh minorba424d22019-11-13 10:55:17 -0600162 void ParseSlice(size_t subgraphIndex, size_t operatorIndex);
Sadik Armagan479045b2018-10-01 11:51:37 +0100163 void ParseSoftmax(size_t subgraphIndex, size_t operatorIndex);
Bruno Goncalvesbaded142019-02-08 19:02:48 -0200164 void ParseSpaceToBatchND(size_t subgraphIndex, size_t operatorIndex);
Nina Drozd200e3802019-04-15 09:47:39 +0100165 void ParseSplit(size_t subgraphIndex, size_t operatorIndex);
Derek Lambertif0176992020-04-28 13:37:49 +0100166 void ParseSplitV(size_t subgraphIndex, size_t operatorIndex);
Sadik Armagan479045b2018-10-01 11:51:37 +0100167 void ParseSqueeze(size_t subgraphIndex, size_t operatorIndex);
Bruno Goncalves451d95b2019-02-12 22:59:22 -0200168 void ParseStridedSlice(size_t subgraphIndex, size_t operatorIndex);
Bruno Goncalvesbbeae262019-02-07 18:37:39 -0200169 void ParseSub(size_t subgraphIndex, size_t operatorIndex);
Sadik Armagan0c3ea5b2021-02-03 09:29:30 +0000170 void ParseSum(size_t subgraphIndex, size_t operatorIndex);
Nina Drozd99851762019-04-09 09:37:38 +0100171 void ParseTanH(size_t subgraphIndex, size_t operatorIndex);
Keith Davis4cd29a02019-09-09 14:49:20 +0100172 void ParseTranspose(size_t subgraphIndex, size_t operatorIndex);
Matthew Jackson74bf7da2019-08-16 16:51:42 +0100173 void ParseTransposeConv(size_t subgraphIndex, size_t operatorIndex);
Nina Drozd200e3802019-04-15 09:47:39 +0100174 void ParseUnpack(size_t subgraphIndex, size_t operatorIndex);
Nattapat Chaimanowongb66504b2018-10-17 15:19:14 +0100175
telsoa01c577f2c2018-08-31 09:22:23 +0100176 void RegisterProducerOfTensor(size_t subgraphIndex, size_t tensorIndex, armnn::IOutputSlot* slot);
177 void RegisterConsumerOfTensor(size_t subgraphIndex, size_t tensorIndex, armnn::IInputSlot* slot);
178 void RegisterInputSlots(size_t subgraphIndex,
179 size_t operatorIndex,
180 armnn::IConnectableLayer* layer,
Finn Williamsd4fa5452021-03-01 12:31:41 +0000181 const std::vector<unsigned int>& tensorIndexes,
182 unsigned int startingSlotIndex = 0);
telsoa01c577f2c2018-08-31 09:22:23 +0100183 void RegisterOutputSlots(size_t subgraphIndex,
184 size_t operatorIndex,
185 armnn::IConnectableLayer* layer,
186 const std::vector<unsigned int>& tensorIndexes);
187
188 void SetupInputLayers(size_t subgraphIndex);
189 void SetupOutputLayers(size_t subgraphIndex);
Bruno Goncalves3d7efe92018-12-27 14:21:43 -0200190 void SetupConstantLayers(size_t subgraphIndex);
telsoa01c577f2c2018-08-31 09:22:23 +0100191
192 void ResetParser();
193
Bruno Goncalves9c761a62018-12-27 14:20:35 -0200194 void AddBroadcastReshapeLayer(size_t subgraphIndex,
195 size_t operatorIndex,
196 armnn::IConnectableLayer* layer);
197
telsoa01c577f2c2018-08-31 09:22:23 +0100198 /// Attach an activation layer to the one passed as a parameter
Sadik Armagan58f39192018-09-17 14:14:39 +0100199 armnn::IConnectableLayer* AddFusedActivationLayer(armnn::IConnectableLayer* layer,
200 unsigned int outputSlot,
201 tflite::ActivationFunctionType activationType);
telsoa01c577f2c2018-08-31 09:22:23 +0100202
203 // SupportedDataStorage's purpose is to hold data till we pass over to the network.
204 // We don't care about the content, and we want a single datatype to simplify the code.
205 struct SupportedDataStorage
206 {
Matteo Martincigh747ef822018-12-18 09:26:39 +0000207 public:
208 // Convenience constructors
209 SupportedDataStorage(std::unique_ptr<float[]>&& data);
210 SupportedDataStorage(std::unique_ptr<uint8_t[]>&& data);
Keith Davisd305e1a2020-01-22 11:57:54 +0000211 SupportedDataStorage(std::unique_ptr<int8_t[]>&& data);
Matteo Martincigh747ef822018-12-18 09:26:39 +0000212 SupportedDataStorage(std::unique_ptr<int32_t[]>&& data);
telsoa01c577f2c2018-08-31 09:22:23 +0100213
Matteo Martincigh747ef822018-12-18 09:26:39 +0000214 private:
215 // Pointers to the data buffers
216 std::unique_ptr<float[]> m_FloatData;
217 std::unique_ptr<uint8_t[]> m_Uint8Data;
Keith Davisd305e1a2020-01-22 11:57:54 +0000218 std::unique_ptr<int8_t[]> m_Int8Data;
Matteo Martincigh747ef822018-12-18 09:26:39 +0000219 std::unique_ptr<int32_t[]> m_Int32Data;
telsoa01c577f2c2018-08-31 09:22:23 +0100220 };
221
Finn Williamsd4fa5452021-03-01 12:31:41 +0000222 bool IsConstTensor(TensorRawPtr tensorPtr);
223 armnn::ConstTensor CreateConstTensorNonPermuted(TensorRawPtr tensorPtr,
224 armnn::TensorInfo& tensorInfo);
225 std::pair<armnn::ConstTensor, SupportedDataStorage>
226 CreateConstTensorPermuted(TensorRawPtr tensorPtr,
227 armnn::TensorInfo& tensorInfo,
228 armnn::Optional<armnn::PermutationVector&> permutationVector);
Matteo Martincigh747ef822018-12-18 09:26:39 +0000229
230 template<typename T>
Kevin May7d96b162021-02-03 17:38:41 +0000231 std::pair<armnn::ConstTensor, TfLiteParserImpl::SupportedDataStorage>
232 CreateConstTensorAndStoreData(TfLiteParserImpl::BufferRawPtr bufferPtr,
233 TfLiteParserImpl::TensorRawPtr tensorPtr,
Matteo Martincigh747ef822018-12-18 09:26:39 +0000234 armnn::TensorInfo& tensorInfo,
235 armnn::Optional<armnn::PermutationVector&> permutationVector);
236
Aron Virginas-Tarc975f922019-10-23 17:38:17 +0100237 // Settings for configuring the TfLiteParser
238 armnn::Optional<ITfLiteParser::TfLiteParserOptions> m_Options;
239
telsoa01c577f2c2018-08-31 09:22:23 +0100240 /// The network we're building. Gets cleared after it is passed to the user
241 armnn::INetworkPtr m_Network;
telsoa01c577f2c2018-08-31 09:22:23 +0100242 ModelPtr m_Model;
243
Aron Virginas-Tarc975f922019-10-23 17:38:17 +0100244 std::vector<OperatorParsingFunction> m_ParserFunctions;
245 std::unordered_map<std::string, OperatorParsingFunction> m_CustomParserFunctions;
246
telsoa01c577f2c2018-08-31 09:22:23 +0100247 /// A mapping of an output slot to each of the input slots it should be connected to
248 /// The outputSlot is from the layer that creates this tensor as one of its ouputs
249 /// The inputSlots are from the layers that use this tensor as one of their inputs
250 struct TensorSlots
251 {
252 armnn::IOutputSlot* outputSlot;
253 std::vector<armnn::IInputSlot*> inputSlots;
254
255 TensorSlots() : outputSlot(nullptr) { }
256 };
257 typedef std::vector<TensorSlots> TensorConnections;
258 /// Connections for tensors in each subgraph
259 /// The first index is the subgraph ID, the second index is the tensor ID
260 std::vector<TensorConnections> m_SubgraphConnections;
Narumol Prangnawarat4628d052019-02-25 17:26:05 +0000261
262 /// This is used in case that the model does not speciry the output.
263 /// The shape can be calculated from the options.
264 std::vector<std::vector<unsigned int>> m_OverridenOutputShapes;
telsoa01c577f2c2018-08-31 09:22:23 +0100265};
266
267}