//
// Copyright © 2017-2024 Arm Ltd and Contributors. All rights reserved.
// SPDX-License-Identifier: MIT
//
#include "TfLiteParser.hpp"
#include "armnnTfLiteParser/Version.hpp"
#include "armnn/LstmParams.hpp"
#include <armnn/BackendOptions.hpp>
#include <armnn/Descriptors.hpp>
#include <armnn/Exceptions.hpp>
#include <armnn/Logging.hpp>
#include <armnn/Tensor.hpp>
#include <armnnUtils/TensorUtils.hpp>
#include <armnn/TypesUtils.hpp>
#include <armnn/utility/Assert.hpp>
#include <armnn/utility/IgnoreUnused.hpp>
#include <armnn/utility/NumericCast.hpp>
// armnnUtils:
#include <armnnUtils/Permute.hpp>
#include <armnnUtils/Filesystem.hpp>
#include <ParserHelper.hpp>
#include <VerificationHelpers.hpp>
// The generated code based on the Tf Lite schema:
#include <schema_generated.h>
#include <flatbuffers/flexbuffers.h>
#include <fmt/format.h>
#include <algorithm>
#include <iostream>
#include <limits>
#include <numeric>
#define ARMNN_THROW_PARSE_EXCEPTION(msg) \
{ \
throw armnn::ParseException( static_cast<const std::stringstream&>( std::stringstream() << msg \
<< ": " \
<< CHECK_LOCATION().AsString()).str()); \
}
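// Example usage (hypothetical message): ARMNN_THROW_PARSE_EXCEPTION("Unsupported tensor type " << typeName);
// The streamed message is suffixed with the file/line information from CHECK_LOCATION().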
using namespace armnn;
using armnn::CheckLocation;
namespace armnnTfLiteParser
{
ITfLiteParser::ITfLiteParser(const armnn::Optional<TfLiteParserOptions>& options) :
pTfLiteParserImpl(new TfLiteParserImpl(options)) {}
ITfLiteParser::~ITfLiteParser() = default;
ITfLiteParser* ITfLiteParser::CreateRaw(const armnn::Optional<TfLiteParserOptions>& options)
{
return new ITfLiteParser(options);
}
ITfLiteParserPtr ITfLiteParser::Create(const armnn::Optional<TfLiteParserOptions>& options)
{
return ITfLiteParserPtr(CreateRaw(options), &ITfLiteParser::Destroy);
}
void ITfLiteParser::Destroy(ITfLiteParser* parser)
{
delete parser;
}
armnn::INetworkPtr ITfLiteParser::CreateNetworkFromBinaryFile(const char* graphFile)
{
return pTfLiteParserImpl->CreateNetworkFromBinaryFile(graphFile);
}
armnn::INetworkPtr ITfLiteParser::CreateNetworkFromBinary(const std::vector<uint8_t>& binaryContent)
{
return pTfLiteParserImpl->CreateNetworkFromBinary(binaryContent);
}
BindingPointInfo ITfLiteParser::GetNetworkInputBindingInfo(size_t subgraphId,
const std::string& name) const
{
return pTfLiteParserImpl->GetNetworkInputBindingInfo(subgraphId, name);
}
BindingPointInfo ITfLiteParser::GetNetworkOutputBindingInfo(size_t subgraphId,
const std::string& name) const
{
return pTfLiteParserImpl->GetNetworkOutputBindingInfo(subgraphId, name);
}
size_t ITfLiteParser::GetSubgraphCount() const
{
return pTfLiteParserImpl->GetSubgraphCount();
}
std::vector<std::string> ITfLiteParser::GetSubgraphInputTensorNames(size_t subgraphId) const
{
return pTfLiteParserImpl->GetSubgraphInputTensorNames(subgraphId);
}
std::vector<std::string> ITfLiteParser::GetSubgraphOutputTensorNames(size_t subgraphId) const
{
return pTfLiteParserImpl->GetSubgraphOutputTensorNames(subgraphId);
}
namespace
{
const uint32_t VIRTUAL_OPERATOR_ID = std::numeric_limits<uint32_t>::max();
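// Sentinel operator index used when a check is not tied to a concrete operator;
// CheckModel() below skips the operator bounds check when it sees this value.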
void CheckSubgraph(const TfLiteParserImpl::ModelPtr& model,
size_t subgraphIndex,
const CheckLocation& location)
{
if (model.get() == nullptr)
{
throw ParseException(
fmt::format("{} was called with invalid (null) model. "
"Possible reason is that the model is not yet loaded and Unpack(ed). "
"subgraph:{} at {}",
location.m_Function,
subgraphIndex,
location.FileLine()));
}
else if (subgraphIndex >= model->subgraphs.size())
{
throw ParseException(
fmt::format("{} was called with an invalid subgraph index. "
"subgraph:{} at {}",
location.m_Function,
subgraphIndex,
location.FileLine()));
}
}
#define CHECK_SUBGRAPH(MODEL, SUBGRAPH_INDEX) \
CheckSubgraph(MODEL, SUBGRAPH_INDEX, CHECK_LOCATION())
void CheckModel(const TfLiteParserImpl::ModelPtr& model,
size_t subgraphIndex,
size_t operatorIndex,
const CheckLocation& location)
{
if (model.get() == nullptr)
{
throw ParseException(
fmt::format("{} was called with invalid (null) model. "
"Possible reason is that the model is not yet loaded and Unpack(ed). "
"subgraph:{} operator:{} at {}",
location.m_Function,
subgraphIndex,
operatorIndex,
location.FileLine()));
}
else if (subgraphIndex >= model->subgraphs.size())
{
throw ParseException(
fmt::format("{} was called with an invalid subgraph index. "
"subgraph:{} operator:{} at {}",
location.m_Function,
subgraphIndex,
operatorIndex,
location.FileLine()));
}
else if (operatorIndex >= model->subgraphs[subgraphIndex]->operators.size() &&
operatorIndex != VIRTUAL_OPERATOR_ID)
{
throw ParseException(
fmt::format("{} was called with an invalid operator index. "
"subgraph:{} operator:{} at {}",
location.m_Function,
subgraphIndex,
operatorIndex,
location.FileLine()));
}
}
#define CHECK_MODEL(MODEL, SUBGRAPH_INDEX, OPERATOR_INDEX) \
CheckModel(MODEL, SUBGRAPH_INDEX, OPERATOR_INDEX, CHECK_LOCATION())
void CheckTensor(const TfLiteParserImpl::ModelPtr& model,
size_t subgraphIndex,
size_t tensorIndex,
const CheckLocation& location)
{
// the tensor index is the only one to check here
if (tensorIndex >= model->subgraphs[subgraphIndex]->tensors.size())
{
throw ParseException(
fmt::format("{} was called with an invalid tensor index. "
"subgraph:{} tensor:{} at {}",
location.m_Function,
subgraphIndex,
tensorIndex,
location.FileLine()));
}
}
#define CHECK_TENSOR(MODEL, SUBGRAPH_INDEX, TENSOR_INDEX) \
CheckTensor(MODEL, SUBGRAPH_INDEX, TENSOR_INDEX, CHECK_LOCATION())
void CheckTensorPtr(TfLiteParserImpl::TensorRawPtr rawPtr,
const CheckLocation& location)
{
if (rawPtr == nullptr)
{
throw ParseException(
fmt::format("{} was called with a null tensor pointer at {}", location.m_Function, location.FileLine()));
}
}
#define CHECK_TENSOR_PTR(TENSOR_PTR) \
CheckTensorPtr(TENSOR_PTR, CHECK_LOCATION())
void CheckBuffer(const TfLiteParserImpl::ModelPtr& model,
size_t bufferIndex,
const CheckLocation& location)
{
if (model.get() == nullptr)
{
throw ParseException(
fmt::format("{} was called with invalid (null) model. "
"Possible reason is that the model is not yet loaded and Unpack(ed). "
"buffer:{} at {}",
location.m_Function,
bufferIndex,
location.FileLine()));
}
else if (bufferIndex >= model->buffers.size())
{
throw ParseException(
fmt::format("{} was called with an invalid buffer index. "
"buffer index:{} at {}",
location.m_Function,
bufferIndex,
location.FileLine()));
}
else if (model->buffers[bufferIndex].get() == nullptr)
{
throw ParseException(
fmt::format("The buffer #{} is null. {}",
bufferIndex,
location.AsString()));
}
}
#define CHECK_BUFFER(MODEL, BUFFER_INDEX) \
CheckBuffer(MODEL, BUFFER_INDEX, CHECK_LOCATION())
void CheckBufferSize(TfLiteParserImpl::BufferRawPtr bufferPtr,
const armnn::TensorInfo& tensorInfo,
uint32_t bufferId,
const CheckLocation& location)
{
if (bufferPtr == nullptr)
{
throw ParseException(
fmt::format("BufferPtr is null for buffer:{}. {}",
bufferId,
location.AsString()));
}
else if(tensorInfo.GetNumElements() > bufferPtr->data.size() ||
tensorInfo.GetNumBytes() > bufferPtr->data.size())
{
std::stringstream ss;
ss << "Buffer #" << bufferId << " has " << bufferPtr->data.size() << " bytes. "
<< "For tensor: " << tensorInfo.GetShape()
<< " expecting: " << tensorInfo.GetNumBytes() << " bytes and "
<< tensorInfo.GetNumElements() << " elements. " << location.AsString();
throw ParseException(ss.str());
}
}
tflite::BuiltinOperator GetOpCode(const TfLiteParserImpl::ModelPtr& model, size_t subgraphIndex, size_t operatorIndex)
{
const auto& operatorPtr = model->subgraphs[subgraphIndex]->operators[operatorIndex];
auto opcodeIndex = operatorPtr->opcode_index;
// Work around the deprecated_builtin_code field introduced in 2.4 in a backwards-compatible manner
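// In the newer schema builtin_code is a 32-bit field while deprecated_builtin_code is an 8-bit value capped
// at 127, so taking the larger of the two yields the real opcode for both old and new model files.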
#if defined(ARMNN_POST_TFLITE_2_3)
auto opcode = std::max(model->operator_codes[opcodeIndex]->builtin_code,
static_cast<tflite::BuiltinOperator>(model->operator_codes[opcodeIndex]->deprecated_builtin_code));
#else
auto opcode = model->operator_codes[opcodeIndex]->builtin_code;
#endif
return opcode;
}
std::vector<unsigned int> GetUIntBuffer(armnn::TensorInfo info,
const TfLiteParserImpl::ModelPtr& model,
size_t bufferIndex)
{
TfLiteParserImpl::BufferRawPtr bufferPtr = TfLiteParserImpl::GetBuffer(model, bufferIndex);
std::vector<unsigned int> buffer(info.GetNumElements());
if (info.GetDataType() == DataType::Signed32)
{
::memcpy(buffer.data(), bufferPtr->data.data(), bufferPtr->data.size());
}
else if (info.GetDataType() == DataType::Signed64)
{
std::vector<uint64_t> uint64Buffer(info.GetNumElements());
::memcpy(uint64Buffer.data(), bufferPtr->data.data(), bufferPtr->data.size());
buffer.assign(std::begin(uint64Buffer), std::end(uint64Buffer));
}
else
{
CheckLocation location = CHECK_LOCATION();
throw ParseException(
fmt::format("Unsupported data type for uint buffer {}, only Signed 32 or Signed 64 are supported. {}",
GetDataTypeName(info.GetDataType()),
location.AsString()));
}
return buffer;
}
#define CHECK_BUFFER_SIZE(BUFFER_PTR, TENSOR_INFO, BUFFER_ID) \
CheckBufferSize(BUFFER_PTR, TENSOR_INFO, BUFFER_ID, CHECK_LOCATION())
bool IsActivationSupported(tflite::ActivationFunctionType activationType)
{
switch(activationType)
{
case tflite::ActivationFunctionType_NONE:
case tflite::ActivationFunctionType_RELU:
case tflite::ActivationFunctionType_RELU6:
case tflite::ActivationFunctionType_TANH:
{
return true;
}
default:
{
return false;
}
}
}
#define CHECK_SUPPORTED_FUSED_ACTIVATION(OPTION, SUBGRAPH_INDEX, OPERATOR_INDEX) \
do { \
if (IsActivationSupported(OPTION->fused_activation_function) == false) \
{ \
throw ParseException( \
fmt::format("TfLite parser doesn't support fused activation: " \
"{}/{} in {} subgraph:{} operator:{} at {}", \
OPTION->fused_activation_function, \
tflite::EnumNameActivationFunctionType(\
OPTION->fused_activation_function), \
__func__, \
SUBGRAPH_INDEX, \
OPERATOR_INDEX, \
CHECK_LOCATION().FileLine())); \
} \
} while(false)
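// Note: a supported fused activation is not kept fused; it is later materialised as a separate ArmNN
// activation layer via AddFusedActivationLayer() appended after the layer that carried it.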
std::vector<unsigned int> AsUnsignedVector(const std::vector<int32_t>& in)
{
std::vector<unsigned int> result;
result.reserve(in.size());
for (auto& i : in)
{
// If the location of the input data is -1 then the input should be ignored.
if (i == -1)
{
continue;
}
result.push_back(CHECKED_NON_NEGATIVE(i));
}
return result;
}
bool IsOptionalOperandPresent(int input)
{
return (input >= 0);
}
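// Computes the front/back padding implied by TfLite SAME padding.
// Worked example (stride 2, no dilation): inputSize=5, filterSize=3 ->
// outputSize=(5+2-1)/2=3, dilatedSize=3, temp=(3-1)*2+3=7 > 5,
// so paddingFront=(7-5)/2=1 and paddingBack=(7-5)-1=1.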
void CalcPadding(uint32_t inputSize,
uint32_t filterSize,
uint32_t stride,
uint32_t dilation,
uint32_t& paddingFront,
uint32_t& paddingBack,
tflite::Padding padding)
{
paddingFront = 0;
paddingBack = 0;
if (padding == tflite::Padding_SAME)
{
uint32_t outputSize = (inputSize + stride - 1) / stride;
uint32_t dilatedSize = filterSize + (dilation - 1) * (filterSize - 1);
uint32_t temp = (outputSize - 1) * stride + dilatedSize;
if (temp > inputSize)
{
paddingFront = (temp - inputSize) / 2;
paddingBack = (temp - inputSize) - paddingFront;
}
}
}
// Overload that calculates explicit padding when the output shape is known.
// At the moment the output shape is only supplied as an input parameter for Transpose Convolution,
// not for Convolution or Depthwise Convolution.
void CalcPadding(uint32_t inputSize,
uint32_t filterSize,
uint32_t stride,
uint32_t dilation,
uint32_t& paddingFront,
uint32_t& paddingBack,
tflite::Padding padding,
uint32_t outputSize)
{
IgnoreUnused(dilation);
paddingFront = 0;
paddingBack = 0;
if (padding == tflite::Padding_SAME)
{
uint32_t totalPadding = (inputSize - 1) * stride + filterSize - outputSize;
paddingFront = totalPadding / 2;
paddingBack = totalPadding - paddingFront;
}
}
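// Worked example for the explicit-output overload (Transpose Convolution):
// inputSize=4, filterSize=3, stride=2, outputSize=8 -> totalPadding=(4-1)*2+3-8=1,
// so paddingFront=0 and paddingBack=1.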
armnn::TensorInfo ToTensorInfo(TfLiteParserImpl::TensorRawPtr tensorPtr,
const std::vector<unsigned int>& shape,
const bool outputTensor = false)
{
armnn::DataType type;
CHECK_TENSOR_PTR(tensorPtr);
switch (tensorPtr->type)
{
case tflite::TensorType_UINT8:
type = armnn::DataType::QAsymmU8;
break;
case tflite::TensorType_FLOAT32:
type = armnn::DataType::Float32;
break;
case tflite::TensorType_FLOAT16:
type = armnn::DataType::Float16;
break;
case tflite::TensorType_INT8:
if (tensorPtr->quantization->zero_point.size() == 1)
{
// Per-tensor
type = armnn::DataType::QAsymmS8;
}
else
{
// Per-channel
type = armnn::DataType::QSymmS8;
}
break;
case tflite::TensorType_INT16:
type = armnn::DataType::QSymmS16;
break;
case tflite::TensorType_INT32:
type = armnn::DataType::Signed32;
break;
case tflite::TensorType_INT64:
type = armnn::DataType::Signed64;
break;
case tflite::TensorType_BOOL:
type = armnn::DataType::Boolean;
break;
default:
{
CheckLocation location = CHECK_LOCATION();
throw ParseException(
fmt::format("Unsupported data type {} = {} for tensor: {}. {}",
tensorPtr->type,
tflite::EnumNameTensorType(tensorPtr->type),
tensorPtr->name,
location.AsString()));
}
}
TensorShape tensorShape;
std::vector<unsigned int> safeShape = shape;
if (shape.size() == 0)
{
safeShape.push_back(1);
}
if (!outputTensor)
{
tensorShape = TensorShape(armnn::numeric_cast<unsigned int>(safeShape.size()), safeShape.data());
}
else
{
size_t shapeSignatureSize = tensorPtr->shape_signature.size();
// If a shape signature exists we will use that to infer dynamic tensors
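// e.g. a shape_signature of [-1, 224, 224, 3] marks the batch dimension as dynamic; dimensions
// with value -1 become unspecified (size 0) in the resulting TensorShape via the dimension mask.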
if (shapeSignatureSize != 0)
{
// If the shape is incompatible with the shape signature override the shape
if (shapeSignatureSize != shape.size())
{
safeShape = {};
for (unsigned int i = 0; i < shapeSignatureSize; ++i)
{
unsigned int dim = tensorPtr->shape_signature[i] > -1 ?
static_cast<unsigned int>(tensorPtr->shape_signature[i]) : 0;
safeShape.push_back(dim);
}
}
std::unique_ptr<bool[]> dimMask = std::make_unique<bool[]>(tensorPtr->shape_signature.size());
bool batchOnly = true;
for (unsigned int i = 0; i < tensorPtr->shape_signature.size(); ++i)
{
dimMask[i] = tensorPtr->shape_signature[i] != -1;
if (i > 0 && !dimMask[i])
{
batchOnly = false;
}
}
if (batchOnly)
{
dimMask[0] = true;
}
tensorShape = TensorShape(static_cast<unsigned int>(safeShape.size()), safeShape.data(), dimMask.get());
}
// If there is no shape signature treat the tensor as dynamic if the shape has a size of zero
else if (shape.size() == 0)
{
tensorShape = TensorShape(1, false);
}
else
{
tensorShape = TensorShape(armnn::numeric_cast<unsigned int>(shape.size()), shape.data());
}
}
float quantizationScale = 1.0f;
int32_t quantizationOffset = 0;
if (tensorPtr->quantization.get())
{
if (tensorPtr->quantization->scale.size() <= 1)
{
CHECK_VALID_SIZE(tensorPtr->quantization->scale.size(), 0, 1);
CHECK_VALID_SIZE(tensorPtr->quantization->zero_point.size(), 0, 1);
if (tensorPtr->quantization->scale.size() == 1)
{
quantizationScale = tensorPtr->quantization->scale[0];
}
if (tensorPtr->quantization->zero_point.size() == 1)
{
// NOTE: we lose precision here when converting from 64 bit to 32
// but this is what we support at the moment in ArmNN
quantizationOffset = armnn::numeric_cast<int32_t>(tensorPtr->quantization->zero_point[0]);
}
armnn::TensorInfo result(tensorShape,
type,
quantizationScale,
quantizationOffset);
return result;
}
else
{
std::vector<float> quantizationScales;
std::vector<int32_t> quantizationOffsets;
// Scale
std::copy(tensorPtr->quantization->scale.begin(),
tensorPtr->quantization->scale.end(),
std::back_inserter(quantizationScales));
// QSymmS8 Per-axis
armnn::TensorInfo result(tensorShape,
type,
quantizationScales,
armnn::numeric_cast<unsigned int>(tensorPtr->quantization->quantized_dimension));
return result;
}
}
else
{
armnn::TensorInfo result(tensorShape,
type,
quantizationScale,
quantizationOffset);
return result;
}
}
armnn::TensorInfo ToTensorInfo(TfLiteParserImpl::TensorRawPtr tensorPtr,
const bool outputTensor = false)
{
auto const& dimensions = AsUnsignedVector(tensorPtr->shape);
return ToTensorInfo(tensorPtr, dimensions, outputTensor);
}
template<typename T>
std::pair<armnn::ConstTensor, std::unique_ptr<T[]>>
CreateConstTensorImpl(TfLiteParserImpl::BufferRawPtr bufferPtr,
TfLiteParserImpl::TensorRawPtr tensorPtr,
armnn::TensorInfo& tensorInfo,
armnn::Optional<armnn::PermutationVector&> permutationVector)
{
IgnoreUnused(tensorPtr);
if (!tensorPtr)
{
throw armnn::ParseException(fmt::format("Tensor pointer is null {}", CHECK_LOCATION().AsString()));
}
if (!bufferPtr)
{
throw armnn::ParseException(fmt::format("Buffer for buffer:{} is null", tensorPtr->buffer).c_str());
}
std::unique_ptr<T[]> data(new T[tensorInfo.GetNumElements()]);
if (permutationVector.has_value() && permutationVector.value().GetSize() > 0)
{
tensorInfo = armnnUtils::Permuted(tensorInfo, permutationVector.value());
armnnUtils::Permute(tensorInfo.GetShape(), permutationVector.value(),
reinterpret_cast<const T*>(bufferPtr->data.data()), data.get(), sizeof(T));
}
else
{
::memcpy(data.get(), bufferPtr->data.data(), tensorInfo.GetNumBytes());
}
// Make sure isConstant flag is set.
tensorInfo.SetConstant();
return std::make_pair(ConstTensor(tensorInfo, data.get()), std::move(data));
}
armnn::LayerBindingId GenerateLayerBindingId(size_t subgraphIndex, size_t tensorIndex)
{
// Generate the binding id by shifting the tensor id left by 8 bits
// and adding the subgraph id, which allows for 256 subgraphs
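// e.g. subgraph 1, tensor 5 -> binding id (5 << 8) + 1 = 1281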
return static_cast<armnn::LayerBindingId>((tensorIndex<<8)+subgraphIndex);
}
bool CheckShape(const armnn::TensorShape& actual, const std::vector<int32_t>& expected)
{
const unsigned int actualSize = actual.GetNumDimensions();
if (actualSize != expected.size())
{
return false;
}
for (unsigned int i = 0u; i < actualSize; i++)
{
if (expected[i] < 0 ||
actual[i] != static_cast<unsigned int>(expected[i]))
{
return false;
}
}
return true;
}
bool CheckShape(const armnn::TensorShape& actual, const armnn::TensorShape& expected)
{
std::vector<int32_t> expectedVec;
for (uint32_t i = 0; i < expected.GetNumDimensions(); i++)
{
expectedVec.push_back(expected[i]);
}
return CheckShape(actual, expectedVec);
}
void CheckMatchingQuantization(const TensorInfo& first,
const TensorInfo& second,
const std::string& descName,
std::string const& firstName,
std::string const& secondName)
{
if (!first.IsQuantized() ||
!second.IsQuantized())
{
// Not a quantized type, ignore the validation
return;
}
DataType firstDataType = first.GetDataType();
DataType secondDataType = second.GetDataType();
if (firstDataType != secondDataType)
{
throw InvalidArgumentException(descName + ": " + firstName + " and " + secondName +
" must be of the same quantized type, " +
firstName + " is " + GetDataTypeName(firstDataType) + ", " +
secondName + " is " + GetDataTypeName(secondDataType));
}
if (!first.IsTypeSpaceMatch(second))
{
throw InvalidArgumentException(descName + ": " + firstName + " and " + secondName +
" must have the same quantization space, " +
firstName + " has offset " + std::to_string(first.GetQuantizationOffset()) +
" and scale " + std::to_string(first.GetQuantizationScale()) + ", " +
secondName + " has offset " + std::to_string(second.GetQuantizationOffset()) +
" and scale " + std::to_string(second.GetQuantizationScale()));
}
}
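// A tensor is treated as dynamic if its shape is empty or if any entry of its shape_signature is -1.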
bool IsDynamic(TfLiteParserImpl::TensorRawPtr tensorPtr)
{
auto shape = tensorPtr->shape;
if (shape.empty())
{
return true;
}
auto shapeSig = tensorPtr->shape_signature;
if (shapeSig.empty())
{
return false;
}
for (unsigned int i = 0; i < shapeSig.size() ; ++i)
{
if (shapeSig[i] == -1)
{
return true;
}
}
return false;
}
} // <anonymous>
TfLiteParserImpl::TfLiteParserImpl(const Optional<ITfLiteParser::TfLiteParserOptions>& options)
: m_Options(options)
, m_Network(nullptr, nullptr)
, m_ParserFunctions(tflite::BuiltinOperator_MAX+1, &TfLiteParserImpl::ParseUnsupportedOperator)
{
// register supported operators
m_ParserFunctions[tflite::BuiltinOperator_ABS] = &TfLiteParserImpl::ParseAbs;
m_ParserFunctions[tflite::BuiltinOperator_ADD] = &TfLiteParserImpl::ParseAdd;
m_ParserFunctions[tflite::BuiltinOperator_ARG_MIN] = &TfLiteParserImpl::ParseArgMin;
m_ParserFunctions[tflite::BuiltinOperator_ARG_MAX] = &TfLiteParserImpl::ParseArgMax;
m_ParserFunctions[tflite::BuiltinOperator_AVERAGE_POOL_2D] = &TfLiteParserImpl::ParseAveragePool2D;
m_ParserFunctions[tflite::BuiltinOperator_BATCH_TO_SPACE_ND] = &TfLiteParserImpl::ParseBatchToSpaceND;
m_ParserFunctions[tflite::BuiltinOperator_BATCH_MATMUL] = &TfLiteParserImpl::ParseBatchMatMul;
m_ParserFunctions[tflite::BuiltinOperator_BROADCAST_TO] = &TfLiteParserImpl::ParseBroadcastTo;
m_ParserFunctions[tflite::BuiltinOperator_CEIL] = &TfLiteParserImpl::ParseCeil;
m_ParserFunctions[tflite::BuiltinOperator_CAST] = &TfLiteParserImpl::ParseCast;
m_ParserFunctions[tflite::BuiltinOperator_CONCATENATION] = &TfLiteParserImpl::ParseConcatenation;
m_ParserFunctions[tflite::BuiltinOperator_CONV_2D] = &TfLiteParserImpl::ParseConv2D;
// Conv3D support was added in TF 2.5, so for backwards compatibility a hash define is needed.
#if defined(ARMNN_POST_TFLITE_2_4)
m_ParserFunctions[tflite::BuiltinOperator_CONV_3D] = &TfLiteParserImpl::ParseConv3D;
#endif
m_ParserFunctions[tflite::BuiltinOperator_CUSTOM] = &TfLiteParserImpl::ParseCustomOperator;
m_ParserFunctions[tflite::BuiltinOperator_DEPTH_TO_SPACE] = &TfLiteParserImpl::ParseDepthToSpace;
m_ParserFunctions[tflite::BuiltinOperator_DEPTHWISE_CONV_2D] = &TfLiteParserImpl::ParseDepthwiseConv2D;
m_ParserFunctions[tflite::BuiltinOperator_DEQUANTIZE] = &TfLiteParserImpl::ParseDequantize;
m_ParserFunctions[tflite::BuiltinOperator_DIV] = &TfLiteParserImpl::ParseDiv;
m_ParserFunctions[tflite::BuiltinOperator_ELU] = &TfLiteParserImpl::ParseElu;
m_ParserFunctions[tflite::BuiltinOperator_EQUAL] = &TfLiteParserImpl::ParseEqual;
m_ParserFunctions[tflite::BuiltinOperator_EXP] = &TfLiteParserImpl::ParseExp;
m_ParserFunctions[tflite::BuiltinOperator_EXPAND_DIMS] = &TfLiteParserImpl::ParseExpandDims;
m_ParserFunctions[tflite::BuiltinOperator_FLOOR_DIV] = &TfLiteParserImpl::ParseFloorDiv;
m_ParserFunctions[tflite::BuiltinOperator_FULLY_CONNECTED] = &TfLiteParserImpl::ParseFullyConnected;
m_ParserFunctions[tflite::BuiltinOperator_GATHER] = &TfLiteParserImpl::ParseGather;
m_ParserFunctions[tflite::BuiltinOperator_GELU] = &TfLiteParserImpl::ParseGelu;
m_ParserFunctions[tflite::BuiltinOperator_GATHER_ND] = &TfLiteParserImpl::ParseGatherNd;
m_ParserFunctions[tflite::BuiltinOperator_GREATER] = &TfLiteParserImpl::ParseGreater;
m_ParserFunctions[tflite::BuiltinOperator_GREATER_EQUAL] = &TfLiteParserImpl::ParseGreaterOrEqual;
m_ParserFunctions[tflite::BuiltinOperator_HARD_SWISH] = &TfLiteParserImpl::ParseHardSwish;
m_ParserFunctions[tflite::BuiltinOperator_LEAKY_RELU] = &TfLiteParserImpl::ParseLeakyRelu;
m_ParserFunctions[tflite::BuiltinOperator_LESS] = &TfLiteParserImpl::ParseLess;
m_ParserFunctions[tflite::BuiltinOperator_LESS_EQUAL] = &TfLiteParserImpl::ParseLessOrEqual;
m_ParserFunctions[tflite::BuiltinOperator_LOCAL_RESPONSE_NORMALIZATION]
= &TfLiteParserImpl::ParseLocalResponseNormalization;
m_ParserFunctions[tflite::BuiltinOperator_LOG] = &TfLiteParserImpl::ParseLog;
m_ParserFunctions[tflite::BuiltinOperator_LOGICAL_NOT] = &TfLiteParserImpl::ParseLogicalNot;
m_ParserFunctions[tflite::BuiltinOperator_LOGISTIC] = &TfLiteParserImpl::ParseLogistic;
m_ParserFunctions[tflite::BuiltinOperator_LOG_SOFTMAX] = &TfLiteParserImpl::ParseLogSoftmax;
m_ParserFunctions[tflite::BuiltinOperator_L2_NORMALIZATION] = &TfLiteParserImpl::ParseL2Normalization;
m_ParserFunctions[tflite::BuiltinOperator_MAX_POOL_2D] = &TfLiteParserImpl::ParseMaxPool2D;
m_ParserFunctions[tflite::BuiltinOperator_MAXIMUM] = &TfLiteParserImpl::ParseMaximum;
m_ParserFunctions[tflite::BuiltinOperator_MEAN] = &TfLiteParserImpl::ParseMean;
m_ParserFunctions[tflite::BuiltinOperator_MINIMUM] = &TfLiteParserImpl::ParseMinimum;
m_ParserFunctions[tflite::BuiltinOperator_MIRROR_PAD] = &TfLiteParserImpl::ParseMirrorPad;
m_ParserFunctions[tflite::BuiltinOperator_MUL] = &TfLiteParserImpl::ParseMul;
m_ParserFunctions[tflite::BuiltinOperator_NEG] = &TfLiteParserImpl::ParseNeg;
m_ParserFunctions[tflite::BuiltinOperator_NOT_EQUAL] = &TfLiteParserImpl::ParseNotEqual;
m_ParserFunctions[tflite::BuiltinOperator_PACK] = &TfLiteParserImpl::ParsePack;
m_ParserFunctions[tflite::BuiltinOperator_PAD] = &TfLiteParserImpl::ParsePad;
m_ParserFunctions[tflite::BuiltinOperator_PADV2] = &TfLiteParserImpl::ParsePad;
m_ParserFunctions[tflite::BuiltinOperator_POW] = &TfLiteParserImpl::ParsePower;
m_ParserFunctions[tflite::BuiltinOperator_PRELU] = &TfLiteParserImpl::ParsePrelu;
m_ParserFunctions[tflite::BuiltinOperator_QUANTIZE] = &TfLiteParserImpl::ParseQuantize;
m_ParserFunctions[tflite::BuiltinOperator_RELU] = &TfLiteParserImpl::ParseRelu;
m_ParserFunctions[tflite::BuiltinOperator_RELU6] = &TfLiteParserImpl::ParseRelu6;
m_ParserFunctions[tflite::BuiltinOperator_REDUCE_MAX] = &TfLiteParserImpl::ParseReduceMax;
m_ParserFunctions[tflite::BuiltinOperator_REDUCE_MIN] = &TfLiteParserImpl::ParseReduceMin;
m_ParserFunctions[tflite::BuiltinOperator_REDUCE_PROD] = &TfLiteParserImpl::ParseReduceProd;
m_ParserFunctions[tflite::BuiltinOperator_RESHAPE] = &TfLiteParserImpl::ParseReshape;
m_ParserFunctions[tflite::BuiltinOperator_RESIZE_BILINEAR] = &TfLiteParserImpl::ParseResizeBilinear;
m_ParserFunctions[tflite::BuiltinOperator_RESIZE_NEAREST_NEIGHBOR] = &TfLiteParserImpl::ParseResizeNearestNeighbor;
m_ParserFunctions[tflite::BuiltinOperator_REVERSE_V2] = &TfLiteParserImpl::ParseReverseV2;
m_ParserFunctions[tflite::BuiltinOperator_RSQRT] = &TfLiteParserImpl::ParseRsqrt;
m_ParserFunctions[tflite::BuiltinOperator_SCATTER_ND] = &TfLiteParserImpl::ParseScatterNd;
m_ParserFunctions[tflite::BuiltinOperator_SQRT] = &TfLiteParserImpl::ParseSqrt;
m_ParserFunctions[tflite::BuiltinOperator_SHAPE] = &TfLiteParserImpl::ParseShape;
m_ParserFunctions[tflite::BuiltinOperator_SIN] = &TfLiteParserImpl::ParseSin;
m_ParserFunctions[tflite::BuiltinOperator_SLICE] = &TfLiteParserImpl::ParseSlice;
m_ParserFunctions[tflite::BuiltinOperator_SOFTMAX] = &TfLiteParserImpl::ParseSoftmax;
m_ParserFunctions[tflite::BuiltinOperator_SPACE_TO_BATCH_ND] = &TfLiteParserImpl::ParseSpaceToBatchND;
m_ParserFunctions[tflite::BuiltinOperator_SPACE_TO_DEPTH] = &TfLiteParserImpl::ParseSpaceToDepth;
m_ParserFunctions[tflite::BuiltinOperator_SPLIT] = &TfLiteParserImpl::ParseSplit;
m_ParserFunctions[tflite::BuiltinOperator_SPLIT_V] = &TfLiteParserImpl::ParseSplitV;
m_ParserFunctions[tflite::BuiltinOperator_SQUEEZE] = &TfLiteParserImpl::ParseSqueeze;
m_ParserFunctions[tflite::BuiltinOperator_SQUARE] = &TfLiteParserImpl::ParseSquare;
m_ParserFunctions[tflite::BuiltinOperator_SQUARED_DIFFERENCE] = &TfLiteParserImpl::ParseSquaredDifference;
m_ParserFunctions[tflite::BuiltinOperator_STRIDED_SLICE] = &TfLiteParserImpl::ParseStridedSlice;
m_ParserFunctions[tflite::BuiltinOperator_SUB] = &TfLiteParserImpl::ParseSub;
m_ParserFunctions[tflite::BuiltinOperator_SUM] = &TfLiteParserImpl::ParseSum;
m_ParserFunctions[tflite::BuiltinOperator_TANH] = &TfLiteParserImpl::ParseTanH;
m_ParserFunctions[tflite::BuiltinOperator_TILE] = &TfLiteParserImpl::ParseTile;
m_ParserFunctions[tflite::BuiltinOperator_TRANSPOSE] = &TfLiteParserImpl::ParseTranspose;
m_ParserFunctions[tflite::BuiltinOperator_TRANSPOSE_CONV] = &TfLiteParserImpl::ParseTransposeConv;
m_ParserFunctions[tflite::BuiltinOperator_UNIDIRECTIONAL_SEQUENCE_LSTM]
= &TfLiteParserImpl::ParseUnidirectionalSequenceLSTM;
m_ParserFunctions[tflite::BuiltinOperator_UNPACK] = &TfLiteParserImpl::ParseUnpack;
// register supported custom operators
m_CustomParserFunctions["TFLite_Detection_PostProcess"] = &TfLiteParserImpl::ParseDetectionPostProcess;
}
armnn::TensorInfo TfLiteParserImpl::InputTensorInfo(size_t subgraphIndex,
size_t operatorIndex,
int input)
{
const auto& subgraphPtr = m_Model->subgraphs[subgraphIndex];
const auto& operatorPtr = m_Model->subgraphs[subgraphIndex]->operators[operatorIndex];
uint32_t inputId = CHECKED_NON_NEGATIVE(operatorPtr->inputs[input]);
auto search = armnnTfLiteParser::TfLiteParserImpl::m_TensorInfos.find(inputId);
if (search != m_TensorInfos.end())
{
return m_TensorInfos[inputId];
}
else
{
auto tensorInfo = ::armnnTfLiteParser::ToTensorInfo(subgraphPtr->tensors[inputId].get());
m_TensorInfos.insert({ inputId, tensorInfo });
return tensorInfo;
}
}
armnn::TensorInfo TfLiteParserImpl::OutputTensorInfoFromInputs(size_t subgraphIndex,
size_t operatorIndex,
armnn::IConnectableLayer* layer,
int output,
std::vector<int> inputs)
{
const auto& subgraphPtr = m_Model->subgraphs[subgraphIndex];
const auto& operatorPtr = m_Model->subgraphs[subgraphIndex]->operators[operatorIndex];
uint32_t outputId = CHECKED_NON_NEGATIVE(operatorPtr->outputs[output]);
auto outputSearch = armnnTfLiteParser::TfLiteParserImpl::m_TensorInfos.find(outputId);
if (outputSearch != m_TensorInfos.end())
{
return m_TensorInfos[outputId];
}
const auto& outputTensorPtr = subgraphPtr->tensors[outputId].get();
TensorInfo tensor = ::armnnTfLiteParser::ToTensorInfo(outputTensorPtr, true);
if (IsDynamic(outputTensorPtr))
{
if (inputs.empty())
{
for (unsigned int i = 0; i < layer->GetNumInputSlots(); ++i)
{
inputs.emplace_back(i);
}
}
auto inputTensorIds = GetInputTensorIds(m_Model, subgraphIndex, operatorIndex);
std::vector<armnn::TensorShape> inputShapes;
for (unsigned int i = 0; i < inputs.size(); ++i)
{
uint32_t inputId = CHECKED_NON_NEGATIVE(operatorPtr->inputs[inputs[i]]);
auto search = armnnTfLiteParser::TfLiteParserImpl::m_TensorInfos.find(inputId);
if (search != m_TensorInfos.end())
{
auto &inputTensorInfo = m_TensorInfos[inputId];
inputShapes.push_back(inputTensorInfo.GetShape());
}
else
{
auto inputTensorInfo = ::armnnTfLiteParser::ToTensorInfo(subgraphPtr->tensors[inputId].get());
m_TensorInfos.insert({ inputId, inputTensorInfo});
inputShapes.push_back(inputTensorInfo.GetShape());
}
}
const auto outputShape = layer->InferOutputShapes(inputShapes)[output];
tensor.SetShape(outputShape);
}
m_TensorInfos.insert({ outputId, tensor});
return tensor;
}
armnn::TensorInfo TfLiteParserImpl::OutputTensorInfoFromShapes(size_t subgraphIndex,
size_t operatorIndex,
armnn::IConnectableLayer* layer,
int output,
std::vector<armnn::TensorShape> inputShapes)
{
const auto& subgraphPtr = m_Model->subgraphs[subgraphIndex];
const auto& operatorPtr = m_Model->subgraphs[subgraphIndex]->operators[operatorIndex];
uint32_t outputId = CHECKED_NON_NEGATIVE(operatorPtr->outputs[output]);
const auto& outputTensorPtr = subgraphPtr->tensors[outputId].get();
TensorInfo tensor = ::armnnTfLiteParser::ToTensorInfo(outputTensorPtr, true);
if (IsDynamic(outputTensorPtr))
{
const auto outputShape = layer->InferOutputShapes(inputShapes)[output];
tensor.SetShape(outputShape);
}
m_TensorInfos.insert({ outputId, tensor});
return tensor;
}
void TfLiteParserImpl::ResetParser()
{
m_Network = armnn::INetworkPtr(nullptr, nullptr);
m_Model = nullptr;
m_SubgraphConnections.clear();
m_OverriddenOutputShapes.clear();
m_ConstantsToDequantize.clear();
m_ConstantsToBeCreated.clear();
m_TensorInfos.clear();
}
INetworkPtr TfLiteParserImpl::CreateNetworkFromBinaryFile(const char* graphFile)
{
ResetParser();
m_Model = LoadModelFromFile(graphFile);
return CreateNetworkFromModel();
}
INetworkPtr TfLiteParserImpl::CreateNetworkFromBinary(const std::vector<uint8_t>& binaryContent)
{
ResetParser();
m_Model = LoadModelFromBinary(binaryContent.data(), binaryContent.size());
return CreateNetworkFromModel();
}
armnn::INetworkPtr TfLiteParserImpl::LoadModel(std::unique_ptr<tflite::ModelT> model)
{
ResetParser();
m_Model = std::move(model);
return CreateNetworkFromModel();
}
INetworkPtr TfLiteParserImpl::CreateNetworkFromModel()
{
using NetworkOptions = std::vector<BackendOptions>;
NetworkOptions networkOptions = {};
if (m_Options)
{
if (m_Options.value().m_InferAndValidate)
{
BackendOptions shapeInferenceMethodOption("ShapeInferenceMethod",
{
{ "InferAndValidate", true }
});
networkOptions.push_back(shapeInferenceMethodOption);
}
if (m_Options.value().m_AllowExpandedDims)
{
BackendOptions shapeInferenceMethodOption("AllowExpandedDims",
{
{ "AllowExpandedDims", true }
});
networkOptions.push_back(shapeInferenceMethodOption);
}
}
m_Network = INetwork::Create(networkOptions);
if (m_Model.get() == nullptr)
{
throw ParseException(fmt::format("Tflite Model pointer is null {}", CHECK_LOCATION().AsString()));
}
// Identify which subgraph we are going to parse. We only support one subgraph but there may be validation
// subgraphs still stored in the model. We'll ignore these. In the tflite code base they are identified by
// their name beginning with "VALIDATION:".
size_t subgraphIndex = 0;
uint8_t usableSubgraphs = 0;
for (size_t i = 0; i < m_Model->subgraphs.size(); i++)
{
if (m_Model->subgraphs[i]->name.rfind("VALIDATION:", 0) != 0)
{
usableSubgraphs++;
subgraphIndex = i;
}
}
if (usableSubgraphs > 1)
{
throw ParseException(
fmt::format("Current TfLite parser only supports 1 non validation subgraph. This model has: {} {}",
usableSubgraphs, CHECK_LOCATION().AsString()));
}
size_t operatorIndex = 0;
try
{
const SubgraphPtr& subgraph = m_Model->subgraphs[subgraphIndex];
SetupInputLayerTensorInfos(subgraphIndex);
SetupConstantLayerTensorInfos(subgraphIndex);
m_SubgraphConnections.emplace_back(subgraph->tensors.size());
for (const OperatorPtr& op : subgraph->operators)
{
const auto& opCodePtr = m_Model->operator_codes[op->opcode_index];
// Work around the deprecated_builtin_code field introduced in 2.4 in a backwards-compatible manner
#if defined(ARMNN_POST_TFLITE_2_3)
auto builtinCode = std::max(opCodePtr->builtin_code,
static_cast<tflite::BuiltinOperator>(opCodePtr->deprecated_builtin_code));
#else
auto builtinCode = opCodePtr->builtin_code;
#endif
if (builtinCode > tflite::BuiltinOperator_MAX)
{
throw ParseException(fmt::format("Operator code {} is out of range 0-{}. "
"subgraph:{} operator idx:{}. {}",
builtinCode, tflite::BuiltinOperator_MAX, subgraphIndex,
operatorIndex, CHECK_LOCATION().AsString()));
}
// lookup and call the parser function
auto& parserFunction = m_ParserFunctions[builtinCode];
(this->*parserFunction)(subgraphIndex, operatorIndex);
++operatorIndex;
}
SetupInputLayers(subgraphIndex);
SetupOutputLayers(subgraphIndex);
SetupConstantLayers(subgraphIndex);
}
catch (const ParseException& e)
{
std::stringstream errorString;
errorString << "Failed to parse operator #" << operatorIndex << " within subgraph #"
<< subgraphIndex << " error: " << e.what();
ARMNN_LOG(error) << errorString.str();
std::stringstream errors;
errors << errorString.str() << "\n";
throw ParseException(errors.str());
}
// establish the connections from the layer outputs to the inputs of the subsequent layers
for (subgraphIndex = 0; subgraphIndex < m_SubgraphConnections.size(); ++subgraphIndex)
{
for (size_t tensorIndex = 0; tensorIndex < m_SubgraphConnections[subgraphIndex].size(); ++tensorIndex)
{
if (m_SubgraphConnections[subgraphIndex][tensorIndex].outputSlot != nullptr)
{
for (size_t inputSlotIdx = 0;
inputSlotIdx < m_SubgraphConnections[subgraphIndex][tensorIndex].inputSlots.size();
++inputSlotIdx)
{
m_SubgraphConnections[subgraphIndex][tensorIndex].outputSlot->Connect(
*(m_SubgraphConnections[subgraphIndex][tensorIndex].inputSlots[inputSlotIdx]));
}
}
}
}
return std::move(m_Network);
}
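// Returns true when a constant quantized or integer tensor feeds a Float32 layer input, i.e. the
// constant will need to be dequantized/converted to Float32 (see m_ConstantsToDequantize below).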
bool TfLiteParserImpl::ShouldConstantTensorBeConverted(TfLiteParserImpl::TensorRawPtr tensorPtr,
armnn::DataType inputDataType,
armnn::DataType tensorDataType)
{
return (TfLiteParserImpl::IsConstTensor(tensorPtr) && inputDataType == DataType::Float32 &&
(tensorDataType == DataType::QAsymmU8 ||
tensorDataType == DataType::QAsymmS8 ||
tensorDataType == DataType::QSymmS8 ||
tensorDataType == DataType::Signed32 ||
tensorDataType == DataType::Signed64));
}
void TfLiteParserImpl::RegisterProducerOfTensor(size_t subgraphIndex,
size_t tensorIndex,
armnn::IOutputSlot* slot)
{
CHECK_TENSOR(m_Model, subgraphIndex, tensorIndex);
TensorSlots & tensorSlots = m_SubgraphConnections[subgraphIndex][tensorIndex];
if (slot->GetOwningIConnectableLayer().GetType() != LayerType::Constant)
{
// assuming there is only one producer for that tensor
if (tensorSlots.outputSlot != nullptr)
{
throw ParseException(fmt::format("Another layer has already registered itself as the producer of "
"subgraph:{} tensor:{} {}",
subgraphIndex,
tensorIndex,
CHECK_LOCATION().AsString()));
}
}
tensorSlots.outputSlot = slot;
}
void TfLiteParserImpl::RegisterConsumerOfTensor(size_t subgraphIndex,
size_t tensorIndex,
armnn::IInputSlot* slot)
{
CHECK_TENSOR(m_Model, subgraphIndex, tensorIndex);
TensorSlots& tensorSlots = m_SubgraphConnections[subgraphIndex][tensorIndex];
tensorSlots.inputSlots.push_back(slot);
}
void TfLiteParserImpl::ParseCustomOperator(size_t subgraphIndex, size_t operatorIndex)
{
CHECK_MODEL(m_Model, subgraphIndex, operatorIndex);
// NOTE: By default we presume the custom operator is not supported
auto customParserFunction = &TfLiteParserImpl::ParseUnsupportedOperator;
// Identify custom code defined for custom operator
const auto& operatorPtr = m_Model->subgraphs[subgraphIndex]->operators[operatorIndex];
const auto& customCode = m_Model->operator_codes[operatorPtr->opcode_index]->custom_code;
// Find parser function that corresponds to custom code (if any)
auto iterator = m_CustomParserFunctions.find(customCode);
if (iterator != m_CustomParserFunctions.end())
{
customParserFunction = iterator->second;
}
// Run parser function
(this->*customParserFunction)(subgraphIndex, operatorIndex);
}
void TfLiteParserImpl::ParseUnsupportedOperator(size_t subgraphIndex, size_t operatorIndex)
{
CHECK_MODEL(m_Model, subgraphIndex, operatorIndex);
const auto & operatorPtr = m_Model->subgraphs[subgraphIndex]->operators[operatorIndex];
auto opcodeIndex = operatorPtr->opcode_index;
// Work around the deprecated_builtin_code field introduced in 2.4 in a backwards-compatible manner
#if defined(ARMNN_POST_TFLITE_2_3)
auto opcode = std::max(m_Model->operator_codes[opcodeIndex]->builtin_code,
static_cast<tflite::BuiltinOperator>(m_Model->operator_codes[opcodeIndex]->deprecated_builtin_code));
#else
auto opcode = m_Model->operator_codes[opcodeIndex]->builtin_code;
#endif
if (!m_Options || !m_Options.value().m_StandInLayerForUnsupported)
{
// Do not add StandInLayer, throw ParseException instead
throw ParseException(
fmt::format("Operator not supported. "
"subgraph:{} operator:{} "
"opcode_index:{} opcode:{} / {} {}",
subgraphIndex,
operatorIndex,
opcodeIndex,
opcode,
tflite::EnumNameBuiltinOperator(opcode),
CHECK_LOCATION().AsString()));
}
auto inputs = GetInputs(m_Model, subgraphIndex, operatorIndex);
auto outputs = GetOutputs(m_Model, subgraphIndex, operatorIndex);
const unsigned int numInputs = armnn::numeric_cast<unsigned int>(inputs.size());
const unsigned int numOutputs = armnn::numeric_cast<unsigned int>(outputs.size());
StandInDescriptor descriptor(numInputs, numOutputs);
auto layerName = fmt::format("StandIn:{}:{}:{}", subgraphIndex, operatorIndex, opcode);
// Add a non-executable StandInLayer as a placeholder for any unsupported operator
IConnectableLayer* layer = m_Network->AddStandInLayer(descriptor, layerName.c_str());
if (!layer)
{
throw NullPointerException(fmt::format("Layer {} pointer is null {}",
operatorIndex, CHECK_LOCATION().AsString()));
}
for (unsigned int i = 0u; i < numOutputs; ++i)
{
layer->GetOutputSlot(i).SetTensorInfo(ToTensorInfo(outputs[i], true));
}
auto inputTensorIds = AsUnsignedVector(GetInputTensorIds(m_Model, subgraphIndex, operatorIndex));
auto outputTensorIds = AsUnsignedVector(GetOutputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterInputSlots(subgraphIndex, operatorIndex, layer, inputTensorIds);
RegisterOutputSlots(subgraphIndex, operatorIndex, layer, outputTensorIds);
}
void TfLiteParserImpl::ParseCast(size_t subgraphIndex, size_t operatorIndex)
{
CHECK_MODEL(m_Model, subgraphIndex, operatorIndex);
auto inputs = GetInputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(inputs.size(), 1);
auto outputs = GetOutputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(outputs.size(), 1);
auto layerName = fmt::format("Cast:{}:{}", subgraphIndex, operatorIndex);
IConnectableLayer* layer = m_Network->AddCastLayer(layerName.c_str());
if (!layer)
{
throw NullPointerException(fmt::format("Layer {} pointer is null {}",
operatorIndex, CHECK_LOCATION().AsString()));
}
TensorInfo outputTensorInfo = OutputTensorInfoFromInputs(subgraphIndex, operatorIndex, layer, 0, {0});
layer->GetOutputSlot(0).SetTensorInfo(outputTensorInfo);
auto inputTensorIndexes = AsUnsignedVector(GetInputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterInputSlots(subgraphIndex, operatorIndex, layer, {inputTensorIndexes[0]});
auto outputTensorIndexes = AsUnsignedVector(GetOutputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterOutputSlots(subgraphIndex, operatorIndex, layer, outputTensorIndexes);
}
void TfLiteParserImpl::ParseConv2D(size_t subgraphIndex, size_t operatorIndex)
{
CHECK_MODEL(m_Model, subgraphIndex, operatorIndex);
const auto& operatorPtr = m_Model->subgraphs[subgraphIndex]->operators[operatorIndex];
const auto* options = operatorPtr->builtin_options.AsConv2DOptions();
CHECK_SUPPORTED_FUSED_ACTIVATION(options, subgraphIndex, operatorIndex);
auto inputs = GetInputs(m_Model, subgraphIndex, operatorIndex);
auto outputs = GetOutputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(outputs.size(), 1);
Convolution2dDescriptor desc;
desc.m_BiasEnabled = (inputs.size() == 3);
desc.m_StrideX = CHECKED_NON_NEGATIVE(options->stride_w);
desc.m_StrideY = CHECKED_NON_NEGATIVE(options->stride_h);
desc.m_DataLayout = armnn::DataLayout::NHWC;
desc.m_DilationX = CHECKED_NON_NEGATIVE(options->dilation_w_factor);
desc.m_DilationY = CHECKED_NON_NEGATIVE(options->dilation_h_factor);
armnn::TensorInfo inputTensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 0);
armnn::TensorInfo filterTensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 1);
// assuming input is NHWC
unsigned int inputHeight = inputTensorInfo.GetShape()[1];
unsigned int inputWidth = inputTensorInfo.GetShape()[2];
// assuming the filter is OHWI : Output, H, W, Input
// which is essentially the same as NHWC
unsigned int filterHeight = filterTensorInfo.GetShape()[1];
unsigned int filterWidth = filterTensorInfo.GetShape()[2];
CalcPadding(inputHeight, filterHeight, desc.m_StrideY,
desc.m_DilationY, desc.m_PadTop, desc.m_PadBottom, options->padding);
CalcPadding(inputWidth, filterWidth, desc.m_StrideX,
desc.m_DilationX, desc.m_PadLeft, desc.m_PadRight, options->padding);
// Add the first input and weights tensor to the registration list.
// The constant weights will be added by SetupConstantLayers.
auto inputTensorIndexes = AsUnsignedVector(GetInputTensorIds(m_Model, subgraphIndex, operatorIndex));
std::vector<unsigned int> tensorIndexesToRegister = { inputTensorIndexes[0], inputTensorIndexes[1] };
auto layerName = fmt::format("Conv2D:{}:{}", subgraphIndex, operatorIndex);
armnn::IConnectableLayer* layer = m_Network->AddConvolution2dLayer(desc, layerName.c_str());
if (ShouldConstantTensorBeConverted(inputs[1], inputTensorInfo.GetDataType(), filterTensorInfo.GetDataType()))
{
m_ConstantsToDequantize.emplace_back(inputs[1]->buffer);
}
if (desc.m_BiasEnabled)
{
armnn::TensorInfo biasTensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 2);
// Add the biases input to the registration list, a constant layer will be added by SetupConstantLayers.
tensorIndexesToRegister.emplace_back(inputTensorIndexes[2]);
if (ShouldConstantTensorBeConverted(inputs[2], inputTensorInfo.GetDataType(), biasTensorInfo.GetDataType()))
{
m_ConstantsToDequantize.emplace_back(inputs[2]->buffer);
}
}
if (!layer)
{
throw NullPointerException(fmt::format("Layer {} pointer is null {}",
operatorIndex, CHECK_LOCATION().AsString()));
}
armnn::TensorInfo outputTensorInfo = OutputTensorInfoFromInputs(subgraphIndex, operatorIndex, layer, 0, {0, 1});
layer->GetOutputSlot(0).SetTensorInfo(outputTensorInfo);
// register the input connection slots for the layer, connections are made after all layers have been created
// only the tensors for the inputs are relevant, exclude the const tensors
RegisterInputSlots(subgraphIndex, operatorIndex, layer, tensorIndexesToRegister);
layer = AddFusedActivationLayer(layer, 0, options->fused_activation_function);
// register the output connection slots for the layer, connections are made after all layers have been created
auto outputTensorIndexes = AsUnsignedVector(GetOutputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterOutputSlots(subgraphIndex, operatorIndex, layer, { outputTensorIndexes[0] });
}
// Conv3D support was added in TF 2.5, so for backwards compatibility a hash define is needed.
#if defined(ARMNN_POST_TFLITE_2_4)
void TfLiteParserImpl::ParseConv3D(size_t subgraphIndex, size_t operatorIndex)
{
CHECK_MODEL(m_Model, subgraphIndex, operatorIndex);
const auto& operatorPtr = m_Model->subgraphs[subgraphIndex]->operators[operatorIndex];
const auto* options = operatorPtr->builtin_options.AsConv3DOptions();
CHECK_SUPPORTED_FUSED_ACTIVATION(options, subgraphIndex, operatorIndex);
Convolution3dDescriptor desc;
desc.m_BiasEnabled = false;
desc.m_DataLayout = armnn::DataLayout::NDHWC;
desc.m_StrideX = CHECKED_NON_NEGATIVE(options->stride_w);
desc.m_StrideY = CHECKED_NON_NEGATIVE(options->stride_h);
desc.m_StrideZ = CHECKED_NON_NEGATIVE(options->stride_d);
desc.m_DilationX = CHECKED_NON_NEGATIVE(options->dilation_w_factor);
desc.m_DilationY = CHECKED_NON_NEGATIVE(options->dilation_h_factor);
desc.m_DilationZ = CHECKED_NON_NEGATIVE(options->dilation_d_factor);
auto inputs = GetInputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(inputs.size(), 2, 3);
auto outputs = GetOutputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(outputs.size(), 1);
armnn::TensorInfo inputTensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 0);
armnn::TensorInfo filterTensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 1);
// Assuming input is NDHWC
unsigned int inputDepth = inputTensorInfo.GetShape()[1];
unsigned int inputHeight = inputTensorInfo.GetShape()[2];
unsigned int inputWidth = inputTensorInfo.GetShape()[3];
// Assuming the filter is DHWIO : Depth, Height, Width, OutputChannels, InputChannels
unsigned int filterDepth = filterTensorInfo.GetShape()[0];
unsigned int filterHeight = filterTensorInfo.GetShape()[1];
unsigned int filterWidth = filterTensorInfo.GetShape()[2];
CalcPadding(inputDepth, filterDepth, desc.m_StrideZ,
desc.m_DilationZ, desc.m_PadFront, desc.m_PadBack, options->padding);
CalcPadding(inputHeight, filterHeight, desc.m_StrideY,
desc.m_DilationY, desc.m_PadTop, desc.m_PadBottom, options->padding);
CalcPadding(inputWidth, filterWidth, desc.m_StrideX,
desc.m_DilationX, desc.m_PadLeft, desc.m_PadRight, options->padding);
auto filterTensorAndData = CreateConstTensorNonPermuted(inputs[1], filterTensorInfo, inputTensorInfo.GetDataType());
auto layerName = fmt::format("Conv3D:{}:{}", subgraphIndex, operatorIndex);
auto inputTensorIndexes = AsUnsignedVector(GetInputTensorIds(m_Model, subgraphIndex, operatorIndex));
// Add the first input and weights tensor to the registration list.
// The constant weights will be added by SetupConstantLayers.
std::vector<unsigned int> tensorIndexesToRegister = {inputTensorIndexes[0], inputTensorIndexes[1]};
if (inputs.size() == 3)
{
desc.m_BiasEnabled = true;
// Add the biases input to the registration list, a constant layer will be added by SetupConstantLayers.
tensorIndexesToRegister.emplace_back(inputTensorIndexes[2]);
}
armnn::IConnectableLayer* layer = m_Network->AddConvolution3dLayer(desc, layerName.c_str());
if (!layer)
{
throw NullPointerException(fmt::format("Layer {} pointer is null {}",
operatorIndex, CHECK_LOCATION().AsString()));
}
armnn::TensorInfo outputTensorInfo = OutputTensorInfoFromInputs(subgraphIndex, operatorIndex, layer, 0, {0, 1});
layer->GetOutputSlot(0).SetTensorInfo(outputTensorInfo);
// Register the input connection slots for the layer, connections are made after all layers have been created
RegisterInputSlots(subgraphIndex, operatorIndex, layer, tensorIndexesToRegister);
layer = AddFusedActivationLayer(layer, 0, options->fused_activation_function);
// Register the output connection slots for the layer, connections are made after all layers have been created
auto outputTensorIndexes = AsUnsignedVector(GetOutputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterOutputSlots(subgraphIndex, operatorIndex, layer, {outputTensorIndexes[0]});
}
#endif
void TfLiteParserImpl::ParseDepthwiseConv2D(size_t subgraphIndex, size_t operatorIndex)
{
CHECK_MODEL(m_Model, subgraphIndex, operatorIndex);
const auto& operatorPtr = m_Model->subgraphs[subgraphIndex]->operators[operatorIndex];
const auto* options = operatorPtr->builtin_options.AsDepthwiseConv2DOptions();
CHECK_SUPPORTED_FUSED_ACTIVATION(options, subgraphIndex, operatorIndex);
DepthwiseConvolution2dDescriptor desc;
desc.m_StrideX = CHECKED_NON_NEGATIVE(options->stride_w);
desc.m_StrideY = CHECKED_NON_NEGATIVE(options->stride_h);
desc.m_DataLayout = armnn::DataLayout::NHWC;
CHECKED_NON_NEGATIVE(options->depth_multiplier);
auto inputs = GetInputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(inputs.size(), 2, 3);
if (inputs.size() == 3)
{
desc.m_BiasEnabled = true;
}
auto outputs = GetOutputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(outputs.size(), 1);
desc.m_DilationX = CHECKED_NON_NEGATIVE(options->dilation_w_factor);
desc.m_DilationY = CHECKED_NON_NEGATIVE(options->dilation_h_factor);
armnn::TensorInfo inputTensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 0);
armnn::TensorInfo filterTensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 1);
// Assuming input is NHWC
unsigned int inputHeight = inputTensorInfo.GetShape()[1];
unsigned int inputWidth = inputTensorInfo.GetShape()[2];
// TensorFlow Lite weights come in the format [1, H, W, I * M]
unsigned int filterHeight = filterTensorInfo.GetShape()[1];
unsigned int filterWidth = filterTensorInfo.GetShape()[2];
CalcPadding(inputHeight, filterHeight, desc.m_StrideY,
desc.m_DilationY, desc.m_PadTop, desc.m_PadBottom, options->padding);
CalcPadding(inputWidth, filterWidth, desc.m_StrideX,
desc.m_DilationX, desc.m_PadLeft, desc.m_PadRight, options->padding);
// ArmNN uses the same filter tensor layout as TfLite [1, H, W, O]; no permutation is needed
auto layerName = fmt::format("DepthwiseConv2D:{}:{}", subgraphIndex, operatorIndex);
auto inputTensorIndexes = AsUnsignedVector(GetInputTensorIds(m_Model, subgraphIndex, operatorIndex));
// Add the first input and weights tensor to the registration list.
// The constant weights will be added by SetupConstantLayers.
std::vector<unsigned int> tensorIndexesToRegister = {inputTensorIndexes[0], inputTensorIndexes[1]};
armnn::IConnectableLayer* layer = m_Network->AddDepthwiseConvolution2dLayer(desc, layerName.c_str());
if (desc.m_BiasEnabled)
{
desc.m_BiasEnabled = true;
TensorInfo biasTensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 2);
// Add the biases input to the registration list, a constant layer will be added by SetupConstantLayers.
tensorIndexesToRegister.emplace_back(inputTensorIndexes[2]);
}
if (!layer)
{
throw NullPointerException(fmt::format("Layer {} pointer is null {}",
operatorIndex, CHECK_LOCATION().AsString()));
}
armnn::TensorInfo outputTensorInfo = OutputTensorInfoFromInputs(subgraphIndex, operatorIndex, layer, 0, {0, 1});
layer->GetOutputSlot(0).SetTensorInfo(outputTensorInfo);
// register the input connection slots for the layer, connections are made after all layers have been created
// only the tensors for the inputs are relevant, exclude the const tensors
RegisterInputSlots(subgraphIndex, operatorIndex, layer, tensorIndexesToRegister);
layer = AddFusedActivationLayer(layer, 0, options->fused_activation_function);
// register the output connection slots for the layer, connections are made after all layers have been created
auto outputTensorIndexes = AsUnsignedVector(GetOutputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterOutputSlots(subgraphIndex, operatorIndex, layer, {outputTensorIndexes[0]});
}
void TfLiteParserImpl::ParseDequantize(size_t subgraphIndex, size_t operatorIndex)
{
CHECK_MODEL(m_Model, subgraphIndex, operatorIndex);
auto inputs = GetInputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(inputs.size(), 1);
auto outputs = GetOutputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(outputs.size(), 1);
auto layerName = fmt::format("Dequantize:{}:{}", subgraphIndex, operatorIndex);
IConnectableLayer* layer = m_Network->AddDequantizeLayer(layerName.c_str());
if (!layer)
{
throw NullPointerException(fmt::format("Layer {} pointer is null {}",
operatorIndex, CHECK_LOCATION().AsString()));
}
TensorInfo outputTensorInfo = OutputTensorInfoFromInputs(subgraphIndex, operatorIndex, layer, 0, {0});
layer->GetOutputSlot(0).SetTensorInfo(outputTensorInfo);
auto inputTensorIndexes = AsUnsignedVector(GetInputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterInputSlots(subgraphIndex, operatorIndex, layer, {inputTensorIndexes[0]});
auto outputTensorIndexes = AsUnsignedVector(GetOutputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterOutputSlots(subgraphIndex, operatorIndex, layer, outputTensorIndexes);
}
void TfLiteParserImpl::ParseExpandDims(size_t subgraphIndex, size_t operatorIndex)
{
CHECK_MODEL(m_Model, subgraphIndex, operatorIndex);
auto inputs = GetInputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(inputs.size(), 2);
auto outputs = GetOutputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(outputs.size(), 1);
auto layerName = fmt::format("ExpandDims:{}:{}", subgraphIndex, operatorIndex);
armnn::TensorInfo inputTensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 0);
armnn::TensorInfo outputTensorInfo = ToTensorInfo(outputs[0], true);
CheckMatchingQuantization(inputTensorInfo, outputTensorInfo, layerName, "Input 0", "Output 0");
armnn::TensorInfo axisTensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 1);
BufferRawPtr axisBufferPtr = GetBuffer(m_Model, inputs[1]->buffer);
if (axisBufferPtr == nullptr)
{
throw ParseException(fmt::format("{}: Operation has invalid inputs. Failed to read axis.",
CHECK_LOCATION().AsString()));
}
std::vector<int32_t> axisData(axisTensorInfo.GetNumElements());
::memcpy(axisData.data(), axisBufferPtr->data.data(), axisTensorInfo.GetNumBytes());
int32_t axis = axisData[0];
auto inputRank = static_cast<int32_t>(inputTensorInfo.GetShape().GetNumDimensions());
auto outputRank = inputRank + 1;
if((axis < -1 * outputRank) || (outputRank <= axis))
{
throw ParseException(fmt::format("{}: Axis {} is not within [-{}, {}) range.",
CHECK_LOCATION().AsString(), axis, outputRank, outputRank));
}
axis = axis < 0 ? (axis + outputRank) : axis;
std::vector<unsigned int> shape(static_cast<unsigned int>(outputRank));
unsigned int inputShapeIndex = 0;
for (unsigned int i = 0; i < static_cast<unsigned int>(outputRank); ++i)
{
if (i == static_cast<unsigned int>(axis))
{
shape[i] = 1;
}
else
{
shape[i] = inputTensorInfo.GetShape()[inputShapeIndex];
++inputShapeIndex;
}
}
ReshapeDescriptor reshapeDesc;
reshapeDesc.m_TargetShape = TensorShape(static_cast<unsigned int>(outputRank), shape.data());
outputTensorInfo.SetShape(reshapeDesc.m_TargetShape);
IConnectableLayer* layer = m_Network->AddReshapeLayer(reshapeDesc, layerName.c_str());
if (!layer)
{
throw NullPointerException(fmt::format("Layer {} pointer is null {}",
operatorIndex, CHECK_LOCATION().AsString()));
}
layer->GetOutputSlot(0).SetTensorInfo(outputTensorInfo);
auto outputTensorIds = GetOutputTensorIds(m_Model, subgraphIndex, operatorIndex);
m_TensorInfos[outputTensorIds[0]] = outputTensorInfo;
auto inputTensorIndexes = AsUnsignedVector(GetInputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterInputSlots(subgraphIndex, operatorIndex, layer, {inputTensorIndexes[0]});
auto outputTensorIndexes = AsUnsignedVector(GetOutputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterOutputSlots(subgraphIndex, operatorIndex, layer, {outputTensorIndexes[0]});
}
void TfLiteParserImpl::ParseTranspose(size_t subgraphIndex, size_t operatorIndex)
{
CHECK_MODEL(m_Model, subgraphIndex, operatorIndex);
auto inputs = GetInputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(inputs.size(), 1, 2);
auto outputs = GetOutputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(outputs.size(), 1);
auto layerName = fmt::format("Transpose:{}:{}", subgraphIndex, operatorIndex);
TransposeDescriptor desc;
if (inputs.size() == 2)
{
armnn::TensorInfo permuteTensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 1);
BufferRawPtr permuteBufferPtr = GetBuffer(m_Model, inputs[1]->buffer);
auto numPermVecElements = permuteTensorInfo.GetNumElements();
std::vector<unsigned int> permuteShape(numPermVecElements);
::memcpy(permuteShape.data(), permuteBufferPtr->data.data(), permuteTensorInfo.GetNumBytes());
PermutationVector permutationVector(permuteShape.data(), permuteTensorInfo.GetNumElements());
desc = TransposeDescriptor(permutationVector);
}
TensorInfo inputTensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 0);
IConnectableLayer* layer = m_Network->AddTransposeLayer(desc, layerName.c_str());
if (!layer)
{
throw NullPointerException(fmt::format("Layer {} pointer is null {}",
operatorIndex, CHECK_LOCATION().AsString()));
}
TensorInfo outputTensorInfo = OutputTensorInfoFromInputs(subgraphIndex, operatorIndex, layer, 0, {0});
CheckMatchingQuantization(inputTensorInfo, outputTensorInfo, layerName, "Input 0", "Output 0");
layer->GetOutputSlot(0).SetTensorInfo(outputTensorInfo);
auto inputTensorIndexes = AsUnsignedVector(GetInputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterInputSlots(subgraphIndex, operatorIndex, layer, {inputTensorIndexes[0]});
auto outputTensorIndexes = AsUnsignedVector(GetOutputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterOutputSlots(subgraphIndex, operatorIndex, layer, {outputTensorIndexes[0]});
}
void TfLiteParserImpl::ParseTransposeConv(size_t subgraphIndex, size_t operatorIndex)
{
CHECK_MODEL(m_Model, subgraphIndex, operatorIndex);
const auto& operatorPtr = m_Model->subgraphs[subgraphIndex]->operators[operatorIndex];
const auto* options = operatorPtr->builtin_options.AsTransposeConvOptions();
TransposeConvolution2dDescriptor desc;
desc.m_BiasEnabled = false;
desc.m_StrideX = CHECKED_NON_NEGATIVE(options->stride_w);
desc.m_StrideY = CHECKED_NON_NEGATIVE(options->stride_h);
desc.m_DataLayout = armnn::DataLayout::NHWC;
auto inputs = GetInputs(m_Model, subgraphIndex, operatorIndex);
if (inputs.size() == 4)
{
desc.m_BiasEnabled = true;
}
else
{
CHECK_VALID_SIZE(inputs.size(), 3);
}
auto outputs = GetOutputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(outputs.size(), 1);
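// TfLite TRANSPOSE_CONV orders its inputs as: 0 = output shape, 1 = filter (weights), 2 = input, 3 = optional bias.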
armnn::TensorInfo inputTensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 2);
armnn::TensorInfo filterTensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 1);
// TfLite uses NHWC tensors
const unsigned int inputHeight = inputTensorInfo.GetShape()[1];
const unsigned int inputWidth = inputTensorInfo.GetShape()[2];
const unsigned int filterHeight = filterTensorInfo.GetShape()[1];
const unsigned int filterWidth = filterTensorInfo.GetShape()[2];
// This block determines the output shape of the transpose convolution. If the output shape tensor is not null
// and is a constant, we can read the data at load time and set the output shape on the layer. If it is not
// constant, the shape data is not available here, so we skip this block and rely on output shape inference.
if (inputs[0] && IsConstTensor(inputs[0]))
{
armnn::TensorInfo tensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 0);
std::vector<int> output_shape(tensorInfo.GetNumElements());
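// The constant output shape tensor may be stored as Signed32 or as quantized QAsymmU8; read the dimensions accordingly.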
if (tensorInfo.GetDataType() == DataType::Signed32)
{
::memcpy(output_shape.data(), GetBuffer(m_Model, inputs[0]->buffer)->data.data(), tensorInfo.GetNumBytes());
}
if (tensorInfo.GetDataType() == DataType::QAsymmU8)
{
for(unsigned int i=0; i < tensorInfo.GetNumElements(); i++)
{
output_shape[i] = GetBuffer(m_Model, inputs[0]->buffer)->data.data()[i];
}
}
// Change from signed to unsigned int to store in TransposeConvolution2dDescriptor.
for (int dimension : output_shape)
{
desc.m_OutputShape.push_back(static_cast<unsigned int>(dimension));
}
desc.m_OutputShapeEnabled = true;
// TfLite uses NHWC tensors
const unsigned int outputHeight = desc.m_OutputShape[1];
const unsigned int outputWidth = desc.m_OutputShape[2];
CalcPadding(inputHeight,
filterHeight,
desc.m_StrideY,
1, // DilationY
desc.m_PadTop,
desc.m_PadBottom,
options->padding,
outputHeight);
CalcPadding(inputWidth,
filterWidth,
desc.m_StrideX,
1, // DilationX
desc.m_PadLeft,
desc.m_PadRight,
options->padding,
outputWidth);
}
else
{
CalcPadding(inputHeight,
filterHeight,
desc.m_StrideY,
1, // DilationY
desc.m_PadTop,
desc.m_PadBottom,
options->padding);
CalcPadding(inputWidth,
filterWidth,
desc.m_StrideX,
1, // DilationX
desc.m_PadLeft,
desc.m_PadRight,
options->padding);
}
auto filterTensorAndData = CreateConstTensorNonPermuted(inputs[1], filterTensorInfo, inputTensorInfo.GetDataType());
armnn::IConnectableLayer* layer = nullptr;
auto layerName = fmt::format("TransposeConv:{}:{}", subgraphIndex, operatorIndex);
if (desc.m_BiasEnabled)
{
auto biasTensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 3);
auto biasConstTensor = CreateConstTensorNonPermuted(inputs[3], biasTensorInfo, inputTensorInfo.GetDataType());
layer = m_Network->AddTransposeConvolution2dLayer(desc,
filterTensorAndData.first,
biasConstTensor.first,
layerName.c_str());
}
else
{
layer = m_Network->AddTransposeConvolution2dLayer(desc,
filterTensorAndData.first,
EmptyOptional(),
layerName.c_str());
}
if (!layer)
{
throw NullPointerException(fmt::format("Layer {} pointer is null {}",
operatorIndex, CHECK_LOCATION().AsString()));
}
armnn::TensorInfo outputTensorInfo = OutputTensorInfoFromInputs(subgraphIndex, operatorIndex, layer, 0, {2, 1});
layer->GetOutputSlot(0).SetTensorInfo(outputTensorInfo);
// only the tensors for the inputs are relevant, exclude the const (filter) tensor
auto inputTensorIndexes = AsUnsignedVector(GetInputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterInputSlots(subgraphIndex, operatorIndex, layer, {inputTensorIndexes[2]});
auto outputTensorIndexes = AsUnsignedVector(GetOutputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterOutputSlots(subgraphIndex, operatorIndex, layer, {outputTensorIndexes[0]});
}
void TfLiteParserImpl::ParseAveragePool2D(size_t subgraphIndex, size_t operatorIndex)
{
ParsePool(subgraphIndex, operatorIndex, PoolingAlgorithm::Average);
}
void TfLiteParserImpl::ParseBatchMatMul(size_t subgraphIndex, size_t operatorIndex)
{
CHECK_MODEL(m_Model, subgraphIndex, operatorIndex);
auto inputs = GetInputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(inputs.size(), 2);
auto outputs = GetOutputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(outputs.size(), 1);
auto layerName = fmt::format("BatchMatMul:{}:{}", subgraphIndex, operatorIndex);
TensorInfo inputXTensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 0);
TensorInfo inputYTensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 1);
const auto& operatorPtr = m_Model->subgraphs[subgraphIndex]->operators[operatorIndex];
const auto* options = operatorPtr->builtin_options.AsBatchMatMulOptions();
// The adj_x/adj_y (adjoint) flags in TensorFlow Lite request a transpose of the corresponding input.
BatchMatMulDescriptor descriptor(options->adj_x,
options->adj_y,
false,
false);
// Arbitrary DataLayout
IConnectableLayer* layer = m_Network->AddBatchMatMulLayer(descriptor, layerName.c_str());
if (!layer)
{
throw NullPointerException(fmt::format("Layer {} pointer is null {}",
operatorIndex, CHECK_LOCATION().AsString()));
}
TensorInfo outputTensorInfo = OutputTensorInfoFromInputs(subgraphIndex, operatorIndex, layer, 0, {0, 1});
layer->GetOutputSlot(0).SetTensorInfo(outputTensorInfo);
auto inputTensorIndexes = AsUnsignedVector(GetInputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterInputSlots(subgraphIndex, operatorIndex, layer, {inputTensorIndexes[0], inputTensorIndexes[1]});
auto outputTensorIndexes = AsUnsignedVector(GetOutputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterOutputSlots(subgraphIndex, operatorIndex, layer, {outputTensorIndexes[0]});
}
void TfLiteParserImpl::ParseBatchToSpaceND(size_t subgraphIndex, size_t operatorIndex)
{
CHECK_MODEL(m_Model, subgraphIndex, operatorIndex);
auto inputs = GetInputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(inputs.size(), 3);
auto outputs = GetOutputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(outputs.size(), 1);
armnn::TensorInfo blockShapeTensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 1);
BufferRawPtr blockShapeBufferPtr = GetBuffer(m_Model, inputs[1]->buffer);
armnn::TensorInfo cropsTensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 2);
BufferRawPtr cropsBufferPtr = GetBuffer(m_Model, inputs[2]->buffer);
std::vector<unsigned int> blockShape(blockShapeTensorInfo.GetNumElements());
::memcpy(blockShape.data(), blockShapeBufferPtr->data.data(), blockShapeTensorInfo.GetNumBytes());
std::vector<unsigned int> cropsVector(cropsTensorInfo.GetNumElements());
::memcpy(cropsVector.data(), cropsBufferPtr->data.data(), cropsTensorInfo.GetNumBytes());
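// The crops tensor holds a [begin, end] pair for each spatial dimension.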
size_t step = 2;
std::vector<std::pair<unsigned int, unsigned int>> crops;
for (unsigned int i = 0; i < cropsTensorInfo.GetNumElements() / step; ++i)
{
crops.emplace_back(cropsVector[i * step], cropsVector[i * step + 1]);
}
armnn::BatchToSpaceNdDescriptor desc;
desc.m_BlockShape = blockShape;
desc.m_Crops = crops;
desc.m_DataLayout = armnn::DataLayout::NHWC;
auto layerName = fmt::format("BatchToSpaceND:{}:{}", subgraphIndex, operatorIndex);
TensorInfo inputTensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 0);
IConnectableLayer* layer = m_Network->AddBatchToSpaceNdLayer(desc, layerName.c_str());
if (!layer)
{
throw NullPointerException(fmt::format("Layer {} pointer is null {}",
operatorIndex, CHECK_LOCATION().AsString()));
}
TensorInfo outputTensorInfo = OutputTensorInfoFromInputs(subgraphIndex, operatorIndex, layer, 0, {0});
CheckMatchingQuantization(inputTensorInfo, outputTensorInfo, layerName, "Input 0", "Output 0");
layer->GetOutputSlot(0).SetTensorInfo(outputTensorInfo);
auto inputTensorIndexes = AsUnsignedVector(GetInputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterInputSlots(subgraphIndex, operatorIndex, layer, {inputTensorIndexes[0]});
auto outputTensorIndexes = AsUnsignedVector(GetOutputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterOutputSlots(subgraphIndex, operatorIndex, layer, {outputTensorIndexes[0]});
}
void TfLiteParserImpl::ParseBroadcastTo(size_t subgraphIndex, size_t operatorIndex)
{
CHECK_MODEL(m_Model, subgraphIndex, operatorIndex);
auto inputs = GetInputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(inputs.size(), 2);
auto outputs = GetOutputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(outputs.size(), 1);
TensorInfo inputTensorInfo = ToTensorInfo(inputs[0]);
TensorInfo shapeTensorInfo = ToTensorInfo(inputs[1]);
TensorInfo outputTensorInfo = ToTensorInfo(outputs[0]);
auto layerName = fmt::format("Broadcast_to:{}:{}", subgraphIndex, operatorIndex);
BroadcastToDescriptor descriptor;
auto shapeBufferPtr = GetBuffer(m_Model, inputs[1]->buffer);
if (shapeBufferPtr != nullptr)
{
std::vector<unsigned int> targetShape;
unsigned int numElement = shapeTensorInfo.GetNumElements();
auto shapeData = reinterpret_cast<const int32_t*>(shapeBufferPtr->data.data());
if (shapeData)
{
for (unsigned int i = 0; i < numElement; ++i)
{
targetShape.push_back(armnn::numeric_cast<unsigned int>(shapeData[i]));
}
descriptor.m_BroadcastToShape = TensorShape(numElement, targetShape.data());
}
// If the shape data is missing, fall back to the output tensor shape.
else
{
if(outputTensorInfo.GetShape().GetNumElements() <= 1)
{
ARMNN_THROW_PARSE_EXCEPTION("For Broadcast_to layer, "
"data and output shape are not found in the buffer.");
}
descriptor.m_BroadcastToShape = outputTensorInfo.GetShape();
}
}
else
{
ARMNN_THROW_PARSE_EXCEPTION("For Broadcast_to layer, Shape data was not found in the buffer.");
}
IConnectableLayer* layer = m_Network->AddBroadcastToLayer(descriptor, layerName.c_str());
if (!layer)
{
throw NullPointerException(fmt::format("Layer {} pointer is null {}",
operatorIndex, CHECK_LOCATION().AsString()));
}
layer->GetOutputSlot(0).SetTensorInfo(outputTensorInfo);
auto inputTensorIndexes = AsUnsignedVector(GetInputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterInputSlots(subgraphIndex, operatorIndex, layer, {inputTensorIndexes[0]});
auto outputTensorIndexes = AsUnsignedVector(GetOutputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterOutputSlots(subgraphIndex, operatorIndex, layer, {outputTensorIndexes[0]});
}
void TfLiteParserImpl::ParseL2Normalization(size_t subgraphIndex, size_t operatorIndex)
{
CHECK_MODEL(m_Model, subgraphIndex, operatorIndex);
auto inputs = GetInputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(inputs.size(), 1);
auto outputs = GetOutputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(outputs.size(), 1);
L2NormalizationDescriptor desc;
desc.m_DataLayout = armnn::DataLayout::NHWC;
auto layerName = fmt::format("L2Normalization:{}:{}", subgraphIndex, operatorIndex);
IConnectableLayer* layer = m_Network->AddL2NormalizationLayer(desc, layerName.c_str());
if (!layer)
{
throw NullPointerException(fmt::format("Layer {} pointer is null {}",
operatorIndex, CHECK_LOCATION().AsString()));
}
armnn::TensorInfo outputTensorInfo = OutputTensorInfoFromInputs(subgraphIndex, operatorIndex, layer, 0, {0});
layer->GetOutputSlot(0).SetTensorInfo(outputTensorInfo);
auto inputTensorIndexes = AsUnsignedVector(GetInputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterInputSlots(subgraphIndex, operatorIndex, layer, {inputTensorIndexes[0]});
auto outputTensorIndexes = AsUnsignedVector(GetOutputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterOutputSlots(subgraphIndex, operatorIndex, layer, {outputTensorIndexes[0]});
}
void TfLiteParserImpl::ParseMaxPool2D(size_t subgraphIndex, size_t operatorIndex)
{
ParsePool(subgraphIndex, operatorIndex, PoolingAlgorithm::Max);
}
void TfLiteParserImpl::ParseMaximum(size_t subgraphIndex, size_t operatorIndex)
{
CHECK_MODEL(m_Model, subgraphIndex, operatorIndex);
auto inputs = GetInputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(inputs.size(), 2);
auto outputs = GetOutputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(outputs.size(), 1);
auto layerName = fmt::format("Maximum:{}:{}", subgraphIndex, operatorIndex);
TensorInfo inputTensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 0);
TensorInfo input1TensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 1);
CheckMatchingQuantization(inputTensorInfo, input1TensorInfo, layerName, "Input 0", "Input 1");
IConnectableLayer* layer = m_Network->AddElementwiseBinaryLayer(BinaryOperation::Maximum, layerName.c_str());
if (!layer)
{
throw NullPointerException(fmt::format("Layer {} pointer is null {}",
operatorIndex, CHECK_LOCATION().AsString()));
}
TensorInfo outputTensorInfo = OutputTensorInfoFromInputs(subgraphIndex, operatorIndex, layer, 0, {0, 1});
CheckMatchingQuantization(inputTensorInfo, outputTensorInfo, layerName, "Input 0", "Output 0");
layer->GetOutputSlot(0).SetTensorInfo(outputTensorInfo);
auto inputTensorIndexes = AsUnsignedVector(GetInputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterInputSlots(subgraphIndex, operatorIndex, layer, {inputTensorIndexes[0], inputTensorIndexes[1]});
auto outputTensorIndexes = AsUnsignedVector(GetOutputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterOutputSlots(subgraphIndex, operatorIndex, layer, {outputTensorIndexes[0]});
}
void TfLiteParserImpl::ParseMinimum(size_t subgraphIndex, size_t operatorIndex)
{
CHECK_MODEL(m_Model, subgraphIndex, operatorIndex);
auto inputs = GetInputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(inputs.size(), 2);
auto outputs = GetOutputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(outputs.size(), 1);
auto layerName = fmt::format("Minimum:{}:{}", subgraphIndex, operatorIndex);
TensorInfo inputTensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 0);
TensorInfo input1TensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 1);
CheckMatchingQuantization(inputTensorInfo, input1TensorInfo, layerName, "Input 0", "Input 1");
IConnectableLayer* layer = m_Network->AddElementwiseBinaryLayer(BinaryOperation::Minimum, layerName.c_str());
if (!layer)
{
throw NullPointerException(fmt::format("Layer {} pointer is null {}",
operatorIndex, CHECK_LOCATION().AsString()));
}
TensorInfo outputTensorInfo = OutputTensorInfoFromInputs(subgraphIndex, operatorIndex, layer, 0, {0, 1});
CheckMatchingQuantization(inputTensorInfo, outputTensorInfo, layerName, "Input 0", "Output 0");
layer->GetOutputSlot(0).SetTensorInfo(outputTensorInfo);
auto inputTensorIndexes = AsUnsignedVector(GetInputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterInputSlots(subgraphIndex, operatorIndex, layer, {inputTensorIndexes[0], inputTensorIndexes[1]});
auto outputTensorIndexes = AsUnsignedVector(GetOutputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterOutputSlots(subgraphIndex, operatorIndex, layer, {outputTensorIndexes[0]});
}
void TfLiteParserImpl::ParsePool(size_t subgraphIndex,
size_t operatorIndex,
PoolingAlgorithm algorithm)
{
CHECK_MODEL(m_Model, subgraphIndex, operatorIndex);
const auto& operatorPtr = m_Model->subgraphs[subgraphIndex]->operators[operatorIndex];
const auto* options = operatorPtr->builtin_options.AsPool2DOptions();
CHECK_SUPPORTED_FUSED_ACTIVATION(options, subgraphIndex, operatorIndex);
std::string layerName;
switch (algorithm)
{
case PoolingAlgorithm::Average:
layerName =
fmt::format("AveragePool2D:{}:{}", subgraphIndex, operatorIndex);
break;
case PoolingAlgorithm::Max:
layerName =
fmt::format("MaxPool2D:{}:{}", subgraphIndex, operatorIndex);
break;
default:
throw ParseException(fmt::format("Unsupported Pooling Algorithm {}", CHECK_LOCATION().AsString()));
}
Pooling2dDescriptor desc;
desc.m_PoolType = algorithm;
desc.m_StrideX = CHECKED_NON_NEGATIVE(options->stride_w);
desc.m_StrideY = CHECKED_NON_NEGATIVE(options->stride_h);
desc.m_PoolWidth = CHECKED_NON_NEGATIVE(options->filter_width);
desc.m_PoolHeight = CHECKED_NON_NEGATIVE(options->filter_height);
desc.m_PaddingMethod = PaddingMethod::Exclude;
desc.m_OutputShapeRounding = OutputShapeRounding::Floor;
desc.m_DataLayout = armnn::DataLayout::NHWC;
auto inputs = GetInputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(inputs.size(), 1);
armnn::TensorInfo inputTensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 0);
// assuming input is NHWC
unsigned int inputHeight = inputTensorInfo.GetShape()[1];
unsigned int inputWidth = inputTensorInfo.GetShape()[2];
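// Derive the explicit padding values from the TfLite SAME/VALID padding option.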
CalcPadding(inputHeight, desc.m_PoolHeight, desc.m_StrideY, 1u,
desc.m_PadTop, desc.m_PadBottom, options->padding);
CalcPadding(inputWidth, desc.m_PoolWidth, desc.m_StrideX, 1u,
desc.m_PadLeft, desc.m_PadRight, options->padding);
auto outputs = GetOutputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(outputs.size(), 1);
IConnectableLayer* layer = m_Network->AddPooling2dLayer(desc, layerName.c_str());
if (!layer)
{
throw NullPointerException(fmt::format("Layer {} pointer is null {}",
operatorIndex, CHECK_LOCATION().AsString()));
}
armnn::TensorInfo outputTensorInfo = OutputTensorInfoFromInputs(subgraphIndex, operatorIndex, layer, 0, {0});
CheckMatchingQuantization(inputTensorInfo, outputTensorInfo, layerName, "Input 0", "Output 0");
layer->GetOutputSlot(0).SetTensorInfo(outputTensorInfo);
// register the input connection slots for the layer, connections are made after all layers have been created
// only the tensors for the inputs are relevant, exclude the const tensors
auto inputTensorIndexes = AsUnsignedVector(GetInputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterInputSlots(subgraphIndex, operatorIndex, layer, {inputTensorIndexes[0]});
layer = AddFusedActivationLayer(layer, 0, options->fused_activation_function);
// register the output connection slots for the layer, connections are made after all layers have been created
auto outputTensorIndexes = AsUnsignedVector(GetOutputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterOutputSlots(subgraphIndex, operatorIndex, layer, {outputTensorIndexes[0]});
}
void TfLiteParserImpl::ParseSlice(size_t subgraphIndex, size_t operatorIndex)
{
CHECK_MODEL(m_Model, subgraphIndex, operatorIndex);
auto inputs = GetInputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(inputs.size(), 3);
auto outputs = GetOutputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(outputs.size(), 1);
SliceDescriptor desc;
// set begin tensor info for slice descriptor
armnn::TensorInfo beginTensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 1);
BufferRawPtr beginBufferPtr = GetBuffer(m_Model, inputs[1]->buffer);
std::vector<unsigned int> begin(beginTensorInfo.GetNumElements());
::memcpy(begin.data(), beginBufferPtr->data.data(), beginTensorInfo.GetNumBytes());
// set size tensor info for slice descriptor
armnn::TensorInfo sizeTensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 2);
BufferRawPtr sizeBufferPtr = GetBuffer(m_Model, inputs[2]->buffer);
std::vector<int> signedSize(sizeTensorInfo.GetNumElements(), 1);
// if size buffer data is not specified, all contents of size vector remain as values of 1
if (sizeBufferPtr->data.data())
{
::memcpy(signedSize.data(), sizeBufferPtr->data.data(), sizeTensorInfo.GetNumBytes());
}
std::vector<unsigned int> size(sizeTensorInfo.GetNumElements());
TensorInfo inputTensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 0);
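// Convert each signed size: -1 means take everything from 'begin' to the end of that dimension.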
for (unsigned int i = 0; i < signedSize.size(); ++i)
{
int signedValue = signedSize[i];
if (signedValue < -1 || signedValue > static_cast<int>(inputTensorInfo.GetShape()[i] - begin[i]))
{
throw ParseException(fmt::format("Invalid value for size {} size must be in range "
"[-1, inputDimSize - begin] [-1, {}] inclusive {}",
signedValue,
inputTensorInfo.GetShape()[i] - begin[i],
CHECK_LOCATION().AsString()));
}
if (signedValue == -1)
{
size[i] = inputTensorInfo.GetShape()[i] - begin[i];
}
else
{
size[i] = static_cast<unsigned int>(signedValue);
}
}
desc = SliceDescriptor(begin, size);
auto layerName = fmt::format("Slice:{}:{}", subgraphIndex, operatorIndex);
IConnectableLayer* const layer = m_Network->AddSliceLayer(desc, layerName.c_str());
TensorInfo outputTensorInfo = OutputTensorInfoFromInputs(subgraphIndex, operatorIndex, layer, 0, {0});
CheckMatchingQuantization(inputTensorInfo, outputTensorInfo, layerName, "Input 0", "Output 0");
layer->GetOutputSlot(0).SetTensorInfo(outputTensorInfo);
// register the input connection slots for the layer, connections are made after all layers have been created
// only the tensors for the inputs are relevant, exclude the const tensors
auto inputTensorIndexes = AsUnsignedVector(GetInputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterInputSlots(subgraphIndex, operatorIndex, layer, {inputTensorIndexes[0]});
// register the output connection slots for the layer, connections are made after all layers have been created
auto outputTensorIndexes = AsUnsignedVector(GetOutputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterOutputSlots(subgraphIndex, operatorIndex, layer, {outputTensorIndexes[0]});
}
void TfLiteParserImpl::ParseSoftmax(size_t subgraphIndex, size_t operatorIndex)
{
CHECK_MODEL(m_Model, subgraphIndex, operatorIndex);
const auto& operatorPtr = m_Model->subgraphs[subgraphIndex]->operators[operatorIndex];
const auto* options = operatorPtr->builtin_options.AsSoftmaxOptions();
SoftmaxDescriptor desc;
desc.m_Beta = options->beta;
auto inputs = GetInputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(inputs.size(), 1);
auto outputs = GetOutputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(outputs.size(), 1);
auto layerName = fmt::format("Softmax:{}:{}", subgraphIndex, operatorIndex);
IConnectableLayer* const layer = m_Network->AddSoftmaxLayer(desc, layerName.c_str());
armnn::TensorInfo outputTensorInfo = OutputTensorInfoFromInputs(subgraphIndex, operatorIndex, layer, 0, {0});
layer->GetOutputSlot(0).SetTensorInfo(outputTensorInfo);
// register the input connection slots for the layer, connections are made after all layers have been created
// only the tensors for the inputs are relevant, exclude the const tensors
auto inputTensorIndexes = AsUnsignedVector(GetInputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterInputSlots(subgraphIndex, operatorIndex, layer, {inputTensorIndexes[0]});
// register the output connection slots for the layer, connections are made after all layers have been created
auto outputTensorIndexes = AsUnsignedVector(GetOutputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterOutputSlots(subgraphIndex, operatorIndex, layer, {outputTensorIndexes[0]});
}
void TfLiteParserImpl::ParseLogSoftmax(size_t subgraphIndex, size_t operatorIndex)
{
CHECK_MODEL(m_Model, subgraphIndex, operatorIndex);
LogSoftmaxDescriptor desc;
auto inputs = GetInputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(inputs.size(), 1);
auto outputs = GetOutputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(outputs.size(), 1);
auto layerName = fmt::format("LogSoftmax:{}:{}", subgraphIndex, operatorIndex);
IConnectableLayer* const layer = m_Network->AddLogSoftmaxLayer(desc, layerName.c_str());
armnn::TensorInfo outputTensorInfo = OutputTensorInfoFromInputs(subgraphIndex, operatorIndex, layer, 0, {0});
layer->GetOutputSlot(0).SetTensorInfo(outputTensorInfo);
// register the input connection slots for the layer, connections are made after all layers have been created
// only the tensors for the inputs are relevant, exclude the const tensors
auto inputTensorIndexes = AsUnsignedVector(GetInputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterInputSlots(subgraphIndex, operatorIndex, layer, {inputTensorIndexes[0]});
// register the output connection slots for the layer, connections are made after all layers have been created
auto outputTensorIndexes = AsUnsignedVector(GetOutputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterOutputSlots(subgraphIndex, operatorIndex, layer, {outputTensorIndexes[0]});
}
void TfLiteParserImpl::ParseScatterNd(size_t subgraphIndex, size_t operatorIndex)
{
CHECK_MODEL(m_Model, subgraphIndex, operatorIndex);
TfLiteParserImpl::TensorRawPtrVector inputs = GetInputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(inputs.size(), 3);
TfLiteParserImpl::TensorRawPtrVector outputs = GetOutputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(outputs.size(), 1);
armnn::TensorInfo indicesTensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 0);
armnn::TensorInfo updatesTensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 1);
armnn::TensorInfo shapeTensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 2);
armnn::TensorInfo outputTensorInfo = ToTensorInfo(outputs[0]);
// TfLite currently only supports the Update function and does not provide an input tensor, just a shape.
armnn::ScatterNdDescriptor descriptor(armnn::ScatterNdFunction::Update, false);
const auto& operatorPtr = m_Model->subgraphs[subgraphIndex]->operators[operatorIndex];
const auto* options = operatorPtr->builtin_options.AsScatterNdOptions();
IgnoreUnused(options);
auto layerName = fmt::format("ScatterND:{}:{}", subgraphIndex, operatorIndex);
IConnectableLayer* layer = m_Network->AddScatterNdLayer(descriptor, layerName.c_str());
if (!layer)
{
throw NullPointerException(fmt::format("Layer {} pointer is null {}",
operatorIndex, CHECK_LOCATION().AsString()));
}
outputTensorInfo = OutputTensorInfoFromInputs(subgraphIndex, operatorIndex, layer, 0, {0, 1, 2});
layer->GetOutputSlot(0).SetTensorInfo(outputTensorInfo);
auto inputTensorIndexes = AsUnsignedVector(GetInputTensorIds(m_Model, subgraphIndex, operatorIndex));
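// Register the inputs in the order the Arm NN layer expects: shape first, then indices and updates
// (TfLite supplies indices, updates, shape).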
RegisterInputSlots(subgraphIndex,
operatorIndex,
layer,
{inputTensorIndexes[2], inputTensorIndexes[0], inputTensorIndexes[1]});
auto outputTensorIndexes = AsUnsignedVector(GetOutputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterOutputSlots(subgraphIndex, operatorIndex, layer, {outputTensorIndexes[0]});
}
void TfLiteParserImpl::ParseSpaceToBatchND(size_t subgraphIndex, size_t operatorIndex)
{
CHECK_MODEL(m_Model, subgraphIndex, operatorIndex);
auto inputs = GetInputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(inputs.size(), 3);
auto outputs = GetOutputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(outputs.size(), 1);
armnn::TensorInfo blockShapeTensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 1);
BufferRawPtr blockShapeBufferPtr = GetBuffer(m_Model, inputs[1]->buffer);
armnn::TensorInfo padListTensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 2);
BufferRawPtr padListBufferPtr = GetBuffer(m_Model, inputs[2]->buffer);
std::vector<unsigned int> blockShape(blockShapeTensorInfo.GetNumElements());
::memcpy(blockShape.data(), blockShapeBufferPtr->data.data(), blockShapeTensorInfo.GetNumBytes());
std::vector<unsigned int> padListVector(padListTensorInfo.GetNumElements());
::memcpy(padListVector.data(), padListBufferPtr->data.data(), padListTensorInfo.GetNumBytes());
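// The pad list tensor holds a [before, after] pair for each spatial dimension.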
size_t step = 2;
std::vector<std::pair<unsigned int, unsigned int>> padList;
for (unsigned int i = 0; i < padListTensorInfo.GetNumElements() / step; ++i)
{
padList.emplace_back(padListVector[i * step], padListVector[i * step + 1]);
}
armnn::SpaceToBatchNdDescriptor desc;
desc.m_BlockShape = blockShape;
desc.m_PadList = padList;
desc.m_DataLayout = armnn::DataLayout::NHWC;
auto layerName = fmt::format("SpaceToBatchND:{}:{}", subgraphIndex, operatorIndex);
TensorInfo inputTensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 0);
IConnectableLayer* layer = m_Network->AddSpaceToBatchNdLayer(desc, layerName.c_str());
if (!layer)
{
throw NullPointerException(fmt::format("Layer {} pointer is null {}",
operatorIndex, CHECK_LOCATION().AsString()));
}
TensorInfo outputTensorInfo = OutputTensorInfoFromInputs(subgraphIndex, operatorIndex, layer, 0, {0});
CheckMatchingQuantization(inputTensorInfo, outputTensorInfo, layerName, "Input 0", "Output 0");
layer->GetOutputSlot(0).SetTensorInfo(outputTensorInfo);
auto inputTensorIndexes = AsUnsignedVector(GetInputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterInputSlots(subgraphIndex, operatorIndex, layer, {inputTensorIndexes[0]});
auto outputTensorIndexes = AsUnsignedVector(GetOutputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterOutputSlots(subgraphIndex, operatorIndex, layer, {outputTensorIndexes[0]});
}
void TfLiteParserImpl::ParseSpaceToDepth(size_t subgraphIndex, size_t operatorIndex)
{
CHECK_MODEL(m_Model, subgraphIndex, operatorIndex);
TfLiteParserImpl::TensorRawPtrVector inputs = GetInputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(inputs.size(), 1);
TfLiteParserImpl::TensorRawPtrVector outputs = GetOutputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(outputs.size(), 1);
armnn::SpaceToDepthDescriptor descriptor;
const auto& operatorPtr = m_Model->subgraphs[subgraphIndex]->operators[operatorIndex];
const auto* options = operatorPtr->builtin_options.AsSpaceToDepthOptions();
auto blockSize = options->block_size;
if (blockSize < 2)
{
throw ParseException(
fmt::format("Operation has invalid block size: {} Block size should be >= 2 {}",
blockSize,
CHECK_LOCATION().AsString()));
}
descriptor.m_BlockSize = armnn::numeric_cast<uint32_t>(blockSize);
auto layerName = fmt::format("SpaceToDepth:{}:{}", subgraphIndex, operatorIndex);
IConnectableLayer* layer = m_Network->AddSpaceToDepthLayer(descriptor, layerName.c_str());
if (!layer)
{
throw NullPointerException(fmt::format("Layer {} pointer is null {}",
operatorIndex, CHECK_LOCATION().AsString()));
}
TensorInfo outputTensorInfo = OutputTensorInfoFromInputs(subgraphIndex, operatorIndex, layer, 0, {0});
layer->GetOutputSlot(0).SetTensorInfo(outputTensorInfo);
auto inputTensorIndexes = AsUnsignedVector(GetInputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterInputSlots(subgraphIndex, operatorIndex, layer, {inputTensorIndexes[0]});
auto outputTensorIndexes = AsUnsignedVector(GetOutputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterOutputSlots(subgraphIndex, operatorIndex, layer, {outputTensorIndexes[0]});
}
armnn::TensorInfo TfLiteParserImpl::OutputShapeOfSqueeze(std::vector<uint32_t> squeezeDims,
const armnn::TensorInfo& inputTensorInfo)
{
CHECK_VALID_SIZE(squeezeDims.size(), 0, 1, 2, 3, 4);
static const uint32_t dimensionSequence[] = { 0, 1, 2, 3 };
if (inputTensorInfo.GetNumDimensions() > 4)
{
std::stringstream ss;
ss << "Input tensor has unexpected number of dimensions:" << inputTensorInfo.GetNumDimensions()
<< " shape:" << inputTensorInfo.GetShape() << " "
<< CHECK_LOCATION().AsString();
throw ParseException(ss.str());
}
if (squeezeDims.empty())
{
squeezeDims.assign(dimensionSequence,
dimensionSequence+inputTensorInfo.GetNumDimensions());
}
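// Keep every dimension that is not listed in squeezeDims, and drop listed dimensions only when their size is 1.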
std::vector<uint32_t> outputDims;
for(unsigned int i = 0; i < inputTensorInfo.GetNumDimensions(); i++)
{
bool skipSqueeze = (std::find(squeezeDims.begin(), squeezeDims.end(), i) == squeezeDims.end());
auto currentDimension = inputTensorInfo.GetShape()[i];
if (skipSqueeze || currentDimension != 1)
{
outputDims.push_back(currentDimension);
}
}
if (outputDims.size() > 4)
{
std::stringstream ss;
ss << "Output tensor has unexpected number of dimensions:" << inputTensorInfo.GetNumDimensions()
<< " shape:" << inputTensorInfo.GetShape() << " "
<< CHECK_LOCATION().AsString();
throw ParseException(ss.str());
}
TensorShape outShape = TensorShape(static_cast<unsigned int>(outputDims.size()),
outputDims.data());
// we need to preserve the tensor type and the quantization data as well
TensorInfo outTensorInfo = inputTensorInfo;
outTensorInfo.SetShape(outShape);
return outTensorInfo;
}
void TfLiteParserImpl::ParseShape(size_t subgraphIndex, size_t operatorIndex)
{
CHECK_MODEL(m_Model, subgraphIndex, operatorIndex);
auto inputs = GetInputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(inputs.size(), 1);
auto outputs = GetOutputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(outputs.size(), 1);
auto layerName = fmt::format("Shape:{}:{}", subgraphIndex, operatorIndex);
IConnectableLayer* layer = m_Network->AddShapeLayer(layerName.c_str());
if (!layer)
{
throw NullPointerException(fmt::format("Layer {} pointer is null {}",
operatorIndex, CHECK_LOCATION().AsString()));
}
TensorInfo outputTensorInfo = OutputTensorInfoFromInputs(subgraphIndex, operatorIndex, layer, 0, {0});
layer->GetOutputSlot(0).SetTensorInfo(outputTensorInfo);
// Check if output tensor type is Signed32 or Signed64
if (outputTensorInfo.GetDataType() != armnn::DataType::Signed32 &&
outputTensorInfo.GetDataType() != armnn::DataType::Signed64)
{
throw ParseException(
fmt::format(
"Output tensor data type is not supported. (Supported types: Signed32 & Signed64) {}",
CHECK_LOCATION().AsString()));
}
auto inputTensorIndexes = AsUnsignedVector(GetInputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterInputSlots(subgraphIndex, operatorIndex, layer, {inputTensorIndexes[0]});
auto outputTensorIndexes = AsUnsignedVector(GetOutputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterOutputSlots(subgraphIndex, operatorIndex, layer, outputTensorIndexes);
}
void TfLiteParserImpl::ParseSqueeze(size_t subgraphIndex, size_t operatorIndex)
{
CHECK_MODEL(m_Model, subgraphIndex, operatorIndex);
auto inputs = GetInputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(inputs.size(), 1);
auto outputs = GetOutputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(outputs.size(), 1);
const auto & operatorPtr = m_Model->subgraphs[subgraphIndex]->operators[operatorIndex];
const auto * options = operatorPtr->builtin_options.AsSqueezeOptions();
auto layerName = fmt::format("Squeeze:{}:{}", subgraphIndex, operatorIndex);
armnn::TensorInfo inputTensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 0);
std::vector<uint32_t> squeezeDim;
// A single negative dim index is interpreted as in Python:
// the effective index is the input rank plus the negative value.
if (options->squeeze_dims.size() == 1 && options->squeeze_dims[0] < 0)
{
int32_t dim = static_cast<int32_t>(inputTensorInfo.GetShape().GetNumDimensions()) + options->squeeze_dims[0];
squeezeDim.push_back(static_cast<uint32_t>(dim));
}
else
{
squeezeDim = AsUnsignedVector(options->squeeze_dims);
}
armnn::TensorInfo outputTensorInfo = TfLiteParserImpl::OutputShapeOfSqueeze(squeezeDim, inputTensorInfo);
CheckMatchingQuantization(inputTensorInfo, outputTensorInfo, layerName, "Input 0", "Output 0");
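// Squeeze is implemented as a Reshape to the squeezed output shape.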
ReshapeDescriptor reshapeDesc;
reshapeDesc.m_TargetShape = outputTensorInfo.GetShape();
auto outputTensorIds = GetOutputTensorIds(m_Model, subgraphIndex, operatorIndex);
m_TensorInfos[outputTensorIds[0]] = outputTensorInfo;
IConnectableLayer* layer = m_Network->AddReshapeLayer(reshapeDesc, layerName.c_str());
if (!layer)
{
throw NullPointerException(fmt::format("Layer {} pointer is null {}",
operatorIndex, CHECK_LOCATION().AsString()));
}
layer->GetOutputSlot(0).SetTensorInfo(outputTensorInfo);
auto inputTensorIndexes = AsUnsignedVector(GetInputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterInputSlots(subgraphIndex, operatorIndex, layer, {inputTensorIndexes[0]});
auto outputTensorIndexes = AsUnsignedVector(GetOutputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterOutputSlots(subgraphIndex, operatorIndex, layer, {outputTensorIndexes[0]});
}
void TfLiteParserImpl::ParseStridedSlice(size_t subgraphIndex, size_t operatorIndex)
{
CHECK_MODEL(m_Model, subgraphIndex, operatorIndex);
auto inputs = GetInputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(inputs.size(), 4);
auto outputs = GetOutputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(outputs.size(), 1);
const auto& operatorPtr = m_Model->subgraphs[subgraphIndex]->operators[operatorIndex];
const auto* options = operatorPtr->builtin_options.AsStridedSliceOptions();
StridedSliceDescriptor desc;
desc.m_BeginMask = options->begin_mask;
desc.m_EllipsisMask = options->ellipsis_mask;
desc.m_EndMask = options->end_mask;
desc.m_NewAxisMask = options->new_axis_mask;
desc.m_ShrinkAxisMask = options->shrink_axis_mask;
desc.m_DataLayout = armnn::DataLayout::NHWC;
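// The begin, end and stride inputs must be constant tensors; each is read from its flatbuffer buffer.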
armnn::TensorInfo beginTensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 1);
BufferRawPtr beginBufferPtr = GetBuffer(m_Model, inputs[1]->buffer);
std::vector<int> begin(beginTensorInfo.GetNumElements());
if (beginBufferPtr->data.data() != nullptr)
{
::memcpy(begin.data(), beginBufferPtr->data.data(), beginTensorInfo.GetNumBytes());
}
else
{
throw ParseException("ParseStridedSlice: Invalid input - the begin vector is null");
}
armnn::TensorInfo endTensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 2);
BufferRawPtr endBufferPtr = GetBuffer(m_Model, inputs[2]->buffer);
std::vector<int> end(endTensorInfo.GetNumElements());
if (endBufferPtr->data.data() != nullptr)
{
::memcpy(end.data(), endBufferPtr->data.data(), endTensorInfo.GetNumBytes());
}
else
{
throw ParseException("ParseStridedSlice: Invalid input - the end vector is null");
}
armnn::TensorInfo strideTensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 3);
BufferRawPtr strideBufferPtr = GetBuffer(m_Model, inputs[3]->buffer);
std::vector<int> stride(strideTensorInfo.GetNumElements());
if (strideBufferPtr->data.data() != nullptr)
{
::memcpy(stride.data(), strideBufferPtr->data.data(), strideTensorInfo.GetNumBytes());
}
else
{
throw ParseException("ParseStridedSlice: Invalid input - the stride vector is null");
}
desc.m_Begin = begin;
desc.m_End = end;
desc.m_Stride = stride;
auto layerName = fmt::format("StridedSlice:{}:{}", subgraphIndex, operatorIndex);
IConnectableLayer* layer = m_Network->AddStridedSliceLayer(desc, layerName.c_str());
if (!layer)
{
throw NullPointerException(fmt::format("Layer {} pointer is null {}",
operatorIndex, CHECK_LOCATION().AsString()));
}
armnn::TensorInfo outputTensorInfo = OutputTensorInfoFromInputs(subgraphIndex, operatorIndex, layer, 0, {0});
layer->GetOutputSlot(0).SetTensorInfo(outputTensorInfo);
auto inputTensorIndexes = AsUnsignedVector(GetInputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterInputSlots(subgraphIndex, operatorIndex, layer, {inputTensorIndexes[0]});
auto outputTensorIndexes = AsUnsignedVector(GetOutputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterOutputSlots(subgraphIndex, operatorIndex, layer, {outputTensorIndexes[0]});
}
void TfLiteParserImpl::ParseSub(size_t subgraphIndex, size_t operatorIndex)
{
CHECK_MODEL(m_Model, subgraphIndex, operatorIndex);
const auto& operatorPtr = m_Model->subgraphs[subgraphIndex]->operators[operatorIndex];
const auto* options = operatorPtr->builtin_options.AsSubOptions();
auto inputs = GetInputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(inputs.size(), 2);
auto outputs = GetOutputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(outputs.size(), 1);
armnn::TensorInfo inputTensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 0);
armnn::TensorInfo input1TensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 1);
auto layerName = fmt::format("Sub:{}:{}", subgraphIndex, operatorIndex);
IConnectableLayer* layer = m_Network->AddElementwiseBinaryLayer(BinaryOperation::Sub, layerName.c_str());
if (!layer)
{
throw NullPointerException(fmt::format("Layer {} pointer is null {}",
operatorIndex, CHECK_LOCATION().AsString()));
}
TensorInfo outputTensorInfo = OutputTensorInfoFromInputs(subgraphIndex, operatorIndex, layer, 0, {0, 1});
layer->GetOutputSlot(0).SetTensorInfo(outputTensorInfo);
auto inputTensorIndexes = AsUnsignedVector(GetInputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterInputSlots(subgraphIndex, operatorIndex, layer, {inputTensorIndexes[0], inputTensorIndexes[1]});
if (options)
{
layer = AddFusedActivationLayer(layer, 0, options->fused_activation_function);
}
auto outputTensorIndexes = AsUnsignedVector(GetOutputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterOutputSlots(subgraphIndex, operatorIndex, layer, {outputTensorIndexes[0]});
}
void TfLiteParserImpl::ParseDiv(size_t subgraphIndex, size_t operatorIndex)
{
CHECK_MODEL(m_Model, subgraphIndex, operatorIndex);
const auto& operatorPtr = m_Model->subgraphs[subgraphIndex]->operators[operatorIndex];
const auto* options = operatorPtr->builtin_options.AsDivOptions();
auto inputs = GetInputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(inputs.size(), 2);
auto outputs = GetOutputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(outputs.size(), 1);
armnn::TensorInfo inputTensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 0);
armnn::TensorInfo input1TensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 1);
auto layerName = fmt::format("Div:{}:{}", subgraphIndex, operatorIndex);
IConnectableLayer* layer = m_Network->AddElementwiseBinaryLayer(BinaryOperation::Div, layerName.c_str());
if (!layer)
{
throw NullPointerException(fmt::format("Layer {} pointer is null {}",
operatorIndex, CHECK_LOCATION().AsString()));
}
TensorInfo outputTensorInfo = OutputTensorInfoFromInputs(subgraphIndex, operatorIndex, layer, 0, {0, 1});
layer->GetOutputSlot(0).SetTensorInfo(outputTensorInfo);
auto inputTensorIndexes = AsUnsignedVector(GetInputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterInputSlots(subgraphIndex, operatorIndex, layer, {inputTensorIndexes[0], inputTensorIndexes[1]});
if (options)
{
layer = AddFusedActivationLayer(layer, 0, options->fused_activation_function);
}
auto outputTensorIndexes = AsUnsignedVector(GetOutputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterOutputSlots(subgraphIndex, operatorIndex, layer, {outputTensorIndexes[0]});
}
void TfLiteParserImpl::ParseFloorDiv(size_t subgraphIndex, size_t operatorIndex)
{
CHECK_MODEL(m_Model, subgraphIndex, operatorIndex);
auto inputs = GetInputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(inputs.size(), 2);
auto outputs = GetOutputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(outputs.size(), 1);
armnn::TensorInfo inputTensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 0);
armnn::TensorInfo input1TensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 1);
auto layerName = fmt::format("Div:{}:{}", subgraphIndex, operatorIndex);
IConnectableLayer* layer = m_Network->AddElementwiseBinaryLayer(BinaryOperation::Div, layerName.c_str());
if (!layer)
{
throw NullPointerException(fmt::format("Layer {} pointer is null {}",
operatorIndex, CHECK_LOCATION().AsString()));
}
TensorInfo outputTensorInfo = OutputTensorInfoFromInputs(subgraphIndex, operatorIndex, layer, 0, {0, 1});
layer->GetOutputSlot(0).SetTensorInfo(outputTensorInfo);
auto inputTensorIndexes = AsUnsignedVector(GetInputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterInputSlots(subgraphIndex, operatorIndex, layer, {inputTensorIndexes[0], inputTensorIndexes[1]});
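// FLOOR_DIV is lowered to an elementwise Div followed by a fused Floor layer.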
layer = AddFusedFloorLayer(layer, 0);
auto outputTensorIndexes = AsUnsignedVector(GetOutputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterOutputSlots(subgraphIndex, operatorIndex, layer, {outputTensorIndexes[0]});
}
void TfLiteParserImpl::ParseAdd(size_t subgraphIndex, size_t operatorIndex)
{
CHECK_MODEL(m_Model, subgraphIndex, operatorIndex);
const auto& operatorPtr = m_Model->subgraphs[subgraphIndex]->operators[operatorIndex];
const auto* options = operatorPtr->builtin_options.AsAddOptions();
auto inputs = GetInputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(inputs.size(), 2);
auto outputs = GetOutputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(outputs.size(), 1);
armnn::TensorInfo inputTensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 0);
armnn::TensorInfo input1TensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 1);
auto layerName = fmt::format("Add:{}:{}", subgraphIndex, operatorIndex);
IConnectableLayer* layer = m_Network->AddElementwiseBinaryLayer(BinaryOperation::Add, layerName.c_str());
if (!layer)
{
throw NullPointerException(fmt::format("Layer {} pointer is null {}",
operatorIndex, CHECK_LOCATION().AsString()));
}
TensorInfo outputTensorInfo = OutputTensorInfoFromInputs(subgraphIndex, operatorIndex, layer, 0, {0, 1});
layer->GetOutputSlot(0).SetTensorInfo(outputTensorInfo);
auto inputTensorIndexes = AsUnsignedVector(GetInputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterInputSlots(subgraphIndex, operatorIndex, layer, {inputTensorIndexes[0], inputTensorIndexes[1]});
if (options)
{
layer = AddFusedActivationLayer(layer, 0, options->fused_activation_function);
}
auto outputTensorIndexes = AsUnsignedVector(GetOutputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterOutputSlots(subgraphIndex, operatorIndex, layer, {outputTensorIndexes[0]});
}
void TfLiteParserImpl::ParseMul(size_t subgraphIndex, size_t operatorIndex)
{
CHECK_MODEL(m_Model, subgraphIndex, operatorIndex);
const auto& operatorPtr = m_Model->subgraphs[subgraphIndex]->operators[operatorIndex];
const auto* options = operatorPtr->builtin_options.AsMulOptions();
auto inputs = GetInputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(inputs.size(), 2);
auto outputs = GetOutputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(outputs.size(), 1);
armnn::TensorInfo inputTensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 0);
armnn::TensorInfo input1TensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 1);
auto layerName = fmt::format("Mul:{}:{}", subgraphIndex, operatorIndex);
IConnectableLayer* layer = m_Network->AddElementwiseBinaryLayer(BinaryOperation::Mul, layerName.c_str());
if (!layer)
{
throw NullPointerException(fmt::format("Layer {} pointer is null {}",
operatorIndex, CHECK_LOCATION().AsString()));
}
TensorInfo outputTensorInfo = OutputTensorInfoFromInputs(subgraphIndex, operatorIndex, layer, 0, {0, 1});
layer->GetOutputSlot(0).SetTensorInfo(outputTensorInfo);
auto inputTensorIndexes = AsUnsignedVector(GetInputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterInputSlots(subgraphIndex, operatorIndex, layer, {inputTensorIndexes[0], inputTensorIndexes[1]});
if (options)
{
layer = AddFusedActivationLayer(layer, 0, options->fused_activation_function);
}
auto outputTensorIndexes = AsUnsignedVector(GetOutputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterOutputSlots(subgraphIndex, operatorIndex, layer, {outputTensorIndexes[0]});
}
void TfLiteParserImpl::ParseMean(size_t subgraphIndex, size_t operatorIndex)
{
CHECK_MODEL(m_Model, subgraphIndex, operatorIndex);
auto inputs = GetInputs(m_Model, subgraphIndex, operatorIndex);
auto outputs = GetOutputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(outputs.size(), 1);
TensorInfo inputTensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 0);
TensorInfo dimTensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 1);
armnn::MeanDescriptor desc;
BufferRawPtr axisBufferPtr = GetBuffer(m_Model, inputs[1]->buffer);
// Get the constant axis values from the model and set them in the descriptor.
if (axisBufferPtr != nullptr)
{
std::vector<int32_t> axisData(dimTensorInfo.GetNumElements());
::memcpy(axisData.data(), axisBufferPtr->data.data(), dimTensorInfo.GetNumBytes());
// Convert the axis to unsigned int and remove duplicates.
auto rank = static_cast<int32_t>(inputTensorInfo.GetNumDimensions());
std::set<unsigned int> uniqueAxis;
std::transform(axisData.begin(),
axisData.end(),
std::inserter(uniqueAxis, uniqueAxis.begin()),
[rank](int i)->unsigned int{
return static_cast<uint32_t>(((i + rank) % rank)); });
desc.m_Axis.assign(uniqueAxis.begin(), uniqueAxis.end());
}
else
{
for (uint32_t i = 0; i < inputTensorInfo.GetNumDimensions(); ++i)
{
desc.m_Axis.push_back(i);
}
}
armnn::TensorInfo outputTensorInfo = ToTensorInfo(outputs[0], true);
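// KeepDims is true when the reduction preserves the rank, i.e. input and output ranks match.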
desc.m_KeepDims = inputTensorInfo.GetNumDimensions() == outputTensorInfo.GetNumDimensions();
auto layerName = fmt::format("Mean:{}:{}", subgraphIndex, operatorIndex);
IConnectableLayer* layer = m_Network->AddMeanLayer(desc, layerName.c_str());
if (!layer)
{
throw NullPointerException(fmt::format("Layer {} pointer is null {}",
operatorIndex, CHECK_LOCATION().AsString()));
}
outputTensorInfo = OutputTensorInfoFromInputs(subgraphIndex, operatorIndex, layer, 0, {0});
layer->GetOutputSlot(0).SetTensorInfo(outputTensorInfo);
auto inputTensorIndexes = AsUnsignedVector(GetInputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterInputSlots(subgraphIndex, operatorIndex, layer, {inputTensorIndexes[0]});
auto outputTensorIndexes = AsUnsignedVector(GetOutputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterOutputSlots(subgraphIndex, operatorIndex, layer, {outputTensorIndexes[0]});
}
void TfLiteParserImpl::ParsePad(size_t subgraphIndex, size_t operatorIndex)
{
CHECK_MODEL(m_Model, subgraphIndex, operatorIndex);
TfLiteParserImpl::TensorRawPtrVector inputs = GetInputs(m_Model, subgraphIndex, operatorIndex);
TfLiteParserImpl::TensorRawPtrVector outputs = GetOutputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(outputs.size(), 1);
armnn::TensorInfo inputTensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 0);
armnn::TensorInfo padTensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 1);
std::vector<unsigned int> padBuffer = GetUIntBuffer(padTensorInfo, m_Model, inputs[1]->buffer);
size_t step = 2;
armnn::PadDescriptor desc;
auto opcode = GetOpCode(m_Model, subgraphIndex, operatorIndex);
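// PAD takes two inputs (input, paddings); PADV2 takes a third input holding a scalar pad value.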
if (opcode == tflite::BuiltinOperator_PAD)
{
CHECK_VALID_SIZE(inputs.size(), 2);
if (inputTensorInfo.IsQuantized())
{
desc.m_PadValue = static_cast<float>(inputTensorInfo.GetQuantizationOffset());
}
}
else if (opcode == tflite::BuiltinOperator_PADV2)
{
CHECK_VALID_SIZE(inputs.size(), 3);
armnn::TensorInfo padValueTensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 2);
if (padValueTensorInfo.GetNumElements() != 1)
{
ARMNN_THROW_PARSE_EXCEPTION("Multiple padding values are not supported in PADV2");
}
BufferRawPtr padValueBufferPtr = GetBuffer(m_Model, inputs[2]->buffer);
// Get the pad value from the input tensor
if (padValueBufferPtr->data.size() > 0)
{
switch (padValueTensorInfo.GetDataType())
{
case armnn::DataType::Float32:
{
std::vector<float> padValueBuffer(padValueTensorInfo.GetNumElements());
::memcpy(padValueBuffer.data(), padValueBufferPtr->data.data(), padValueBufferPtr->data.size());
desc.m_PadValue = padValueBuffer[0];
break;
}
case armnn::DataType::QAsymmU8:
{
std::vector<uint8_t> padValueBuffer(padValueTensorInfo.GetNumElements());
::memcpy(padValueBuffer.data(), padValueBufferPtr->data.data(), padValueBufferPtr->data.size());
desc.m_PadValue = armnn::Dequantize<uint8_t>(padValueBuffer[0],
padValueTensorInfo.GetQuantizationScale(),
padValueTensorInfo.GetQuantizationOffset());
break;
}
case armnn::DataType::QAsymmS8:
case armnn::DataType::QSymmS8:
{
std::vector<int8_t> padValueBuffer(padValueTensorInfo.GetNumElements());
::memcpy(padValueBuffer.data(), padValueBufferPtr->data.data(), padValueBufferPtr->data.size());
desc.m_PadValue = armnn::Dequantize<int8_t>(padValueBuffer[0],
padValueTensorInfo.GetQuantizationScale(),
padValueTensorInfo.GetQuantizationOffset());
break;
}
default: ARMNN_THROW_PARSE_EXCEPTION("Unsupported DataType");
}
}
else if (inputTensorInfo.IsQuantized())
{
desc.m_PadValue = static_cast<float>(inputTensorInfo.GetQuantizationOffset());
}
}
for (unsigned int i = 0; i < padTensorInfo.GetNumElements() / step; ++i)
{
desc.m_PadList.emplace_back(padBuffer[i * step], padBuffer[i * step + 1]);
}
auto layerName = (opcode == tflite::BuiltinOperator_PAD) ? fmt::format("Pad:{}:{}", subgraphIndex, operatorIndex)
: fmt::format("PadV2:{}:{}", subgraphIndex, operatorIndex);
IConnectableLayer* layer = m_Network->AddPadLayer(desc, layerName.c_str());
if (!layer)
{
throw NullPointerException(fmt::format("Layer {} pointer is null {}",
operatorIndex, CHECK_LOCATION().AsString()));
}
TensorInfo outputTensorInfo = OutputTensorInfoFromInputs(subgraphIndex, operatorIndex, layer, 0, {0});
layer->GetOutputSlot(0).SetTensorInfo(outputTensorInfo);
auto inputTensorIndexes = AsUnsignedVector(GetInputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterInputSlots(subgraphIndex, operatorIndex, layer, {inputTensorIndexes[0]});
auto outputTensorIndexes = AsUnsignedVector(GetOutputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterOutputSlots(subgraphIndex, operatorIndex, layer, {outputTensorIndexes[0]});
}
void TfLiteParserImpl::ParseMirrorPad(size_t subgraphIndex, size_t operatorIndex)
{
CHECK_MODEL(m_Model, subgraphIndex, operatorIndex);
TfLiteParserImpl::TensorRawPtrVector inputs = GetInputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(inputs.size(), 2);
TfLiteParserImpl::TensorRawPtrVector outputs = GetOutputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(outputs.size(), 1);
armnn::TensorInfo inputTensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 0);
armnn::TensorInfo padTensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 1);
BufferRawPtr bufferPtr = GetBuffer(m_Model, inputs[1]->buffer);
std::vector<unsigned int> padBuffer(padTensorInfo.GetNumElements());
::memcpy(padBuffer.data(), bufferPtr->data.data(), padTensorInfo.GetNumBytes());
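// The paddings tensor holds a [before, after] pair for each dimension.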
size_t step = 2;
armnn::PadDescriptor desc;
for (unsigned int i = 0; i < padTensorInfo.GetNumElements() / step; ++i)
{
desc.m_PadList.emplace_back(padBuffer[i * step], padBuffer[i * step + 1]);
}
const auto& operatorPtr = m_Model->subgraphs[subgraphIndex]->operators[operatorIndex];
const auto* options = operatorPtr->builtin_options.AsMirrorPadOptions();
if (options->mode == tflite::MirrorPadMode_REFLECT)
{
desc.m_PaddingMode = PaddingMode::Reflect;
}
else if (options->mode == tflite::MirrorPadMode_SYMMETRIC)
{
desc.m_PaddingMode = PaddingMode::Symmetric;
}
else
{
ARMNN_THROW_PARSE_EXCEPTION("PaddingMode must be either REFLECT or SYMMETRIC");
}
// If padding mode is Reflect then both paddings must be no greater than inputShape(i) - 1.
// If padding mode is Symmetric then both paddings must be no greater than inputShape(i).
auto inputShape = inputTensorInfo.GetShape();
auto padList = desc.m_PadList;
const unsigned int isReflect = static_cast<unsigned int>(desc.m_PaddingMode == PaddingMode::Reflect);
for(unsigned int i = 0; i < padList.size(); ++i)
{
if(padList.at(i).first > (inputShape[i] - isReflect) ||
padList.at(i).second > (inputShape[i] - isReflect))
{
ARMNN_THROW_PARSE_EXCEPTION("Padding values must be less (Reflect) or "
"equal (Symmetric) to the dimension size.");
}
}
auto layerName = fmt::format("MirrorPad:{}:{}", subgraphIndex, operatorIndex);
IConnectableLayer* layer = m_Network->AddPadLayer(desc, layerName.c_str());
if (!layer)
{
throw NullPointerException(fmt::format("Layer {} pointer is null {}",
operatorIndex, CHECK_LOCATION().AsString()));
}
TensorInfo outputTensorInfo = OutputTensorInfoFromInputs(subgraphIndex, operatorIndex, layer, 0, {0});
layer->GetOutputSlot(0).SetTensorInfo(outputTensorInfo);
auto inputTensorIndexes = AsUnsignedVector(GetInputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterInputSlots(subgraphIndex, operatorIndex, layer, {inputTensorIndexes[0]});
auto outputTensorIndexes = AsUnsignedVector(GetOutputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterOutputSlots(subgraphIndex, operatorIndex, layer, {outputTensorIndexes[0]});
}
void TfLiteParserImpl::ParsePrelu(size_t subgraphIndex, size_t operatorIndex)
{
CHECK_MODEL(m_Model, subgraphIndex, operatorIndex);
auto inputs = GetInputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(inputs.size(), 2);
auto outputs = GetOutputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(outputs.size(), 1);
auto layerName = fmt::format("Prelu:{}:{}", subgraphIndex, operatorIndex);
armnn::TensorInfo inputTensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 0);
armnn::TensorInfo alphaTensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 1);
IConnectableLayer* layer = m_Network->AddPreluLayer(layerName.c_str());
if (!layer)
{
throw NullPointerException(fmt::format("Layer {} pointer is null {}",
operatorIndex, CHECK_LOCATION().AsString()));
}
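// If the alpha input is constant it is turned into a dedicated Constant layer connected directly
// to the Prelu layer's second input slot; otherwise both inputs are registered as ordinary
// connections to be wired up once all layers have been created.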
if (IsConstTensor(inputs[1]))
{
auto inputTensorIndexes = AsUnsignedVector(GetInputTensorIds(m_Model, subgraphIndex, operatorIndex));
armnn::IInputSlot* slot = &(layer->GetInputSlot(0));
RegisterConsumerOfTensor(subgraphIndex, inputTensorIndexes[0], slot);
auto alphaTensorAndData = CreateConstTensorNonPermuted(inputs[1], alphaTensorInfo,
inputTensorInfo.GetDataType());
std::string constLayerName = fmt::format("Constant:{}", inputs[1]->name);
IConnectableLayer* constLayer =
m_Network->AddConstantLayer(alphaTensorAndData.first, constLayerName.c_str());
if (!constLayer)
{
throw NullPointerException(fmt::format("Layer {} pointer is null {}",
operatorIndex, CHECK_LOCATION().AsString()));
}
constLayer->GetOutputSlot(0).SetTensorInfo(alphaTensorInfo);
constLayer->GetOutputSlot(0).Connect(layer->GetInputSlot(1));
RegisterOutputSlots(subgraphIndex,
VIRTUAL_OPERATOR_ID,
constLayer,
{ inputTensorIndexes[1] });
}
else
{
auto inputTensorIndexes = AsUnsignedVector(GetInputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterInputSlots(subgraphIndex, operatorIndex, layer, inputTensorIndexes);
}
armnn::TensorInfo outputTensorInfo = OutputTensorInfoFromInputs(subgraphIndex, operatorIndex, layer, 0, {0, 1});
layer->GetOutputSlot(0).SetTensorInfo(outputTensorInfo);
auto outputTensorIndexes = AsUnsignedVector(GetOutputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterOutputSlots(subgraphIndex, operatorIndex, layer, outputTensorIndexes);
}
void TfLiteParserImpl::ParseQuantize(size_t subgraphIndex, size_t operatorIndex)
{
CHECK_MODEL(m_Model, subgraphIndex, operatorIndex);
auto inputs = GetInputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(inputs.size(), 1);
auto outputs = GetOutputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(outputs.size(), 1);
auto layerName = fmt::format("Quantize:{}:{}", subgraphIndex, operatorIndex);
IConnectableLayer* layer = m_Network->AddQuantizeLayer(layerName.c_str());
if (!layer)
{
throw NullPointerException(fmt::format("Layer {} pointer is null {}",
operatorIndex, CHECK_LOCATION().AsString()));
}
TensorInfo outputTensorInfo = OutputTensorInfoFromInputs(subgraphIndex, operatorIndex, layer, 0, {0});
layer->GetOutputSlot(0).SetTensorInfo(outputTensorInfo);
auto inputTensorIndexes = AsUnsignedVector(GetInputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterInputSlots(subgraphIndex, operatorIndex, layer, {inputTensorIndexes[0]});
auto outputTensorIndexes = AsUnsignedVector(GetOutputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterOutputSlots(subgraphIndex, operatorIndex, layer, outputTensorIndexes);
}
void TfLiteParserImpl::ParseRelu(size_t subgraphIndex, size_t operatorIndex)
{
ParseActivation(subgraphIndex, operatorIndex, ActivationFunction::ReLu);
}
void TfLiteParserImpl::ParseRelu6(size_t subgraphIndex, size_t operatorIndex)
{
ParseActivation(subgraphIndex, operatorIndex, ActivationFunction::BoundedReLu);
}
void TfLiteParserImpl::ParseLeakyRelu(size_t subgraphIndex, size_t operatorIndex)
{
ParseActivation(subgraphIndex, operatorIndex, ActivationFunction::LeakyReLu);
}
void TfLiteParserImpl::ParseLogistic(size_t subgraphIndex, size_t operatorIndex)
{
ParseActivation(subgraphIndex, operatorIndex, ActivationFunction::Sigmoid);
}
void TfLiteParserImpl::ParseTanH(size_t subgraphIndex, size_t operatorIndex)
{
ParseActivation(subgraphIndex, operatorIndex, ActivationFunction::TanH);
}
void TfLiteParserImpl::ParseElu(size_t subgraphIndex, size_t operatorIndex)
{
ParseActivation(subgraphIndex, operatorIndex, ActivationFunction::Elu);
}
void TfLiteParserImpl::ParseHardSwish(size_t subgraphIndex, size_t operatorIndex)
{
ParseActivation(subgraphIndex, operatorIndex, ActivationFunction::HardSwish);
}
void TfLiteParserImpl::ParseGelu(size_t subgraphIndex, size_t operatorIndex)
{
ParseActivation(subgraphIndex, operatorIndex, ActivationFunction::Gelu);
}
void TfLiteParserImpl::ParseActivation(size_t subgraphIndex, size_t operatorIndex, ActivationFunction activationType)
{
CHECK_MODEL(m_Model, subgraphIndex, operatorIndex);
const auto& operatorPtr = m_Model->subgraphs[subgraphIndex]->operators[operatorIndex];
IgnoreUnused(operatorPtr);
auto inputs = GetInputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(inputs.size(), 1);
auto outputs = GetOutputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(outputs.size(), 1);
auto layerName = fmt::format("Activation:");
ActivationDescriptor activationDesc;
activationDesc.m_Function = activationType;
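// m_A and m_B are interpreted per activation function, e.g. as the upper and lower bounds for
// BoundedReLu (RELU6) and as the alpha value for LeakyReLu and Elu, as set in the cases below.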
switch (activationType)
{
case ActivationFunction::ReLu:
{
layerName += fmt::format("RELU:{}:{}", subgraphIndex, operatorIndex);
break;
}
case ActivationFunction::BoundedReLu:
{
layerName += fmt::format("RELU6:{}:{}", subgraphIndex, operatorIndex);
activationDesc.m_A = 6.0f;
activationDesc.m_B = 0.0f;
break;
}
case ActivationFunction::Sigmoid:
{
layerName += fmt::format("SIGMOID:{}:{}", subgraphIndex, operatorIndex);
break;
}
case ActivationFunction::TanH:
{
layerName += fmt::format("TANH:{}:{}", subgraphIndex, operatorIndex);
activationDesc.m_A = 1.0f;
activationDesc.m_B = 1.0f;
break;
}
case ActivationFunction::LeakyReLu:
{
layerName += fmt::format("LEAKYRELU:{}:{}", subgraphIndex, operatorIndex);
const auto* options = operatorPtr->builtin_options.AsLeakyReluOptions();
activationDesc.m_A = options->alpha;
break;
}
case ActivationFunction::Elu:
{
layerName += fmt::format("ELU:{}:{}", subgraphIndex, operatorIndex);
activationDesc.m_A = 1.0f;
break;
}
case ActivationFunction::HardSwish:
{
layerName += fmt::format("HARDSWISH:{}:{}", subgraphIndex, operatorIndex);
break;
}
case ActivationFunction::Gelu:
{
layerName += fmt::format("GELU:{}:{}", subgraphIndex, operatorIndex);
break;
}
default:
{
throw ParseException(
fmt::format("Unexpected ActivationFunction[{}] when creating layerName {} ",
static_cast<int>(activationType), CHECK_LOCATION().AsString()));
}
}
IConnectableLayer* const layer = m_Network->AddActivationLayer(activationDesc, layerName.c_str());
TensorInfo outputTensorInfo = OutputTensorInfoFromInputs(subgraphIndex, operatorIndex, layer, 0, {0});
layer->GetOutputSlot(0).SetTensorInfo(outputTensorInfo);
// register the input connection slots for the layer, connections are made after all layers have been created
// only the tensors for the inputs are relevant, exclude the const tensors
auto inputTensorIndexes = AsUnsignedVector(GetInputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterInputSlots(subgraphIndex, operatorIndex, layer, {inputTensorIndexes[0]});
// register the output connection slots for the layer, connections are made after all layers have been created
auto outputTensorIndexes = AsUnsignedVector(GetOutputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterOutputSlots(subgraphIndex, operatorIndex, layer, {outputTensorIndexes[0]});
}
armnn::TensorInfo TfLiteParserImpl::OutputShapeOfReshape(const armnn::TensorInfo& inputTensorInfo,
const std::vector<int32_t>& targetDimsIn)
{
std::vector<unsigned int> outputDims(targetDimsIn.begin(), targetDimsIn.end());
const auto stretchDim = std::find(targetDimsIn.begin(), targetDimsIn.end(), -1);
if (stretchDim != targetDimsIn.end())
{
if (std::find(std::next(stretchDim), targetDimsIn.end(), -1) != targetDimsIn.end())
{
throw ParseException(
fmt::format("At most one component of shape can be -1 {}", CHECK_LOCATION().AsString()));
}
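// Starting the product at -1 cancels out the single -1 stretch dimension, so targetNumElements
// becomes the product of the explicitly specified dimensions, e.g. {2, -1, 3} gives 6.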
auto targetNumElements =
armnn::numeric_cast<unsigned int>(
std::accumulate(targetDimsIn.begin(), targetDimsIn.end(), -1, std::multiplies<int32_t>()));
auto stretchIndex = static_cast<size_t>(std::distance(targetDimsIn.begin(), stretchDim));
if (targetNumElements == 0)
{
if (inputTensorInfo.GetNumElements() == 0)
{
outputDims[stretchIndex] = 0;
}
else
{
throw ParseException(
fmt::format("Input to reshape is a tensor with elements, but the requested shape has 0. {}",
CHECK_LOCATION().AsString()));
}
}
else
{
outputDims[stretchIndex] = inputTensorInfo.GetNumElements() / targetNumElements;
}
}
TensorShape outputShape = TensorShape(static_cast<unsigned int>(outputDims.size()), outputDims.data());
TensorInfo reshapeInfo = inputTensorInfo;
reshapeInfo.SetShape(outputShape);
return reshapeInfo;
}
void TfLiteParserImpl::ParseReshape(size_t subgraphIndex, size_t operatorIndex)
{
CHECK_MODEL(m_Model, subgraphIndex, operatorIndex);
auto inputs = GetInputs(m_Model, subgraphIndex, operatorIndex);
auto outputs = GetOutputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(outputs.size(), 1);
const auto& operatorPtr = m_Model->subgraphs[subgraphIndex]->operators[operatorIndex];
const auto* options = operatorPtr->builtin_options.AsReshapeOptions();
auto layerName = fmt::format("Reshape:{}:{}", subgraphIndex, operatorIndex);
armnn::TensorInfo inputTensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 0);
armnn::TensorInfo actualOutputTensorInfo = ToTensorInfo(outputs[0]);
CheckMatchingQuantization(inputTensorInfo, actualOutputTensorInfo, layerName, "Input 0", "Output 0");
// Extracting new shape for the output
// There are two ways it can be passed
// * First is to define the target shape in the operator built-in options
// * Second is to pass it as a second input tensor
std::vector<int32_t> targetShape;
bool targetShapeFound = false;
// Check if built-in options were given
if (options != nullptr)
{
// make sure the parameter is given
if (options->new_shape.empty() == false)
{
targetShape = options->new_shape;
targetShapeFound = true;
}
}
// If there is no built-in option given or if the built-in new_shape parameter was empty
if (!targetShapeFound)
{
// Check for a second input tensor
if (inputs.size() > 1 && inputs[1] != nullptr)
{
if (inputs[1]->is_variable)
{
ARMNN_THROW_PARSE_EXCEPTION( "Target shapes defined in non-const input tensors is not supported");
}
if (inputs[1]->shape.size() != 1)
{
ARMNN_THROW_PARSE_EXCEPTION("Target 'shape' input is not a 1D tensor");
}
if (inputs[1]->type != tflite::TensorType_INT32)
{
ARMNN_THROW_PARSE_EXCEPTION("Target 'shape' input is not an int32 type");
}
// Extract target shape from input
auto bufferPtr = GetBuffer(m_Model, inputs[1]->buffer);
auto values = reinterpret_cast<const int32_t*>(bufferPtr->data.data());
if (values)
{
for (int i = 0; i < inputs[1]->shape[0]; ++i)
{
targetShape.push_back(values[i]);
}
}
else
{
try
{
// We attempt to infer during Runtime.
TensorShape reshapeShapes = ToTensorInfo(inputs[1]).GetShape();
if (reshapeShapes[0] == actualOutputTensorInfo.GetNumDimensions())
{
for (unsigned int i = 0; i < actualOutputTensorInfo.GetShape().GetNumDimensions(); ++i)
{
targetShape.push_back(actualOutputTensorInfo.GetShape()[i]);
}
}
// The parser only supports shape (batch, -1) or (-1) for non-constant shape input.
else if (reshapeShapes[0] > 2)
{
throw ParseException(fmt::format("Invalid input shape '{}' in Reshape layer '{}' {}. "
"When inferring during runtime, the parser only supports "
"shape (batch, -1) or (-1) for target shape input.",
reshapeShapes[0],
layerName,
CHECK_LOCATION().AsString()));
}
else
{
const int32_t numInputElements = inputTensorInfo.GetNumElements();
const int32_t inputTensorShape = inputTensorInfo.GetShape()[0];
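// Illustrative values (not from the model): a {4, 6} input with a rank-1 shape tensor resolves
// to a target shape of {24}; with a rank-2 shape tensor it resolves to {4, 24 / 4} = {4, 6}.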
if (reshapeShapes[0] == 1)
{
targetShape = {numInputElements};
}
else if (reshapeShapes[0] == 2)
{
targetShape = {inputTensorShape, numInputElements / inputTensorShape};
}
}
}
catch (const std::exception& exc)
{
ARMNN_THROW_PARSE_EXCEPTION("Failed attempt to infer during runtime the target shape input for "
"Reshape operation. Reshape operator target shape input buffer data "
"is null. " << exc.what());
}
}
}
else
{
ARMNN_THROW_PARSE_EXCEPTION("Target shape not defined in reshape parameters or input tensor. "
"At least one method required");
}
}
armnn::TensorInfo reshapeOutputTensorInfo =
TfLiteParserImpl::OutputShapeOfReshape(inputTensorInfo, targetShape);
// Check for valid input size and that reshape parameters equal output shape
// The output shape can be provided to us in 2 ways:
// 1. through the normal 'shape' parameter given by outputs[idx]->shape
// 2. through the additional parameter 'shape_signature' given by outputs[idx]->buffer.
// This parameter can sometimes contain -1 value not visible in the 'shape' parameter.
const armnn::TensorShape& reshapeOutputTensorShape = reshapeOutputTensorInfo.GetShape();
if (inputs.size() > 1 && !CheckShape(reshapeOutputTensorShape, outputs[0]->shape))
{
// Attempt to extract output shape from secondary 'shape_signature'
// parameter and try to CheckShape() with this param.
std::vector<int32_t> secondaryOutputTargetShape = outputs[0]->shape_signature;
// if outputs[0]->shape_signature contain a -1 value, we need to compute its actual value
// from reshape input in order to correctly verify reshape parameters equal output shape
armnn::TensorInfo secondaryReshapeOutputTensorInfo =
TfLiteParserImpl::OutputShapeOfReshape(inputTensorInfo, secondaryOutputTargetShape);
if (!CheckShape(reshapeOutputTensorShape, secondaryReshapeOutputTensorInfo.GetShape()))
{
std::stringstream ss;
ss << "New shape defined in reshape parameters "
<< reshapeOutputTensorShape
<< " does not equal output shape "
<< actualOutputTensorInfo.GetShape()
<< ": "
<< CHECK_LOCATION().AsString();
throw ParseException(ss.str());
}
}
auto outputTensorIds = GetOutputTensorIds(m_Model, subgraphIndex, operatorIndex);
ReshapeDescriptor reshapeDesc;
reshapeDesc.m_TargetShape = reshapeOutputTensorInfo.GetShape();
m_TensorInfos[outputTensorIds[0]] = reshapeOutputTensorInfo;
IConnectableLayer* layer = m_Network->AddReshapeLayer(reshapeDesc, layerName.c_str());
if (!layer)
{
throw NullPointerException(fmt::format("Layer {} pointer is null {}",
operatorIndex, CHECK_LOCATION().AsString()));
}
layer->GetOutputSlot(0).SetTensorInfo(reshapeOutputTensorInfo);
auto inputTensorIndexes = AsUnsignedVector(GetInputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterInputSlots(subgraphIndex, operatorIndex, layer, {inputTensorIndexes[0]});
auto outputTensorIndexes = AsUnsignedVector(GetOutputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterOutputSlots(subgraphIndex, operatorIndex, layer, {outputTensorIndexes[0]});
}
void TfLiteParserImpl::ParseResizeBilinear(size_t subgraphIndex, size_t operatorIndex)
{
ParseResize(subgraphIndex, operatorIndex, ResizeMethod::Bilinear);
}
void TfLiteParserImpl::ParseResizeNearestNeighbor(size_t subgraphIndex, size_t operatorIndex)
{
ParseResize(subgraphIndex, operatorIndex, ResizeMethod::NearestNeighbor);
}
void TfLiteParserImpl::ParseResize(size_t subgraphIndex, size_t operatorIndex, ResizeMethod resizeMethod)
{
CHECK_MODEL(m_Model, subgraphIndex, operatorIndex);
auto inputs = GetInputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(inputs.size(), 2);
auto outputs = GetOutputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(outputs.size(), 1);
armnn::TensorInfo sizeTensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 1);
// Data for the parsed tensor args (size) must be stored locally.
std::vector<int32_t> sizeTensorData(sizeTensorInfo.GetNumElements());
BufferRawPtr sizeBufferPtr = GetBuffer(m_Model, inputs[1]->buffer);
::memcpy(sizeTensorData.data(), sizeBufferPtr->data.data(), sizeTensorInfo.GetNumBytes());
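// The size input is expected to hold two int32 values, {target_height, target_width}, which are
// mapped onto m_TargetHeight and m_TargetWidth below.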
ResizeDescriptor desc;
desc.m_Method = resizeMethod;
desc.m_TargetHeight = static_cast<uint32_t> (sizeTensorData[0]);
desc.m_TargetWidth = static_cast<uint32_t> (sizeTensorData[1]);
desc.m_DataLayout = armnn::DataLayout::NHWC;
auto layerName = fmt::format("Resize:");
switch (resizeMethod)
{
case ResizeMethod::Bilinear:
{
layerName += fmt::format("BILINEAR:{}:{}", subgraphIndex, operatorIndex);
const auto & operatorPtr = m_Model->subgraphs[subgraphIndex]->operators[operatorIndex];
const auto * options = operatorPtr->builtin_options.AsResizeBilinearOptions();
desc.m_AlignCorners = options->align_corners;
break;
}
case ResizeMethod::NearestNeighbor:
{
layerName += fmt::format("NEARESTNEIGHBOR:{}:{}", subgraphIndex, operatorIndex);
break;
}
default:
{
throw ParseException(
fmt::format("Unexpected ResizeMethod[{}] when creating layerName {} ",
static_cast<int>(resizeMethod), CHECK_LOCATION().AsString()));
}
}
TensorInfo inputTensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 0);
IConnectableLayer* layer = m_Network->AddResizeLayer(desc, layerName.c_str());
if (!layer)
{
throw NullPointerException(fmt::format("Layer {} pointer is null {}",
operatorIndex, CHECK_LOCATION().AsString()));
}
TensorInfo outputTensorInfo = OutputTensorInfoFromInputs(subgraphIndex, operatorIndex, layer, 0, {0});
CheckMatchingQuantization(inputTensorInfo, outputTensorInfo, layerName, "Input 0", "Output 0");
layer->GetOutputSlot(0).SetTensorInfo(outputTensorInfo);
auto inputTensorIndexes = AsUnsignedVector(GetInputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterInputSlots(subgraphIndex, operatorIndex, layer, {inputTensorIndexes[0]});
auto outputTensorIndexes = AsUnsignedVector(GetOutputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterOutputSlots(subgraphIndex, operatorIndex, layer, outputTensorIndexes);
}
void TfLiteParserImpl::ParseReverseV2(size_t subgraphIndex, size_t operatorIndex)
{
CHECK_MODEL(m_Model, subgraphIndex, operatorIndex);
auto inputs = GetInputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(inputs.size(), 2);
auto outputs = GetOutputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(outputs.size(), 1);
auto layerName = fmt::format("ReverseV2:{}:{}", subgraphIndex, operatorIndex);
TensorInfo inputTensorInfo = ToTensorInfo(inputs[0]);
TensorInfo axisTensorInfo = ToTensorInfo(inputs[1]);
TensorInfo outputTensorInfo = ToTensorInfo(outputs[0]);
IConnectableLayer* layer = m_Network->AddReverseV2Layer(layerName.c_str());
ARMNN_ASSERT(layer != nullptr);
layer->GetOutputSlot(0).SetTensorInfo(outputTensorInfo);
auto inputTensorIndexes = AsUnsignedVector(GetInputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterInputSlots(subgraphIndex, operatorIndex, layer, {inputTensorIndexes[0], inputTensorIndexes[1]});
auto outputTensorIndexes = AsUnsignedVector(GetOutputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterOutputSlots(subgraphIndex, operatorIndex, layer, {outputTensorIndexes[0]});
}
void TfLiteParserImpl::ParseTile(size_t subgraphIndex, size_t operatorIndex)
{
CHECK_MODEL(m_Model, subgraphIndex, operatorIndex);
auto inputs = GetInputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(inputs.size(), 2);
auto outputs = GetOutputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(outputs.size(), 1);
TensorInfo inputTensorInfo = ToTensorInfo(inputs[0]);
TensorInfo multiplesTensorInfo = ToTensorInfo(inputs[1]);
TensorInfo outputTensorInfo = ToTensorInfo(outputs[0]);
auto layerName = fmt::format("Tile:{}:{}", subgraphIndex, operatorIndex);
TileDescriptor descriptor;
BufferRawPtr multiplesBufferPtr = GetBuffer(m_Model, inputs[1]->buffer);
if (multiplesBufferPtr != nullptr)
{
std::vector<int32_t> multiplesData(multiplesTensorInfo.GetNumElements());
::memcpy(multiplesData.data(), multiplesBufferPtr->data.data(), multiplesTensorInfo.GetNumBytes());
descriptor.m_Multiples.assign(multiplesData.begin(), multiplesData.end());
}
else
{
ARMNN_THROW_PARSE_EXCEPTION("For Tile layer, Multiples data was not found in the buffer.");
}
IConnectableLayer* layer = m_Network->AddTileLayer(descriptor, layerName.c_str());
ARMNN_ASSERT(layer != nullptr);
layer->GetOutputSlot(0).SetTensorInfo(outputTensorInfo);
auto inputTensorIndexes = AsUnsignedVector(GetInputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterInputSlots(subgraphIndex, operatorIndex, layer, {inputTensorIndexes[0]});
auto outputTensorIndexes = AsUnsignedVector(GetOutputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterOutputSlots(subgraphIndex, operatorIndex, layer, {outputTensorIndexes[0]});
}
void TfLiteParserImpl::ParseConcatenation(size_t subgraphIndex, size_t operatorIndex)
{
CHECK_MODEL(m_Model, subgraphIndex, operatorIndex);
const auto& operatorPtr = m_Model->subgraphs[subgraphIndex]->operators[operatorIndex];
const auto* options = operatorPtr->builtin_options.AsConcatenationOptions();
CHECK_SUPPORTED_FUSED_ACTIVATION(options, subgraphIndex, operatorIndex);
auto inputs = GetInputs(m_Model, subgraphIndex, operatorIndex);
auto outputs = GetOutputs(m_Model, subgraphIndex, operatorIndex);
auto inputTensorIds = GetInputTensorIds(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(outputs.size(), 1);
unsigned int numConcatView = static_cast<unsigned int>(inputs.size());
uint32_t inputRank = InputTensorInfo(subgraphIndex, operatorIndex, 0).GetNumDimensions();
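// Wrap a possibly negative concatenation axis into the range [0, inputRank),
// e.g. axis -1 on a rank-4 input becomes concat dimension 3.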
const unsigned int concatDimInput = static_cast<unsigned int>(
(static_cast<int>(inputRank) + options->axis) % static_cast<int>(inputRank));
OriginsDescriptor concatDescriptor(static_cast<uint32_t>(numConcatView), inputRank);
concatDescriptor.SetConcatAxis(concatDimInput);
unsigned int mergeDimOrigin = 0;
for (unsigned int viewIndex = 0; viewIndex < numConcatView; ++viewIndex)
{
TensorInfo inputTensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, viewIndex);
// This sets up the concatDescriptor view origins
armnnUtils::ProcessConcatInputTensorInfo(
inputTensorInfo, concatDescriptor, concatDimInput, viewIndex, mergeDimOrigin);
}
auto layerName = fmt::format("Concatenation:{}:{}", subgraphIndex, operatorIndex);
IConnectableLayer* layer = m_Network->AddConcatLayer(concatDescriptor, layerName.c_str());
if (!layer)
{
throw NullPointerException(fmt::format("Layer {} pointer is null {}",
operatorIndex, CHECK_LOCATION().AsString()));
}
TensorInfo outputTensorInfo = OutputTensorInfoFromInputs(subgraphIndex, operatorIndex, layer, 0, {});
layer->GetOutputSlot(0).SetTensorInfo(outputTensorInfo);
auto inputTensorIndexes = AsUnsignedVector(GetInputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterInputSlots(subgraphIndex, operatorIndex, layer, {inputTensorIndexes});
// add fused activation layer
layer = AddFusedActivationLayer(layer, 0, options->fused_activation_function);
auto outputTensorIndexes = AsUnsignedVector(GetOutputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterOutputSlots(subgraphIndex, operatorIndex, layer, {outputTensorIndexes[0]});
}
void TfLiteParserImpl::ParseFullyConnected(size_t subgraphIndex, size_t operatorIndex)
{
CHECK_MODEL(m_Model, subgraphIndex, operatorIndex);
const auto& operatorRfr = m_Model->subgraphs[subgraphIndex]->operators[operatorIndex];
const auto options = operatorRfr->builtin_options.AsFullyConnectedOptions();
CHECK_SUPPORTED_FUSED_ACTIVATION(options, subgraphIndex, operatorIndex);
FullyConnectedDescriptor desc;
desc.m_BiasEnabled = false;
desc.m_TransposeWeightMatrix = true;
auto inputs = GetInputs(m_Model, subgraphIndex, operatorIndex);
auto outputs = GetOutputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(outputs.size(), 1);
armnn::TensorInfo filterTensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 1);
// Fully Connected Layer accepts two dimensional weights input
int32_t weightsDimension = static_cast<int32_t>(filterTensorInfo.GetNumDimensions());
if (weightsDimension != 2)
{
throw ParseException(
fmt::format("Dimension {} for Fully Connected weights is not supported by Armnn. "
"Node {}",
weightsDimension,
CHECK_LOCATION().AsString()));
}
armnn::IConnectableLayer* layer = nullptr;
auto layerName = fmt::format("FullyConnected:{}:{}", subgraphIndex, operatorIndex);
auto inputTensorIndexes = AsUnsignedVector(GetInputTensorIds(m_Model, subgraphIndex, operatorIndex));
// Add the first input tensor to the registration list
std::vector<unsigned int> tensorIndexesToRegister = {inputTensorIndexes[0]};
armnn::TensorInfo inputTensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 0);
desc.m_ConstantWeights = IsConstTensor(inputs[1]);
// Add the weights input to the registration list, constant layers will be added by SetupConstantLayers if constant.
tensorIndexesToRegister.emplace_back(inputTensorIndexes[1]);
if (ShouldConstantTensorBeConverted(inputs[1], inputTensorInfo.GetDataType(), filterTensorInfo.GetDataType()))
{
m_ConstantsToDequantize.emplace_back(inputs[1]->buffer);
}
if (inputs.size() == 3)
{
desc.m_BiasEnabled = true;
armnn::TensorInfo biasTensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 2);
// Add the biases input to the registration list, constant layer will be added by SetupConstantLayers.
tensorIndexesToRegister.emplace_back(inputTensorIndexes[2]);
if (ShouldConstantTensorBeConverted(inputs[2], inputTensorInfo.GetDataType(), biasTensorInfo.GetDataType()))
{
m_ConstantsToDequantize.emplace_back(inputs[2]->buffer);
}
}
// Filters and biases are always passed to fully connected as inputs
layer = m_Network->AddFullyConnectedLayer(desc, layerName.c_str());
if (!layer)
{
throw NullPointerException(fmt::format("Layer {} pointer is null {}",
operatorIndex, CHECK_LOCATION().AsString()));
}
unsigned int startingSlotIndex = 0;
if (inputTensorInfo.GetNumDimensions() > 2)
{
// Add reshape to flatten to 2D [batch_size, input_size],
// where "input_size" corresponds to the number of inputs to the layer,
// matching the second dimension of weights,
// and "batch_size" is calculated by dividing the number of elements by "input_size".
std::vector<unsigned int> reshapedDimensions(2);
reshapedDimensions[1] = filterTensorInfo.GetShape()[1];
reshapedDimensions[0] = inputTensorInfo.GetNumElements() / reshapedDimensions[1];
if (inputTensorInfo.GetNumElements() % reshapedDimensions[1] != 0)
{
throw ParseException(
fmt::format("Failed to deduce input tensor shape from filter size {} {}",
reshapedDimensions[1],
CHECK_LOCATION().AsString()));
}
armnn::TensorInfo reshapedTensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 0);
reshapedTensorInfo.SetShape(armnn::TensorShape{ 2, reshapedDimensions.data() });
inputTensorInfo = reshapedTensorInfo;
std::string reshapeLayerName = fmt::format("Reshape_for:{}", layer->GetName());
armnn::ReshapeDescriptor reshapeDescriptor;
reshapeDescriptor.m_TargetShape = reshapedTensorInfo.GetShape();
armnn::IConnectableLayer* reshapeLayer = m_Network->AddReshapeLayer(reshapeDescriptor,
reshapeLayerName.c_str());
reshapeLayer->GetOutputSlot(0).SetTensorInfo(reshapedTensorInfo);
reshapeLayer->GetOutputSlot(0).Connect(layer->GetInputSlot(0));
RegisterInputSlots(subgraphIndex, operatorIndex, reshapeLayer, {inputTensorIndexes[0]});
// Fc layer connects to the reshape layer, so we skip the first input slot when registering fc's input slots
tensorIndexesToRegister.erase(tensorIndexesToRegister.begin());
startingSlotIndex = 1;
}
RegisterInputSlots(subgraphIndex, operatorIndex, layer, tensorIndexesToRegister, startingSlotIndex);
armnn::TensorInfo outputTensorInfo = OutputTensorInfoFromShapes(subgraphIndex, operatorIndex, layer, 0,
{ inputTensorInfo.GetShape(),
filterTensorInfo.GetShape() });
layer->GetOutputSlot(0).SetTensorInfo(outputTensorInfo);
if (outputTensorInfo.GetNumDimensions() > 2)
{
// Calculate reshape to flatten to 2D [batch_size, input_size]
std::vector<unsigned int> reshapedDimensions(2);
reshapedDimensions[1] = filterTensorInfo.GetShape()[0];
reshapedDimensions[0] = outputTensorInfo.GetNumElements() / reshapedDimensions[1];
armnn::TensorInfo reshapedOutputTensorInfo = outputTensorInfo;
if (outputTensorInfo.GetNumElements() % reshapedDimensions[1] != 0)
{
throw ParseException(
fmt::format("Failed to deduce output tensor shape from filter size {} {}",
reshapedDimensions[1],
CHECK_LOCATION().AsString()));
}
reshapedOutputTensorInfo.SetShape(armnn::TensorShape{ 2, reshapedDimensions.data() });
layer->GetOutputSlot(0).SetTensorInfo(reshapedOutputTensorInfo);
std::string reshapeLayerName = fmt::format("ExpandDims:{}:{}", subgraphIndex, operatorIndex);
layer = AddReshapeLayer(layer, 0, reshapeLayerName, outputTensorInfo);
}
// we need to add the activation layer and fortunately we don't need to care about the data layout
armnn::IConnectableLayer* fusedActivationLayer = AddFusedActivationLayer(layer, 0,
options->fused_activation_function);
// register the output connection slots for the layer, connections are made after all layers have been created
auto outputTensorIndexes = AsUnsignedVector(GetOutputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterOutputSlots(subgraphIndex, operatorIndex, fusedActivationLayer, {outputTensorIndexes[0]});
m_TensorInfos[outputTensorIndexes[0]] = layer->GetOutputSlot(0).GetTensorInfo();
}
void TfLiteParserImpl::ParseDetectionPostProcess(size_t subgraphIndex, size_t operatorIndex)
{
CHECK_MODEL(m_Model, subgraphIndex, operatorIndex);
const auto& operatorPtr = m_Model->subgraphs[subgraphIndex]->operators[operatorIndex];
auto inputs = GetInputs(m_Model, subgraphIndex, operatorIndex);
auto outputs = GetOutputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(outputs.size(), 4);
// Obtain custom options from flexbuffers
auto custom_options = operatorPtr->custom_options;
const flexbuffers::Map& m = flexbuffers::GetRoot(custom_options.data(), custom_options.size()).AsMap();
// Obtain descriptor information from tf lite
DetectionPostProcessDescriptor desc;
desc.m_MaxDetections = m["max_detections"].AsUInt32();
desc.m_MaxClassesPerDetection = m["max_classes_per_detection"].AsUInt32();
desc.m_NmsScoreThreshold = m["nms_score_threshold"].AsFloat();
desc.m_NmsIouThreshold = m["nms_iou_threshold"].AsFloat();
desc.m_NumClasses = m["num_classes"].AsUInt32();
desc.m_ScaleH = m["h_scale"].AsFloat();
desc.m_ScaleW = m["w_scale"].AsFloat();
desc.m_ScaleX = m["x_scale"].AsFloat();
desc.m_ScaleY = m["y_scale"].AsFloat();
if (!(m["use_regular_nms"].IsNull()))
{
desc.m_UseRegularNms = m["use_regular_nms"].AsBool();
}
if (!(m["detections_per_class"].IsNull()))
{
desc.m_DetectionsPerClass = m["detections_per_class"].AsUInt32();
}
if (desc.m_NmsIouThreshold <= 0.0f || desc.m_NmsIouThreshold > 1.0f)
{
throw InvalidArgumentException("DetectionPostProcessTFLiteParser: Intersection over union threshold "
"must be positive and less than or equal to 1.");
}
armnn::TensorInfo anchorTensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 2);
auto anchorTensorAndData = CreateConstTensorNonPermuted(inputs[2], anchorTensorInfo);
auto layerName = fmt::format("DetectionPostProcess:{}:{}", subgraphIndex, operatorIndex);
IConnectableLayer* layer = m_Network->AddDetectionPostProcessLayer(desc, anchorTensorAndData,
layerName.c_str());
if (!layer)
{
throw NullPointerException(fmt::format("Layer {} pointer is null {}",
operatorIndex, CHECK_LOCATION().AsString()));
}
// The model does not specify the output shapes.
// The output shapes are calculated from max_detections and max_classes_per_detection.
unsigned int numDetectedBox = desc.m_MaxDetections * desc.m_MaxClassesPerDetection;
m_OverriddenOutputShapes.push_back({ 1, numDetectedBox, 4 });
m_OverriddenOutputShapes.push_back({ 1, numDetectedBox });
m_OverriddenOutputShapes.push_back({ 1, numDetectedBox });
m_OverriddenOutputShapes.push_back({ 1 });
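// In order, these correspond to the detection boxes {1, numDetectedBox, 4}, detection classes
// {1, numDetectedBox}, detection scores {1, numDetectedBox} and the number of detections {1}.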
for (unsigned int i = 0 ; i < outputs.size() ; ++i)
{
armnn::TensorInfo detectionBoxOutputTensorInfo = ToTensorInfo(outputs[i], m_OverriddenOutputShapes[i]);
layer->GetOutputSlot(i).SetTensorInfo(detectionBoxOutputTensorInfo);
}
// Register the input connection slots for the layer, connections are made after all layers have been created
// only the tensors for the inputs are relevant, exclude the const tensors
auto inputTensorIndexes = AsUnsignedVector(GetInputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterInputSlots(subgraphIndex, operatorIndex, layer, {inputTensorIndexes[0], inputTensorIndexes[1]});
// Register the output connection slots for the layer, connections are made after all layers have been created
auto outputTensorIndexes = AsUnsignedVector(GetOutputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterOutputSlots(subgraphIndex, operatorIndex, layer, {outputTensorIndexes[0],
outputTensorIndexes[1],
outputTensorIndexes[2],
outputTensorIndexes[3]});
}
/// The TfLite Pack operator is equivalent to the ArmNN Stack operator
void TfLiteParserImpl::ParsePack(size_t subgraphIndex, size_t operatorIndex)
{
CHECK_MODEL(m_Model, subgraphIndex, operatorIndex);
auto inputs = GetInputs(m_Model, subgraphIndex, operatorIndex);
auto outputs = GetOutputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(outputs.size(), 1);
if (inputs.size() < 1)
{
throw ParseException("Pack must have at least one input.");
}
const auto& operatorPtr = m_Model->subgraphs[subgraphIndex]->operators[operatorIndex];
const auto* options = operatorPtr->builtin_options.AsPackOptions();
StackDescriptor desc;
desc.m_Axis = static_cast<uint32_t>(options->axis);
desc.m_NumInputs = static_cast<uint32_t>(inputs.size());
// Use the tensor shape of the first input as the "correct" input shape in the descriptor
armnn::TensorInfo inputTensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 0);
desc.m_InputShape = inputTensorInfo.GetShape();
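// Illustrative values (not from the model): packing three {4, 5} inputs along axis 1 produces a
// {4, 3, 5} output.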
auto layerName = fmt::format("Pack:{}:{}", subgraphIndex, operatorIndex);
IConnectableLayer* layer = m_Network->AddStackLayer(desc, layerName.c_str());
if (!layer)
{
throw NullPointerException(fmt::format("Layer {} pointer is null {}",
operatorIndex, CHECK_LOCATION().AsString()));
}
armnn::TensorInfo outputTensorInfo = OutputTensorInfoFromInputs(subgraphIndex, operatorIndex, layer, 0, {});
layer->GetOutputSlot(0).SetTensorInfo(outputTensorInfo);
auto inputTensorIndexes = AsUnsignedVector(GetInputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterInputSlots(subgraphIndex, operatorIndex, layer, {inputTensorIndexes});
auto outputTensorIndexes = AsUnsignedVector(GetOutputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterOutputSlots(subgraphIndex, operatorIndex, layer, {outputTensorIndexes[0]});
}
void TfLiteParserImpl::ParseUnidirectionalSequenceLSTM(size_t subgraphIndex, size_t operatorIndex)
{
CHECK_MODEL(m_Model, subgraphIndex, operatorIndex);
auto inputs = GetInputs(m_Model, subgraphIndex, operatorIndex);
auto outputs = GetOutputs(m_Model, subgraphIndex, operatorIndex);
if (inputs.size() < 2)
{
throw ParseException("UnidirectionalSequenceLSTM must have at least 2 input.");
}
const auto& operatorPtr = m_Model->subgraphs[subgraphIndex]->operators[operatorIndex];
const auto& subgraphPtr = m_Model->subgraphs[subgraphIndex];
const auto nodeParams = operatorPtr->builtin_options.AsUnidirectionalSequenceLSTMOptions();
CHECK_SUPPORTED_FUSED_ACTIVATION(nodeParams, subgraphIndex, operatorIndex);
auto inputTensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 0);
auto outputTensorInfo = ToTensorInfo(outputs[0]);
// Set the params structure for the AddUnidirectionalSequenceLstmLayer call
// Please refer to each operand at
// https://www.tensorflow.org/mlir/tfl_ops#tflunidirectional_sequence_lstm_tflunidirectionalsequencelstmop
armnn::LstmInputParams params;
if (IsOptionalOperandPresent(operatorPtr->inputs[1]))
{
params.m_InputToInputWeights = CreateConstTensorPtr(subgraphPtr->tensors[operatorPtr->inputs[1]].get(),
inputTensorInfo).first;
}
params.m_InputToForgetWeights = CreateConstTensorPtr(subgraphPtr->tensors[operatorPtr->inputs[2]].get(),
inputTensorInfo).first;
params.m_InputToCellWeights = CreateConstTensorPtr(subgraphPtr->tensors[operatorPtr->inputs[3]].get(),
inputTensorInfo).first;
params.m_InputToOutputWeights = CreateConstTensorPtr(subgraphPtr->tensors[operatorPtr->inputs[4]].get(),
inputTensorInfo).first;
// Recurrent weight tensors of size {n_cell, n_output}
if (IsOptionalOperandPresent(operatorPtr->inputs[5]))
{
params.m_RecurrentToInputWeights = CreateConstTensorPtr(subgraphPtr->tensors[operatorPtr->inputs[5]].get(),
inputTensorInfo).first;
}
params.m_RecurrentToForgetWeights = CreateConstTensorPtr(subgraphPtr->tensors[operatorPtr->inputs[6]].get(),
inputTensorInfo).first;
params.m_RecurrentToCellWeights = CreateConstTensorPtr(subgraphPtr->tensors[operatorPtr->inputs[7]].get(),
inputTensorInfo).first;
params.m_RecurrentToOutputWeights = CreateConstTensorPtr(subgraphPtr->tensors[operatorPtr->inputs[8]].get(),
inputTensorInfo).first;
// Peephole weights tensors of size {n_cell}, representing a diagonal matrix.
if (IsOptionalOperandPresent(operatorPtr->inputs[9]))
{
params.m_CellToInputWeights = CreateConstTensorPtr(subgraphPtr->tensors[operatorPtr->inputs[9]].get(),
inputTensorInfo).first;
}
if (IsOptionalOperandPresent(operatorPtr->inputs[10]))
{
params.m_CellToForgetWeights = CreateConstTensorPtr(subgraphPtr->tensors[operatorPtr->inputs[10]].get(),
inputTensorInfo).first;
}
if (IsOptionalOperandPresent(operatorPtr->inputs[11]))
{
params.m_CellToOutputWeights = CreateConstTensorPtr(subgraphPtr->tensors[operatorPtr->inputs[11]].get(),
inputTensorInfo).first;
}
// Gates bias tensors of size {n_cell}
if (IsOptionalOperandPresent(operatorPtr->inputs[12]))
{
params.m_InputGateBias = CreateConstTensorPtr(subgraphPtr->tensors[operatorPtr->inputs[12]].get(),
inputTensorInfo).first;
}
params.m_ForgetGateBias = CreateConstTensorPtr(subgraphPtr->tensors[operatorPtr->inputs[13]].get(),
inputTensorInfo).first;
params.m_CellBias = CreateConstTensorPtr(subgraphPtr->tensors[operatorPtr->inputs[14]].get(),
inputTensorInfo).first;
params.m_OutputGateBias = CreateConstTensorPtr(subgraphPtr->tensors[operatorPtr->inputs[15]].get(),
inputTensorInfo).first;
// Projection weight tensor of size {n_output, n_cell}
if (IsOptionalOperandPresent(operatorPtr->inputs[16]))
{
params.m_ProjectionWeights = CreateConstTensorPtr(subgraphPtr->tensors[operatorPtr->inputs[16]].get(),
inputTensorInfo).first;
}
// Projection bias tensor of size {n_output}
if (IsOptionalOperandPresent(operatorPtr->inputs[17]))
{
params.m_ProjectionBias = CreateConstTensorPtr(subgraphPtr->tensors[operatorPtr->inputs[17]].get(),
inputTensorInfo).first;
}
// These state tensors are defined as variable tensors, and will be modified by this op.
armnn::TensorInfo outputStateInInfo = ToTensorInfo(subgraphPtr->tensors[operatorPtr->inputs[18]].get());
m_ConstantsToBeCreated.push_back(operatorPtr->inputs[18]);
armnn::TensorInfo cellStateInInfo = ToTensorInfo(subgraphPtr->tensors[operatorPtr->inputs[19]].get());
m_ConstantsToBeCreated.push_back(operatorPtr->inputs[19]);
// Layer norm coefficient tensors of size {n_cell}, representing a diagonal matrix.
if (inputs.size() >= 21 && IsOptionalOperandPresent(operatorPtr->inputs[20]))
{
params.m_InputLayerNormWeights = CreateConstTensorPtr(subgraphPtr->tensors[operatorPtr->inputs[20]].get(),
inputTensorInfo).first;
}
if (inputs.size() >= 22 && IsOptionalOperandPresent(operatorPtr->inputs[21]))
{
params.m_ForgetLayerNormWeights = CreateConstTensorPtr(subgraphPtr->tensors[operatorPtr->inputs[21]].get(),
inputTensorInfo).first;
}
if (inputs.size() >= 23 && IsOptionalOperandPresent(operatorPtr->inputs[22]))
{
params.m_CellLayerNormWeights = CreateConstTensorPtr(subgraphPtr->tensors[operatorPtr->inputs[22]].get(),
inputTensorInfo).first;
}
if (inputs.size() >= 24 && IsOptionalOperandPresent(operatorPtr->inputs[23]))
{
params.m_OutputLayerNormWeights = CreateConstTensorPtr(subgraphPtr->tensors[operatorPtr->inputs[23]].get(),
inputTensorInfo).first;
}
// set the layer descriptor
armnn::UnidirectionalSequenceLstmDescriptor desc;
desc.m_ActivationFunc = nodeParams->fused_activation_function;
desc.m_ClippingThresCell = nodeParams->cell_clip;
desc.m_ClippingThresProj = nodeParams->proj_clip;
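// CIFG (coupled input and forget gate) is enabled when the optional input gate tensors are
// absent; peephole, projection and layer normalisation are likewise inferred below from which
// optional tensors were supplied.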
desc.m_CifgEnabled = (params.m_InputToInputWeights == nullptr
|| params.m_RecurrentToInputWeights == nullptr
|| params.m_InputGateBias == nullptr);
desc.m_PeepholeEnabled = (params.m_CellToForgetWeights != nullptr || params.m_CellToOutputWeights != nullptr);
desc.m_ProjectionEnabled = (params.m_ProjectionWeights != nullptr);
desc.m_LayerNormEnabled = (params.m_InputLayerNormWeights != nullptr
|| params.m_ForgetLayerNormWeights != nullptr
|| params.m_CellLayerNormWeights != nullptr
|| params.m_OutputLayerNormWeights != nullptr);
desc.m_TimeMajor = nodeParams->time_major;
if (operatorPtr->intermediates.size() > 3 && desc.m_LayerNormEnabled)
{
auto inputIntermediate = CreateConstTensorPtr(subgraphPtr->tensors[operatorPtr->intermediates[0]].get(),
inputTensorInfo).first;
auto inputIntermediateTensorInfo = inputIntermediate->GetInfo();
desc.m_InputIntermediateScale = inputIntermediateTensorInfo.GetQuantizationScale();
auto forgetIntermediate = CreateConstTensorPtr(subgraphPtr->tensors[operatorPtr->intermediates[1]].get(),
inputTensorInfo).first;
auto forgetIntermediateTensorInfo = forgetIntermediate->GetInfo();
desc.m_ForgetIntermediateScale = forgetIntermediateTensorInfo.GetQuantizationScale();
auto cellIntermediate = CreateConstTensorPtr(subgraphPtr->tensors[operatorPtr->intermediates[2]].get(),
inputTensorInfo).first;
auto cellIntermediateTensorInfo = cellIntermediate->GetInfo();
desc.m_CellIntermediateScale = cellIntermediateTensorInfo.GetQuantizationScale();
auto outputIntermediate = CreateConstTensorPtr(subgraphPtr->tensors[operatorPtr->intermediates[3]].get(),
inputTensorInfo).first;
auto outputIntermediateTensorInfo = outputIntermediate->GetInfo();
desc.m_OutputIntermediateScale = outputIntermediateTensorInfo.GetQuantizationScale();
}
else
{
float defaultIntermediate = std::pow(2, -12);
desc.m_InputIntermediateScale = defaultIntermediate;
desc.m_ForgetIntermediateScale = defaultIntermediate;
desc.m_CellIntermediateScale = defaultIntermediate;
desc.m_OutputIntermediateScale = defaultIntermediate;
}
if (operatorPtr->intermediates.size() > 4)
{
auto hiddentensor = CreateConstTensorPtr(subgraphPtr->tensors[operatorPtr->intermediates[4]].get(),
inputTensorInfo).first;
desc.m_HiddenStateScale = hiddentensor->GetInfo().GetQuantizationScale();
desc.m_HiddenStateZeroPoint = hiddentensor->GetInfo().GetQuantizationOffset();
}
unsigned int batchSize = desc.m_TimeMajor ? inputTensorInfo.GetShape()[1] : inputTensorInfo.GetShape()[0];
unsigned int outputSize = outputTensorInfo.GetShape()[2];
unsigned int numUnits = cellStateInInfo.GetShape()[1];
armnn::DataType dataType = inputTensorInfo.GetDataType();
float qScale = inputTensorInfo.GetQuantizationScale();
float qOffset = inputTensorInfo.GetQuantizationOffset();
armnn::TensorInfo scratchBufferTensorInfo({batchSize, numUnits * 3}, dataType, qScale, qOffset);
if (!desc.m_CifgEnabled)
{
scratchBufferTensorInfo = armnn::TensorInfo({batchSize, numUnits * 4}, dataType, qScale, qOffset);
}
armnn::TensorInfo cellStateOutTensorInfo({batchSize, numUnits},
cellStateInInfo.GetDataType(),
cellStateInInfo.GetQuantizationScale(),
cellStateInInfo.GetQuantizationOffset());
armnn::TensorInfo outputStateOutTensorInfo({batchSize, outputSize}, dataType, qScale, qOffset);
armnn::LstmInputParamsInfo paramsInfo;
paramsInfo.m_InputToForgetWeights = &(params.m_InputToForgetWeights->GetInfo());
paramsInfo.m_InputToCellWeights = &(params.m_InputToCellWeights->GetInfo());
paramsInfo.m_InputToOutputWeights = &(params.m_InputToOutputWeights->GetInfo());
paramsInfo.m_RecurrentToForgetWeights = &(params.m_RecurrentToForgetWeights->GetInfo());
paramsInfo.m_RecurrentToCellWeights = &(params.m_RecurrentToCellWeights->GetInfo());
paramsInfo.m_RecurrentToOutputWeights = &(params.m_RecurrentToOutputWeights->GetInfo());
paramsInfo.m_ForgetGateBias = &(params.m_ForgetGateBias->GetInfo());
paramsInfo.m_CellBias = &(params.m_CellBias->GetInfo());
paramsInfo.m_OutputGateBias = &(params.m_OutputGateBias->GetInfo());
if (!desc.m_CifgEnabled)
{
paramsInfo.m_InputToInputWeights = &(params.m_InputToInputWeights->GetInfo());
paramsInfo.m_RecurrentToInputWeights = &(params.m_RecurrentToInputWeights->GetInfo());
if (params.m_CellToInputWeights != nullptr)
{
paramsInfo.m_CellToInputWeights = &(params.m_CellToInputWeights->GetInfo());
}
paramsInfo.m_InputGateBias = &(params.m_InputGateBias->GetInfo());
}
if (desc.m_ProjectionEnabled)
{
paramsInfo.m_ProjectionWeights = &(params.m_ProjectionWeights->GetInfo());
if (params.m_ProjectionBias != nullptr)
{
paramsInfo.m_ProjectionBias = &(params.m_ProjectionBias->GetInfo());
}
}
if (desc.m_PeepholeEnabled)
{
paramsInfo.m_CellToForgetWeights = &(params.m_CellToForgetWeights->GetInfo());
paramsInfo.m_CellToOutputWeights = &(params.m_CellToOutputWeights->GetInfo());
}
if (desc.m_LayerNormEnabled)
{
if(!desc.m_CifgEnabled)
{
paramsInfo.m_InputLayerNormWeights = &(params.m_InputLayerNormWeights->GetInfo());
}
paramsInfo.m_ForgetLayerNormWeights = &(params.m_ForgetLayerNormWeights->GetInfo());
paramsInfo.m_CellLayerNormWeights = &(params.m_CellLayerNormWeights->GetInfo());
paramsInfo.m_OutputLayerNormWeights = &(params.m_OutputLayerNormWeights->GetInfo());
}
auto layerName = fmt::format("UnidirectionalSequenceLSTM:{}:{}", subgraphIndex, operatorIndex);
armnn::IConnectableLayer* layer = m_Network->AddUnidirectionalSequenceLstmLayer(desc, params);
if (!layer)
{
throw NullPointerException(fmt::format("Layer {} pointer is null {}",
operatorIndex, CHECK_LOCATION().AsString()));
}
// register the input connection slots for the layer, connections are made after all layers have been created
// only the tensors for the inputs are relevant, exclude the const tensors
auto inputTensorIndexes = AsUnsignedVector({operatorPtr->inputs[0],
operatorPtr->inputs[18],
operatorPtr->inputs[19]});
RegisterInputSlots(subgraphIndex, operatorIndex, layer, {inputTensorIndexes[0],
inputTensorIndexes[1],
inputTensorIndexes[2]});
auto outputTensorIndexes = AsUnsignedVector(GetOutputTensorIds(m_Model, subgraphIndex, operatorIndex));
layer->GetOutputSlot(0).SetTensorInfo(outputStateOutTensorInfo);
layer->GetOutputSlot(1).SetTensorInfo(cellStateOutTensorInfo);
layer->GetOutputSlot(2).SetTensorInfo(outputTensorInfo);
unsigned int tensorIndex = outputTensorIndexes[0];
armnn::IOutputSlot* slot = &(layer->GetOutputSlot(2));
RegisterProducerOfTensor(subgraphIndex, tensorIndex, slot);
}
void TfLiteParserImpl::ParseUnpack(size_t subgraphIndex, size_t operatorIndex)
{
CHECK_MODEL(m_Model, subgraphIndex, operatorIndex);
const auto& operatorPtr = m_Model->subgraphs[subgraphIndex]->operators[operatorIndex];
const auto* options = operatorPtr->builtin_options.AsUnpackOptions();
// This unpackAxis indicates the axis to unpack
const unsigned int unpackAxis = CHECKED_NON_NEGATIVE(options->axis);
auto inputs = GetInputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(inputs.size(), 1);
armnn::TensorInfo inputTensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 0);
if (unpackAxis >= inputTensorInfo.GetNumDimensions())
{
throw ParseException(
fmt::format("The unpack axis: {} cannot be greater than or equal to "
"the number of input dimension {} {}",
unpackAxis,
inputTensorInfo.GetNumDimensions(),
CHECK_LOCATION().AsString()));
}
unsigned int unpackNum = CHECKED_NON_NEGATIVE(options->num);
// If num is not defined, infer it automatically from the length of the dimension along the unpack axis.
if(unpackNum == 0)
{
unpackNum = inputTensorInfo.GetShape()[unpackAxis];
}
// If unpack number cannot be inferred and is still zero, throw ParseException.
if(unpackNum == 0)
{
throw ParseException("Number to unpack must greater than zero.");
}
auto outputs = GetOutputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(outputs.size(), unpackNum);
auto inputDimSize = inputTensorInfo.GetNumDimensions();
std::vector<unsigned int> unpackDimSizes(inputDimSize);
// Add current input shape to unpackDimSizes
for (unsigned int i = 0; i < inputDimSize; ++i)
{
unpackDimSizes[i] = inputTensorInfo.GetShape()[i];
}
if (unpackDimSizes[unpackAxis] != unpackNum)
{
throw ParseException("Number to unpack must be the same as length of the dimension to "
"unpack along.");
}
unpackDimSizes[unpackAxis] /= unpackNum;
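// The dimension length equals unpackNum, so each splitter view has size 1 along the unpack axis;
// the reshape layers created below then drop that dimension. Illustrative values (not from the
// model): a {3, 4} input unpacked along axis 0 yields three {1, 4} views, each reshaped to {4}.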
SplitterDescriptor splitDesc(unpackNum, static_cast<unsigned int>(unpackDimSizes.size()));
for (unsigned int j = 0; j < unpackNum; ++j)
{
// Set the size of the views.
for (unsigned int dimIdx = 0; dimIdx < unpackDimSizes.size(); ++dimIdx)
{
splitDesc.SetViewSize(j, dimIdx, unpackDimSizes[dimIdx]);
}
splitDesc.SetViewOriginCoord(j, unpackAxis, unpackDimSizes[unpackAxis] * j);
}
splitDesc.SetAxis(unpackAxis);
auto layerName = fmt::format("Unpack:{}:{}", subgraphIndex, operatorIndex);
IConnectableLayer* layer = m_Network->AddSplitterLayer(splitDesc, layerName.c_str());
if (!layer)
{
throw NullPointerException(fmt::format("Layer {} pointer is null {}",
operatorIndex, CHECK_LOCATION().AsString()));
}
TensorShape splitOutShape = TensorShape(static_cast<unsigned int>(unpackDimSizes.size()),
unpackDimSizes.data());
auto inputTensorIndexes = AsUnsignedVector(GetInputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterInputSlots(subgraphIndex, operatorIndex, layer, {inputTensorIndexes[0]});
std::vector<unsigned int> reshapeDims;
for (unsigned int axis = 0; axis < splitOutShape.GetNumDimensions(); ++axis)
{
if (axis != unpackAxis)
{
reshapeDims.push_back(splitOutShape[axis]);
}
}
TensorShape reshapeOutputShape(splitOutShape.GetNumDimensions() -1, reshapeDims.data());
// Create reshape to remove the unpacked dimension for unpack operator of each output from Splitter.
for (unsigned int k = 0; k < layer->GetNumOutputSlots(); ++k)
{
armnn::TensorInfo outputTensorInfo = ToTensorInfo(outputs[k], true);
std::string reshapeLayerName = fmt::format("Reshape_for:{}", layer->GetName());
armnn::ReshapeDescriptor desc;
desc.m_TargetShape = reshapeOutputShape;
armnn::IConnectableLayer* reshapeLayer = m_Network->AddReshapeLayer(desc, reshapeLayerName.c_str());
layer->GetOutputSlot(k).SetTensorInfo(armnn::TensorInfo(splitOutShape,
outputTensorInfo.GetDataType(),
outputTensorInfo.GetQuantizationScale(),
outputTensorInfo.GetQuantizationOffset()));
layer->GetOutputSlot(k).Connect(reshapeLayer->GetInputSlot(0));
reshapeLayer->GetOutputSlot(0).SetTensorInfo(outputTensorInfo);
uint32_t reshapedOutputId = CHECKED_NON_NEGATIVE(operatorPtr->outputs[k]);
armnn::IOutputSlot* slot = &(reshapeLayer->GetOutputSlot(0));
RegisterProducerOfTensor(subgraphIndex, reshapedOutputId, slot);
}
}
void TfLiteParserImpl::ParseSplit(size_t subgraphIndex, size_t operatorIndex)
{
CHECK_MODEL(m_Model, subgraphIndex, operatorIndex);
const auto& operatorPtr = m_Model->subgraphs[subgraphIndex]->operators[operatorIndex];
const auto* options = operatorPtr->builtin_options.AsSplitOptions();
const unsigned int numSplits = CHECKED_NON_NEGATIVE(options->num_splits);
// If number of splits cannot be inferred and is zero, throw ParseException.
if(numSplits == 0)
{
throw ParseException("Number to splits must greater than zero.");
}
auto inputs = GetInputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(inputs.size(), 2);
auto outputs = GetOutputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(outputs.size(), numSplits);
armnn::TensorInfo inputTensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 1);
armnn::TensorInfo axisTensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 0);
if (axisTensorInfo.GetNumElements() != 1)
{
throw ParseException(fmt::format("Axis tensor can only have 1 element {}",
CHECK_LOCATION().AsString()));
}
BufferRawPtr axisBufferPtr = GetBuffer(m_Model, inputs[0]->buffer);
if (axisBufferPtr == nullptr)
{
throw ParseException(
fmt::format("Operation has invalid inputs. Failed to read axis. {}",
CHECK_LOCATION().AsString()));
}
std::vector<int32_t> axisData(axisTensorInfo.GetNumElements());
::memcpy(axisData.data(), axisBufferPtr->data.data(), axisTensorInfo.GetNumBytes());
int32_t axis = axisData[0];
auto inputDimensions = static_cast<int32_t>(inputTensorInfo.GetNumDimensions());
if (((axis < -inputDimensions) && (axis < 0)) || ((axis >= inputDimensions) && (axis > 0)))
{
// Square bracket denotes inclusive n while parenthesis denotes exclusive n
// E.g. Rank 4 tensor can have axis in range [-4, 3)
// -1 == 3, -2 == 2, -3 == 1, -4 == 0
throw ParseException(
fmt::format("Operation has invalid axis: {}. Axis must be in range [-n, n) {}",
axis,
CHECK_LOCATION().AsString()));
}
const unsigned int splitDim = armnnUtils::GetUnsignedAxis(inputTensorInfo.GetNumDimensions(), axis);
auto inputDimSize = inputTensorInfo.GetNumDimensions();
if (inputDimSize > MaxNumOfTensorDimensions)
{
throw ParseException(
fmt::format("The number of dimensions: {} for input tensors of the split op cannot be greater than {} {}",
inputTensorInfo.GetNumDimensions(),
MaxNumOfTensorDimensions,
CHECK_LOCATION().AsString()));
}
std::vector<unsigned int> splitterDimSizes(inputDimSize);
// Add current input shape to splitterDimSizes
for (unsigned int i = 0; i < inputDimSize; ++i)
{
splitterDimSizes[i] = inputTensorInfo.GetShape()[i];
}
if (splitterDimSizes[splitDim] % numSplits != 0)
{
throw ParseException("Number of splits must evenly divide the dimension");
}
splitterDimSizes[splitDim] /= numSplits;
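// Illustrative values (not from the model): splitting a {4, 6} input into 3 along axis 1 gives
// views of shape {4, 2} with origins at columns 0, 2 and 4.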
SplitterDescriptor splitDesc(numSplits, inputDimSize);
for (unsigned int j = 0; j < numSplits; ++j)
{
// Set the size of the views.
for (unsigned int dimIdx = 0; dimIdx < splitterDimSizes.size(); ++dimIdx)
{
splitDesc.SetViewSize(j, dimIdx, splitterDimSizes[dimIdx]);
}
splitDesc.SetViewOriginCoord(j, splitDim, splitterDimSizes[splitDim] * j);
}
if (axisTensorInfo.GetNumElements() == 1)
{
splitDesc.SetAxis(axis);
}
auto layerName = fmt::format("Split:{}:{}", subgraphIndex, operatorIndex);
IConnectableLayer* layer = m_Network->AddSplitterLayer(splitDesc, layerName.c_str());
if (!layer)
{
throw NullPointerException(fmt::format("Layer {} pointer is null {}",
operatorIndex, CHECK_LOCATION().AsString()));
}
auto inputTensorIndexes = AsUnsignedVector(GetInputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterInputSlots(subgraphIndex, operatorIndex, layer, {inputTensorIndexes[1]});
for (unsigned int k = 0; k < layer->GetNumOutputSlots(); ++k)
{
armnn::TensorInfo tensorInfo = ToTensorInfo(outputs[k], true);
layer->GetOutputSlot(k).SetTensorInfo(tensorInfo);
}
auto outputTensorIndexes = AsUnsignedVector(GetOutputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterOutputSlots(subgraphIndex, operatorIndex, layer, outputTensorIndexes);
}
unsigned int ComputeWrappedIndex(int idx, unsigned int numDimsIn)
{
int numDims = armnn::numeric_cast<int>(numDimsIn);
int v = idx < 0 ? numDims + idx : idx;
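// e.g. idx = -1 with 4 dimensions wraps to 3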
if (v < 0 || v > numDims)
{
throw ParseException(fmt::format("Unable to compute index {}", CHECK_LOCATION().AsString()));
}
return static_cast<unsigned int>(v);
}
void TfLiteParserImpl::ParseSplitV(size_t subgraphIndex, size_t operatorIndex)
{
CHECK_MODEL(m_Model, subgraphIndex, operatorIndex);
const auto& operatorPtr = m_Model->subgraphs[subgraphIndex]->operators[operatorIndex];
const auto* options = operatorPtr->builtin_options.AsSplitVOptions();
auto inputs = GetInputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(inputs.size(), 3);
auto& inputTensor = inputs[0];
auto& splitsTensor = inputs[1];
auto& axisTensor = inputs[2];
armnn::TensorInfo inputTensorInfo = ToTensorInfo(inputTensor);
armnn::TensorInfo splitsInfo = ToTensorInfo(splitsTensor);
armnn::TensorInfo axisTensorInfo = ToTensorInfo(axisTensor);
if (axisTensorInfo.GetNumElements() != 1)
{
throw ParseException(fmt::format("Axis tensor can only have 1 element {}",
CHECK_LOCATION().AsString()));
}
// Inputs
auto inputDimSize = inputTensorInfo.GetNumDimensions();
if (inputDimSize > MaxNumOfTensorDimensions)
{
throw ParseException(
fmt::format("The number of dimensions: {} for input tensors of the "
"SplitV op cannot be greater than {} {}",
inputTensorInfo.GetNumDimensions(),
MaxNumOfTensorDimensions,
CHECK_LOCATION().AsString()));
}
// Get split axis
BufferRawPtr axisBufferPtr = GetBuffer(m_Model, axisTensor->buffer);
if (axisBufferPtr == nullptr)
{
throw ParseException(
fmt::format("Operation has invalid inputs. Failed to read axis. {}",
CHECK_LOCATION().AsString()));
}
std::vector<int> axisData(axisTensorInfo.GetNumElements());
::memcpy(axisData.data(), axisBufferPtr->data.data(), axisTensorInfo.GetNumBytes());
int32_t axis = axisData[0];
auto inputDimensions = static_cast<int32_t>(inputTensorInfo.GetNumDimensions());
if (((axis < -inputDimensions) && (axis < 0)) || ((axis >= inputDimensions) && (axis > 0)))
{
// Square bracket denotes inclusive n while parenthesis denotes exclusive n
// E.g. Rank 4 tensor can have axis in range [-4, 3)
// -1 == 3, -2 == 2, -3 == 1, -4 == 0
throw ParseException(
fmt::format("Operation has invalid axis: {}. Axis must be in range [-n, n) {}",
axis,
CHECK_LOCATION().AsString()));
}
const unsigned int splitDim = ComputeWrappedIndex(axis, inputTensorInfo.GetNumDimensions());
// Set split sizes
CHECK_VALID_SIZE(splitsInfo.GetNumDimensions(), 1);
unsigned int numSplits{0};
if(options)
{
numSplits = CHECKED_NON_NEGATIVE(options->num_splits);
}
else
{
numSplits = splitsInfo.GetNumElements();
}
if (numSplits <=0)
{
throw ParseException("SplitV has invalid number of splits");
}
std::vector<int> splitsData(numSplits);
BufferRawPtr splitsBufferPtr = GetBuffer(m_Model, splitsTensor->buffer);
::memcpy(splitsData.data(), splitsBufferPtr->data.data(), splitsInfo.GetNumBytes());
unsigned int idx = 0;
int numInferred{0};
unsigned int inferIdx{0};
int splitSum{0};
for (auto split : splitsData)
{
if (split < 0)
{
numInferred++;
inferIdx = idx;
}
else
{
splitSum += split;
}
idx++;
}
// Check for an inferred split size
if (numInferred == 0)
{
if (splitSum != armnn::numeric_cast<int>(inputTensorInfo.GetShape()[splitDim]))
{
throw ParseException("SplitV split_sizes does not sum to the dimension of value along split_dim.");
}
}
else if (numInferred == 1)
{
splitsData[inferIdx] = armnn::numeric_cast<int>(inputTensorInfo.GetShape()[splitDim]) - splitSum;
}
else
{
throw ParseException("Cannot infer split size for more than one split");
}
// Output size validation
auto outputs = GetOutputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(outputs.size(), numSplits);
// Setup Armnn descriptor
SplitterDescriptor splitDesc(numSplits, inputDimSize);
unsigned int accumSplit = 0;
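// Each output view spans the full extent of every dimension except the split dimension,
// where it takes its own split size and a running origin offset.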
for (unsigned int j = 0; j < numSplits; ++j)
{
unsigned int splitSize = armnn::numeric_cast<unsigned int>(splitsData[j]);
// Set the size of the views.
for (unsigned int dimIdx = 0; dimIdx < inputTensorInfo.GetNumDimensions(); ++dimIdx)
{
unsigned int dimSize = inputTensorInfo.GetShape()[dimIdx];
if (dimIdx == splitDim)
{
dimSize = splitSize;
}
splitDesc.SetViewSize(j, dimIdx, dimSize);
}
splitDesc.SetViewOriginCoord(j, splitDim, accumSplit);
accumSplit += splitSize;
}
splitDesc.SetAxis(axis);
auto layerName = fmt::format("SplitV:{}:{}", subgraphIndex, operatorIndex);
IConnectableLayer* layer = m_Network->AddSplitterLayer(splitDesc, layerName.c_str());
if (!layer)
{
throw NullPointerException(fmt::format("Layer {} pointer is null {}",
operatorIndex, CHECK_LOCATION().AsString()));
}
auto inputTensorIndexes = AsUnsignedVector(GetInputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterInputSlots(subgraphIndex, operatorIndex, layer, {inputTensorIndexes[0]});
for (unsigned int k = 0; k < layer->GetNumOutputSlots(); ++k)
{
armnn::TensorInfo tensorInfo = ToTensorInfo(outputs[k], true);
layer->GetOutputSlot(k).SetTensorInfo(tensorInfo);
}
auto outputTensorIndexes = AsUnsignedVector(GetOutputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterOutputSlots(subgraphIndex, operatorIndex, layer, outputTensorIndexes);
}
void TfLiteParserImpl::ParseArgMin(size_t subgraphIndex, size_t operatorIndex)
{
ParseArgMinMax(subgraphIndex, operatorIndex, armnn::ArgMinMaxFunction::Min);
}
void TfLiteParserImpl::ParseArgMax(size_t subgraphIndex, size_t operatorIndex)
{
ParseArgMinMax(subgraphIndex, operatorIndex, armnn::ArgMinMaxFunction::Max);
}
void TfLiteParserImpl::ParseArgMinMax(size_t subgraphIndex, size_t operatorIndex, ArgMinMaxFunction argMinMaxFunction)
{
CHECK_MODEL(m_Model, subgraphIndex, operatorIndex);
auto inputs = GetInputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(inputs.size(), 2);
auto outputs = GetOutputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(outputs.size(), 1);
armnn::TensorInfo inputTensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 0);
armnn::TensorInfo axisTensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 1);
armnn::TensorInfo outputTensorInfo = ToTensorInfo(outputs[0]);
if (axisTensorInfo.GetNumElements() != 1)
{
throw ParseException(fmt::format("Axis tensor can only have 1 element {}",
CHECK_LOCATION().AsString()));
}
// Check if output tensor type is Signed32 or Signed64
if (outputTensorInfo.GetDataType() != armnn::DataType::Signed32 &&
outputTensorInfo.GetDataType() != armnn::DataType::Signed64)
{
throw ParseException(
fmt::format(
"Output tensor data type is not supported. (Supported types: Signed32 & Signed64) {}",
CHECK_LOCATION().AsString()));
}
// Get const axis value from model and set it to descriptor.
BufferRawPtr axisBufferPtr = GetBuffer(m_Model, inputs[1]->buffer);
if (axisBufferPtr == nullptr)
{
throw ParseException(
fmt::format("Operation has invalid inputs. Failed to read axis. {}",
CHECK_LOCATION().AsString()));
}
std::vector<int32_t> axisData(axisTensorInfo.GetNumElements());
::memcpy(axisData.data(), axisBufferPtr->data.data(), axisTensorInfo.GetNumBytes());
int32_t axis = axisData.front();
auto inputDimensions = static_cast<int32_t>(inputTensorInfo.GetNumDimensions());
if (((axis < -inputDimensions) && (axis < 0)) || ((axis >= inputDimensions) && (axis > 0)))
{
// Square bracket denotes inclusive n while parenthesis denotes exclusive n
// E.g. Rank 4 tensor can have axis in range [-4, 3)
// -1 == 3, -2 == 2, -3 == 1, -4 == 0
throw ParseException(
fmt::format("Operation has invalid axis: {}. Axis must be in range [-n, n) {}",
axis,
CHECK_LOCATION().AsString()));
}
ArgMinMaxDescriptor desc;
desc.m_Axis = axis;
desc.m_Function = argMinMaxFunction;
// Register an ArgMin/ArgMax layer.
auto layerName = argMinMaxFunction == ArgMinMaxFunction::Max ? "ArgMax:{}:{}" : "ArgMin:{}:{}";
auto layerNameFormatted = fmt::format(layerName, subgraphIndex, operatorIndex);
IConnectableLayer *layer = m_Network->AddArgMinMaxLayer(desc, layerNameFormatted.c_str());
if (!layer)
{
throw NullPointerException(fmt::format("Layer {} pointer is null {}",
operatorIndex, CHECK_LOCATION().AsString()));
}
outputTensorInfo = OutputTensorInfoFromInputs(subgraphIndex, operatorIndex, layer, 0, {0});
layer->GetOutputSlot(0).SetTensorInfo(outputTensorInfo);
// Register input tensor to the layer.
auto inputTensorIndexes = AsUnsignedVector(GetInputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterInputSlots(subgraphIndex, operatorIndex, layer, {inputTensorIndexes[0]});
// Register output tensor to the layer.
auto outputTensorIndexes = AsUnsignedVector(GetOutputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterOutputSlots(subgraphIndex, operatorIndex, layer, outputTensorIndexes);
}
void TfLiteParserImpl::ParseGather(size_t subgraphIndex, size_t operatorIndex)
{
CHECK_MODEL(m_Model, subgraphIndex, operatorIndex);
TfLiteParserImpl::TensorRawPtrVector inputs = GetInputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(inputs.size(), 2);
TfLiteParserImpl::TensorRawPtrVector outputs = GetOutputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(outputs.size(), 1);
armnn::TensorInfo inputTensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 0);
armnn::TensorInfo indicesTensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 1);
armnn::TensorInfo outputTensorInfo = ToTensorInfo(outputs[0]);
armnn::GatherDescriptor gatherDescriptor;
const auto& operatorPtr = m_Model->subgraphs[subgraphIndex]->operators[operatorIndex];
const auto* options = operatorPtr->builtin_options.AsGatherOptions();
auto axis = options->axis;
auto layerName = fmt::format("Gather:{}:{}", subgraphIndex, operatorIndex);
auto inputDimensions = static_cast<int32_t>(inputTensorInfo.GetNumDimensions());
auto indicesDimensions = indicesTensorInfo.GetNumDimensions();
auto outputDimensions = outputTensorInfo.GetNumDimensions();
if (((axis < -inputDimensions) && (axis < 0)) || ((axis >= inputDimensions) && (axis > 0)))
{
throw ParseException(
fmt::format("Operation has invalid axis: {} It is out of bounds [ -{}, {} ) {}",
axis,
inputDimensions, inputDimensions,
CHECK_LOCATION().AsString()));
}
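// Gather replaces the axis dimension of the input with the shape of the indices,
// so the output rank must equal inputRank + indicesRank - 1.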
if (outputDimensions != static_cast<unsigned int>(inputDimensions) + indicesDimensions - 1)
{
throw ParseException(
fmt::format("Operation has invalid output dimensions: {} Output must be an ({} + {} - 1) -D tensor {}",
outputDimensions,
inputDimensions, indicesDimensions,
CHECK_LOCATION().AsString()));
}
gatherDescriptor.m_Axis = axis;
IConnectableLayer* layer = m_Network->AddGatherLayer(gatherDescriptor, layerName.c_str());
if (!layer)
{
throw NullPointerException(fmt::format("Layer {} pointer is null {}",
operatorIndex, CHECK_LOCATION().AsString()));
}
outputTensorInfo = OutputTensorInfoFromInputs(subgraphIndex, operatorIndex, layer, 0, {0, 1});
layer->GetOutputSlot(0).SetTensorInfo(outputTensorInfo);
auto inputTensorIndexes = AsUnsignedVector(GetInputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterInputSlots(subgraphIndex, operatorIndex, layer, {inputTensorIndexes[0], inputTensorIndexes[1]});
auto outputTensorIndexes = AsUnsignedVector(GetOutputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterOutputSlots(subgraphIndex, operatorIndex, layer, {outputTensorIndexes[0]});
}
void TfLiteParserImpl::ParseGatherNd(size_t subgraphIndex, size_t operatorIndex)
{
CHECK_MODEL(m_Model, subgraphIndex, operatorIndex);
TfLiteParserImpl::TensorRawPtrVector inputs = GetInputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(inputs.size(), 2);
TfLiteParserImpl::TensorRawPtrVector outputs = GetOutputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(outputs.size(), 1);
armnn::TensorInfo inputTensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 0);
armnn::TensorInfo indicesTensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 1);
auto layerName = fmt::format("GatherNd:{}:{}", subgraphIndex, operatorIndex);
IConnectableLayer* layer = m_Network->AddGatherNdLayer(layerName.c_str());
if (!layer)
{
throw NullPointerException(fmt::format("Layer {} pointer is null {}",
operatorIndex, CHECK_LOCATION().AsString()));
}
TensorInfo outputTensorInfo = OutputTensorInfoFromInputs(subgraphIndex, operatorIndex, layer, 0, {0, 1});
layer->GetOutputSlot(0).SetTensorInfo(outputTensorInfo);
auto inputTensorIndexes = AsUnsignedVector(GetInputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterInputSlots(subgraphIndex, operatorIndex, layer, {inputTensorIndexes[0], inputTensorIndexes[1]});
auto outputTensorIndexes = AsUnsignedVector(GetOutputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterOutputSlots(subgraphIndex, operatorIndex, layer, {outputTensorIndexes[0]});
}
void TfLiteParserImpl::ParseDepthToSpace(size_t subgraphIndex, size_t operatorIndex)
{
CHECK_MODEL(m_Model, subgraphIndex, operatorIndex);
TfLiteParserImpl::TensorRawPtrVector inputs = GetInputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(inputs.size(), 1);
TfLiteParserImpl::TensorRawPtrVector outputs = GetOutputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(outputs.size(), 1);
armnn::DepthToSpaceDescriptor descriptor;
const auto& operatorPtr = m_Model->subgraphs[subgraphIndex]->operators[operatorIndex];
const auto* options = operatorPtr->builtin_options.AsDepthToSpaceOptions();
auto blockSize = options->block_size;
if (blockSize < 2)
{
throw ParseException(
fmt::format("Operation has invalid block size: {} Block size should be >= 2 {}",
blockSize,
CHECK_LOCATION().AsString()));
}
descriptor.m_BlockSize = armnn::numeric_cast<uint32_t>(blockSize);
auto layerName = fmt::format("DepthToSpace:{}:{}", subgraphIndex, operatorIndex);
IConnectableLayer* layer = m_Network->AddDepthToSpaceLayer(descriptor, layerName.c_str());
if (!layer)
{
throw NullPointerException(fmt::format("Layer {} pointer is null {}",
operatorIndex, CHECK_LOCATION().AsString()));
}
TensorInfo outputTensorInfo = OutputTensorInfoFromInputs(subgraphIndex, operatorIndex, layer, 0, {0});
layer->GetOutputSlot(0).SetTensorInfo(outputTensorInfo);
auto inputTensorIndexes = AsUnsignedVector(GetInputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterInputSlots(subgraphIndex, operatorIndex, layer, {inputTensorIndexes[0]});
auto outputTensorIndexes = AsUnsignedVector(GetOutputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterOutputSlots(subgraphIndex, operatorIndex, layer, {outputTensorIndexes[0]});
}
void TfLiteParserImpl::ParseSum(size_t subgraphIndex, size_t operatorIndex)
{
ParseReduce(subgraphIndex, operatorIndex, armnn::ReduceOperation::Sum);
}
void TfLiteParserImpl::ParseReduceProd(size_t subgraphIndex, size_t operatorIndex)
{
ParseReduce(subgraphIndex, operatorIndex, armnn::ReduceOperation::Prod);
}
void TfLiteParserImpl::ParseReduceMax(size_t subgraphIndex, size_t operatorIndex)
{
ParseReduce(subgraphIndex, operatorIndex, armnn::ReduceOperation::Max);
}
void TfLiteParserImpl::ParseReduceMin(size_t subgraphIndex, size_t operatorIndex)
{
ParseReduce(subgraphIndex, operatorIndex, armnn::ReduceOperation::Min);
}
void TfLiteParserImpl::ParseReduce(size_t subgraphIndex, size_t operatorIndex, ReduceOperation reduceOperation)
{
CHECK_MODEL(m_Model, subgraphIndex, operatorIndex);
const auto& operatorPtr = m_Model->subgraphs[subgraphIndex]->operators[operatorIndex];
const auto* options = operatorPtr->builtin_options.AsReducerOptions();
auto inputs = GetInputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(inputs.size(), 2);
auto outputs = GetOutputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(outputs.size(), 1);
auto layerName = fmt::format("Reduce:{}:{}", subgraphIndex, operatorIndex);
armnn::TensorInfo inputTensorInfo0 = InputTensorInfo(subgraphIndex, operatorIndex, 0);
armnn::TensorInfo inputTensorInfo1 = InputTensorInfo(subgraphIndex, operatorIndex, 1);
ReduceDescriptor desc;
BufferRawPtr axisBufferPtr = GetBuffer(m_Model, inputs[1]->buffer);
// Get const axis value from model and set it to descriptor.
if (axisBufferPtr != nullptr)
{
std::vector<int32_t> axisData(inputTensorInfo1.GetNumElements());
::memcpy(axisData.data(), axisBufferPtr->data.data(), inputTensorInfo1.GetNumBytes());
// Convert the axis to unsigned int and remove duplicates.
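// (i + rank) % rank wraps negative axes, e.g. -1 becomes rank - 1.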
auto rank = static_cast<int32_t>(inputTensorInfo0.GetNumDimensions());
std::set<unsigned int> uniqueAxis;
std::transform(axisData.begin(),
axisData.end(),
std::inserter(uniqueAxis, uniqueAxis.begin()),
[rank](int i)->unsigned int{
return static_cast<uint32_t>(((i + rank) % rank)); });
desc.m_vAxis.assign(uniqueAxis.begin(), uniqueAxis.end());
}
else
{
for (uint32_t i = 0; i < inputTensorInfo0.GetNumDimensions(); ++i)
{
desc.m_vAxis.push_back(i);
}
}
desc.m_KeepDims = options->keep_dims;
desc.m_ReduceOperation = reduceOperation;
// Register a new Reduce layer.
IConnectableLayer* layer = m_Network->AddReduceLayer(desc, layerName.c_str());
armnn::TensorInfo outputTensorInfo = OutputTensorInfoFromInputs(subgraphIndex, operatorIndex, layer, 0, {0});
layer->GetOutputSlot(0).SetTensorInfo(outputTensorInfo);
// Register input tensor to the layer.
auto inputTensorIndexes = AsUnsignedVector(GetInputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterInputSlots(subgraphIndex, operatorIndex, layer, {inputTensorIndexes[0]});
// Register output tensor to the layer.
auto outputTensorIndexes = AsUnsignedVector(GetOutputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterOutputSlots(subgraphIndex, operatorIndex, layer, outputTensorIndexes);
}
void TfLiteParserImpl::ParseLocalResponseNormalization(size_t subgraphIndex, size_t operatorIndex)
{
CHECK_MODEL(m_Model, subgraphIndex, operatorIndex);
auto inputs = GetInputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(inputs.size(), 1);
auto outputs = GetOutputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(outputs.size(), 1);
auto layerName = fmt::format("LRN:{}:{}", subgraphIndex, operatorIndex);
std::string layerNameFormatted = fmt::format(layerName, subgraphIndex, operatorIndex);
armnn::TensorInfo inputTensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 0);
const auto& operatorPtr = m_Model->subgraphs[subgraphIndex]->operators[operatorIndex];
const auto* options = operatorPtr->builtin_options.AsLocalResponseNormalizationOptions();
armnn::NormalizationDescriptor descriptor;
descriptor.m_DataLayout = armnn::DataLayout::NHWC;
descriptor.m_NormChannelType = armnn::NormalizationAlgorithmChannel::Across;
descriptor.m_NormMethodType = armnn::NormalizationAlgorithmMethod::LocalBrightness;
descriptor.m_NormSize = static_cast<uint32_t>(options->radius);
descriptor.m_K = options->bias;
descriptor.m_Alpha = options->alpha;
descriptor.m_Beta = options->beta;
// ArmNN expects normSize to be the full size of the normalization
// window rather than the radius as in TfLite.
descriptor.m_NormSize = 1 + (2 * descriptor.m_NormSize);
IConnectableLayer* layer = m_Network->AddNormalizationLayer(descriptor, layerName.c_str());
if (!layer)
{
throw NullPointerException(fmt::format("Layer {} pointer is null {}",
operatorIndex, CHECK_LOCATION().AsString()));
}
TensorInfo outputTensorInfo = OutputTensorInfoFromInputs(subgraphIndex, operatorIndex, layer, 0, {0});
layer->GetOutputSlot(0).SetTensorInfo(outputTensorInfo);
auto inputTensorIndexes = AsUnsignedVector(GetInputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterInputSlots(subgraphIndex, operatorIndex, layer, {inputTensorIndexes[0]});
auto outputTensorIndexes = AsUnsignedVector(GetOutputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterOutputSlots(subgraphIndex, operatorIndex, layer, {outputTensorIndexes[0]});
}
void TfLiteParserImpl::ParseAbs(size_t subgraphIndex, size_t operatorIndex)
{
ParseElementwiseUnary(subgraphIndex, operatorIndex, armnn::UnaryOperation::Abs);
}
void TfLiteParserImpl::ParseCeil(size_t subgraphIndex, size_t operatorIndex)
{
ParseElementwiseUnary(subgraphIndex, operatorIndex, armnn::UnaryOperation::Ceil);
}
void TfLiteParserImpl::ParseExp(size_t subgraphIndex, size_t operatorIndex)
{
ParseElementwiseUnary(subgraphIndex, operatorIndex, armnn::UnaryOperation::Exp);
}
void TfLiteParserImpl::ParseLog(size_t subgraphIndex, size_t operatorIndex)
{
ParseElementwiseUnary(subgraphIndex, operatorIndex, armnn::UnaryOperation::Log);
}
void TfLiteParserImpl::ParseLogicalNot(size_t subgraphIndex, size_t operatorIndex)
{
ParseElementwiseUnary(subgraphIndex, operatorIndex, armnn::UnaryOperation::LogicalNot);
}
void TfLiteParserImpl::ParseNeg(size_t subgraphIndex, size_t operatorIndex)
{
ParseElementwiseUnary(subgraphIndex, operatorIndex, armnn::UnaryOperation::Neg);
}
void TfLiteParserImpl::ParsePower(size_t subgraphIndex, size_t operatorIndex)
{
CHECK_MODEL(m_Model, subgraphIndex, operatorIndex);
auto inputs = GetInputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(inputs.size(), 2);
auto outputs = GetOutputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(outputs.size(), 1);
auto layerName = fmt::format("Power:{}:{}", subgraphIndex, operatorIndex);
TensorInfo inputTensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 0);
TensorInfo input1TensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 1);
CheckMatchingQuantization(inputTensorInfo, input1TensorInfo, layerName, "Input 0", "Input 1");
IConnectableLayer* layer = m_Network->AddElementwiseBinaryLayer(BinaryOperation::Power, layerName.c_str());
if (!layer)
{
throw NullPointerException(fmt::format("Layer {} pointer is null {}",
operatorIndex, CHECK_LOCATION().AsString()));
}
TensorInfo outputTensorInfo = OutputTensorInfoFromInputs(subgraphIndex, operatorIndex, layer, 0, {0, 1});
CheckMatchingQuantization(inputTensorInfo, outputTensorInfo, layerName, "Input 0", "Output 0");
layer->GetOutputSlot(0).SetTensorInfo(outputTensorInfo);
auto inputTensorIndexes = AsUnsignedVector(GetInputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterInputSlots(subgraphIndex, operatorIndex, layer, {inputTensorIndexes[0], inputTensorIndexes[1]});
auto outputTensorIndexes = AsUnsignedVector(GetOutputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterOutputSlots(subgraphIndex, operatorIndex, layer, {outputTensorIndexes[0]});
}
void TfLiteParserImpl::ParseRsqrt(size_t subgraphIndex, size_t operatorIndex)
{
ParseElementwiseUnary(subgraphIndex, operatorIndex, armnn::UnaryOperation::Rsqrt);
}
void TfLiteParserImpl::ParseSin(size_t subgraphIndex, size_t operatorIndex)
{
ParseElementwiseUnary(subgraphIndex, operatorIndex, armnn::UnaryOperation::Sin);
}
void TfLiteParserImpl::ParseSqrt(size_t subgraphIndex, size_t operatorIndex)
{
ParseElementwiseUnary(subgraphIndex, operatorIndex, armnn::UnaryOperation::Sqrt);
}
void TfLiteParserImpl::ParseSquare(size_t subgraphIndex, size_t operatorIndex)
{
CHECK_MODEL(m_Model, subgraphIndex, operatorIndex);
auto inputs = GetInputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(inputs.size(), 1);
auto outputs = GetOutputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(outputs.size(), 1);
armnn::TensorInfo inputTensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 0);
auto layerName = fmt::format("Square:{}:{}", subgraphIndex, operatorIndex);
IConnectableLayer* layer = m_Network->AddElementwiseBinaryLayer(BinaryOperation::Mul, layerName.c_str());
if (!layer)
{
throw NullPointerException(fmt::format("Layer {} pointer is null {}",
operatorIndex, CHECK_LOCATION().AsString()));
}
TensorInfo outputTensorInfo = OutputTensorInfoFromInputs(subgraphIndex, operatorIndex, layer, 0, {0, 0});
CheckMatchingQuantization(inputTensorInfo, outputTensorInfo, layerName, "Input 0", "Output 0");
layer->GetOutputSlot(0).SetTensorInfo(outputTensorInfo);
auto inputTensorIndexes = AsUnsignedVector(GetInputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterInputSlots(subgraphIndex, operatorIndex, layer, {inputTensorIndexes[0], inputTensorIndexes[0]});
auto outputTensorIndexes = AsUnsignedVector(GetOutputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterOutputSlots(subgraphIndex, operatorIndex, layer, {outputTensorIndexes[0]});
}
void TfLiteParserImpl::ParseSquaredDifference(size_t subgraphIndex, size_t operatorIndex)
{
CHECK_MODEL(m_Model, subgraphIndex, operatorIndex);
auto inputs = GetInputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(inputs.size(), 2);
auto outputs = GetOutputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(outputs.size(), 1);
auto layerName = fmt::format("SquaredDifference:{}:{}", subgraphIndex, operatorIndex);
TensorInfo inputTensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 0);
TensorInfo input1TensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 1);
IConnectableLayer* layer = m_Network->AddElementwiseBinaryLayer(BinaryOperation::SqDiff, layerName.c_str());
if (!layer)
{
throw NullPointerException(fmt::format("Layer {} pointer is null {}",
operatorIndex, CHECK_LOCATION().AsString()));
}
TensorInfo outputTensorInfo = OutputTensorInfoFromInputs(subgraphIndex, operatorIndex, layer, 0, {0, 1});
layer->GetOutputSlot(0).SetTensorInfo(outputTensorInfo);
auto inputTensorIndexes = AsUnsignedVector(GetInputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterInputSlots(subgraphIndex, operatorIndex, layer, {inputTensorIndexes[0], inputTensorIndexes[1]});
auto outputTensorIndexes = AsUnsignedVector(GetOutputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterOutputSlots(subgraphIndex, operatorIndex, layer, {outputTensorIndexes[0]});
}
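// Shared handler for all single-input unary operators (Abs, Ceil, Exp, Log, LogicalNot, Neg, Rsqrt, Sin, Sqrt).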
void TfLiteParserImpl::ParseElementwiseUnary(size_t subgraphIndex, size_t operatorIndex, UnaryOperation unaryOperation)
{
CHECK_MODEL(m_Model, subgraphIndex, operatorIndex);
auto inputs = GetInputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(inputs.size(), 1);
auto outputs = GetOutputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(outputs.size(), 1);
std::string layerName = std::string(GetUnaryOperationAsCString(unaryOperation)) + ":{}:{}";
std::string layerNameFormatted = fmt::format(layerName, subgraphIndex, operatorIndex);
ElementwiseUnaryDescriptor desc;
desc.m_Operation = unaryOperation;
IConnectableLayer* layer = m_Network->AddElementwiseUnaryLayer(desc, layerNameFormatted.c_str());
if (!layer)
{
throw NullPointerException(fmt::format("Layer {} pointer is null {}",
operatorIndex, CHECK_LOCATION().AsString()));
}
TensorInfo outputTensorInfo = OutputTensorInfoFromInputs(subgraphIndex, operatorIndex, layer, 0, {0});
layer->GetOutputSlot(0).SetTensorInfo(outputTensorInfo);
auto inputTensorIndexes = AsUnsignedVector(GetInputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterInputSlots(subgraphIndex, operatorIndex, layer, {inputTensorIndexes[0]});
auto outputTensorIndexes = AsUnsignedVector(GetOutputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterOutputSlots(subgraphIndex, operatorIndex, layer, outputTensorIndexes);
}
void TfLiteParserImpl::ParseEqual(size_t subgraphIndex, size_t operatorIndex)
{
ParseComparison(subgraphIndex, operatorIndex, armnn::ComparisonOperation::Equal);
}
void TfLiteParserImpl::ParseNotEqual(size_t subgraphIndex, size_t operatorIndex)
{
ParseComparison(subgraphIndex, operatorIndex, armnn::ComparisonOperation::NotEqual);
}
void TfLiteParserImpl::ParseGreater(size_t subgraphIndex, size_t operatorIndex)
{
ParseComparison(subgraphIndex, operatorIndex, armnn::ComparisonOperation::Greater);
}
void TfLiteParserImpl::ParseGreaterOrEqual(size_t subgraphIndex, size_t operatorIndex)
{
ParseComparison(subgraphIndex, operatorIndex, armnn::ComparisonOperation::GreaterOrEqual);
}
void TfLiteParserImpl::ParseLess(size_t subgraphIndex, size_t operatorIndex)
{
ParseComparison(subgraphIndex, operatorIndex, armnn::ComparisonOperation::Less);
}
void TfLiteParserImpl::ParseLessOrEqual(size_t subgraphIndex, size_t operatorIndex)
{
ParseComparison(subgraphIndex, operatorIndex, armnn::ComparisonOperation::LessOrEqual);
}
void TfLiteParserImpl::ParseComparison(size_t subgraphIndex, size_t operatorIndex,
ComparisonOperation comparisonOperation)
{
CHECK_MODEL(m_Model, subgraphIndex, operatorIndex);
auto inputs = GetInputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(inputs.size(), 2);
auto outputs = GetOutputs(m_Model, subgraphIndex, operatorIndex);
CHECK_VALID_SIZE(outputs.size(), 1);
auto layerName = std::string(GetComparisonOperationAsCString(comparisonOperation)) + ":{}:{}";
std::string layerNameFormatted = fmt::format(layerName, subgraphIndex, operatorIndex);
armnn::TensorInfo inputTensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 0);
armnn::TensorInfo input1TensorInfo = InputTensorInfo(subgraphIndex, operatorIndex, 1);
CheckMatchingQuantization(inputTensorInfo, input1TensorInfo, layerNameFormatted, "Input 0", "Input 1");
ComparisonDescriptor desc;
desc.m_Operation = comparisonOperation;
IConnectableLayer* layer = m_Network->AddComparisonLayer(desc, layerNameFormatted.c_str());
if (!layer)
{
throw NullPointerException(fmt::format("Layer {} pointer is null {}",
operatorIndex, CHECK_LOCATION().AsString()));
}
TensorInfo outputTensorInfo = OutputTensorInfoFromInputs(subgraphIndex, operatorIndex, layer, 0, {0, 1});
layer->GetOutputSlot(0).SetTensorInfo(outputTensorInfo);
auto inputTensorIndexes = AsUnsignedVector(GetInputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterInputSlots(subgraphIndex, operatorIndex, layer, {inputTensorIndexes[0], inputTensorIndexes[1]});
auto outputTensorIndexes = AsUnsignedVector(GetOutputTensorIds(m_Model, subgraphIndex, operatorIndex));
RegisterOutputSlots(subgraphIndex, operatorIndex, layer, {outputTensorIndexes[0]});
}
armnn::IConnectableLayer* TfLiteParserImpl::AddReshapeLayer(armnn::IConnectableLayer* layer,
unsigned int outputSlot,
std::string reshapeLayerName,
armnn::TensorInfo outputShape)
{
ReshapeDescriptor desc;
desc.m_TargetShape = outputShape.GetShape();
IConnectableLayer* reshapeLayer =
m_Network->AddReshapeLayer(desc, reshapeLayerName.c_str());
auto & prevOutputSlot = layer->GetOutputSlot(outputSlot);
prevOutputSlot.Connect(reshapeLayer->GetInputSlot(0));
reshapeLayer->GetOutputSlot(0).SetTensorInfo(outputShape);
return reshapeLayer;
}
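// TfLite operators may carry a fused activation function. Arm NN models this as a separate
// Activation layer appended to the given output slot; NONE simply returns the previous layer.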
armnn::IConnectableLayer* TfLiteParserImpl::AddFusedActivationLayer(armnn::IConnectableLayer* prevLayer,
unsigned int outputSlot,
tflite::ActivationFunctionType activationType)
{
ActivationDescriptor activationDesc;
std::string layerName = prevLayer->GetName();
switch(activationType)
{
case tflite::ActivationFunctionType_NONE:
{
// this is a no-op: return previous layer
return prevLayer;
}
case tflite::ActivationFunctionType_RELU:
{
activationDesc.m_Function = ActivationFunction::ReLu;
layerName += ":RELU";
break;
}
case tflite::ActivationFunctionType_RELU6:
{
activationDesc.m_Function = ActivationFunction::BoundedReLu;
activationDesc.m_A = 6.0f;
activationDesc.m_B = 0.0f;
layerName += ":RELU6";
break;
}
case tflite::ActivationFunctionType_TANH:
{
activationDesc.m_Function = ActivationFunction::TanH;
activationDesc.m_A = 1.0f;
activationDesc.m_B = 1.0f;
layerName += ":TANH";
break;
}
// Listed here only as a reminder of the other activation types we could support.
case tflite::ActivationFunctionType_RELU_N1_TO_1:
case tflite::ActivationFunctionType_SIGN_BIT:
default:
{
throw ParseException(
fmt::format("TfLite parser doesn't support fused activation: "
"{}/{} {} ",
activationType,
tflite::EnumNameActivationFunctionType(activationType),
CHECK_LOCATION().AsString()));
}
}
IConnectableLayer* activationLayer =
m_Network->AddActivationLayer(activationDesc, layerName.c_str());
auto & prevOutputSlot = prevLayer->GetOutputSlot(outputSlot);
prevOutputSlot.Connect(activationLayer->GetInputSlot(0));
activationLayer->GetOutputSlot(0).SetTensorInfo(prevOutputSlot.GetTensorInfo());
return activationLayer;
}
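// Appends a Floor layer to the given output slot; for Signed32 data the Floor is skipped
// and the previous layer is returned unchanged.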
armnn::IConnectableLayer* TfLiteParserImpl::AddFusedFloorLayer(armnn::IConnectableLayer* prevLayer,
unsigned int outputSlot)
{
auto& prevOutputSlot = prevLayer->GetOutputSlot(outputSlot);
DataType dataType = prevOutputSlot.GetTensorInfo().GetDataType();
if (dataType == DataType::Signed32)
{
return prevLayer;
}
std::string layerName = prevLayer->GetName();
IConnectableLayer* floorLayer = m_Network->AddFloorLayer(layerName.c_str());
prevOutputSlot.Connect(floorLayer->GetInputSlot(0));
floorLayer->GetOutputSlot(0).SetTensorInfo(prevOutputSlot.GetTensorInfo());
return floorLayer;
}
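// Reads the whole .tflite file into memory and hands the bytes to LoadModelFromBinary
// for flatbuffer verification and unpacking.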
TfLiteParserImpl::ModelPtr TfLiteParserImpl::LoadModelFromFile(const char* fileName)
{
if (fileName == nullptr)
{
throw InvalidArgumentException(fmt::format("Invalid (null) file name {}",
CHECK_LOCATION().AsString()));
}
std::error_code errorCode;
fs::path pathToFile(fileName);
if (!fs::exists(pathToFile, errorCode))
{
// fmt::format() could not be used here (format error)
std::stringstream msg;
msg << "Cannot find the file (" << fileName << ") errorCode: " << errorCode
<< " " << CHECK_LOCATION().AsString();
throw FileNotFoundException(msg.str());
}
if (!fs::is_regular_file(pathToFile))
{
// Exclude non regular files.
throw InvalidArgumentException(fmt::format("File \"{}\" is not a regular file and cannot be loaded.",
pathToFile.c_str()));
}
std::ifstream file(fileName, std::ios::binary);
std::string fileContent((std::istreambuf_iterator<char>(file)), std::istreambuf_iterator<char>());
return LoadModelFromBinary(reinterpret_cast<const uint8_t *>(fileContent.c_str()),
fileContent.size());
}
TfLiteParserImpl::ModelPtr TfLiteParserImpl::LoadModelFromBinary(const uint8_t* binaryContent, size_t len)
{
if (binaryContent == nullptr)
{
throw InvalidArgumentException(fmt::format("Invalid (null) binary content {}",
CHECK_LOCATION().AsString()));
}
flatbuffers::Verifier verifier(binaryContent, len);
if (verifier.VerifyBuffer<tflite::Model>() == false)
{
throw ParseException(
fmt::format("Buffer doesn't conform to the expected Tensorflow Lite "
"flatbuffers format. size:{} {}",
len,
CHECK_LOCATION().AsString()));
}
return tflite::UnPackModel(binaryContent);
}
TfLiteParserImpl::TensorRawPtrVector TfLiteParserImpl::GetInputs(const ModelPtr& model,
size_t subgraphIndex,
size_t operatorIndex)
{
CHECK_MODEL(model, subgraphIndex, operatorIndex);
const auto& subgraphPtr = model->subgraphs[subgraphIndex];
const auto& operatorPtr = subgraphPtr->operators[operatorIndex];
size_t inputCount = operatorPtr->inputs.size();
TensorRawPtrVector result;
for (size_t i = 0; i < inputCount; ++i)
{
// If the input location is -1 then assume input is turned off.
if (operatorPtr->inputs[i] == -1)
{
continue;
}
else
{
uint32_t inputId = CHECKED_NON_NEGATIVE(operatorPtr->inputs[i]);
result.push_back(subgraphPtr->tensors[inputId].get());
}
}
return result;
}
TfLiteParserImpl::TensorRawPtrVector TfLiteParserImpl::GetOutputs(const ModelPtr& model,
size_t subgraphIndex,
size_t operatorIndex)
{
CHECK_MODEL(model, subgraphIndex, operatorIndex);
const auto& subgraphPtr = model->subgraphs[subgraphIndex];
const auto& operatorPtr = subgraphPtr->operators[operatorIndex];
size_t outputCount = operatorPtr->outputs.size();
TensorRawPtrVector result(outputCount);
for (size_t i = 0; i < outputCount; ++i)
{
uint32_t outputId = CHECKED_NON_NEGATIVE(operatorPtr->outputs[i]);
CHECK_TENSOR(model, subgraphIndex, outputId);
result[i] = subgraphPtr->tensors[outputId].get();
}
return result;
}
TfLiteParserImpl::TensorIdRawPtrVector TfLiteParserImpl::GetSubgraphInputs(const ModelPtr& model,
size_t subgraphIndex)
{
CHECK_SUBGRAPH(model, subgraphIndex);
const auto& subgraphPtr = model->subgraphs[subgraphIndex];
size_t inputCount = subgraphPtr->inputs.size();
TensorIdRawPtrVector result(inputCount);
for (size_t i = 0; i < inputCount; ++i)
{
uint32_t inputId = CHECKED_NON_NEGATIVE(subgraphPtr->inputs[i]);
CHECK_TENSOR(model, subgraphIndex, inputId);
result[i] = std::make_pair(inputId, subgraphPtr->tensors[inputId].get());
}
return result;
}
TfLiteParserImpl::TensorIdRawPtrVector TfLiteParserImpl::GetSubgraphOutputs(const ModelPtr& model,
size_t subgraphIndex)
{
CHECK_SUBGRAPH(model, subgraphIndex);
const auto& subgraphPtr = model->subgraphs[subgraphIndex];
size_t outputCount = subgraphPtr->outputs.size();
TensorIdRawPtrVector result(outputCount);
for (size_t i = 0; i < outputCount; ++i)
{
uint32_t outputId = CHECKED_NON_NEGATIVE(subgraphPtr->outputs[i]);
result[i] = std::make_pair(outputId, subgraphPtr->tensors[outputId].get());
}
return result;
}
std::vector<int32_t>& TfLiteParserImpl::GetInputTensorIds(const ModelPtr& model,
size_t subgraphIndex,
size_t operatorIndex)
{
CHECK_MODEL(model, subgraphIndex, operatorIndex);
const auto& subgraphPtr = model->subgraphs[subgraphIndex];
const auto& operatorPtr = subgraphPtr->operators[operatorIndex];
return operatorPtr->inputs;
}
std::vector<int32_t>& TfLiteParserImpl::GetOutputTensorIds(const ModelPtr& model,
size_t subgraphIndex,
size_t operatorIndex)
{
CHECK_MODEL(model, subgraphIndex, operatorIndex);
const auto& subgraphPtr = model->subgraphs[subgraphIndex];
const auto& operatorPtr = subgraphPtr->operators[operatorIndex];
return operatorPtr->outputs;
}
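// Records which tensor index feeds each of the layer's input slots so that producer and
// consumer slots can be connected once every layer has been created.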
void TfLiteParserImpl::RegisterInputSlots(size_t subgraphIndex,
size_t operatorIndex,
IConnectableLayer* layer,
const std::vector<unsigned int>& tensorIndexes,
unsigned int startingSlotIndex)
{
CHECK_MODEL(m_Model, subgraphIndex, operatorIndex);
if (!layer)
{
throw NullPointerException(fmt::format("Layer {} pointer is null {}",
operatorIndex, CHECK_LOCATION().AsString()));
}
if (tensorIndexes.size() + startingSlotIndex != layer->GetNumInputSlots())
{
throw ParseException(
fmt::format("The number of tensor inputs ({}) does not match the number expected ({})"
" for subgraph:{} operator index:{} {}",
tensorIndexes.size(),
layer->GetNumInputSlots(),
subgraphIndex,
operatorIndex,
CHECK_LOCATION().AsString()));
}
for (unsigned int index = 0; index < tensorIndexes.size() ; ++index)
{
unsigned int tensorIndex = tensorIndexes[index];
armnn::IInputSlot* slot = &(layer->GetInputSlot(startingSlotIndex + index));
RegisterConsumerOfTensor(subgraphIndex, tensorIndex, slot);
}
}
void TfLiteParserImpl::RegisterOutputSlots(size_t subgraphIndex,
size_t operatorIndex,
IConnectableLayer* layer,
const std::vector<unsigned int>& tensorIndexes)
{
CHECK_MODEL(m_Model, subgraphIndex, operatorIndex);
if (!layer)
{
throw NullPointerException(fmt::format("Layer {} pointer is null {}",
operatorIndex, CHECK_LOCATION().AsString()));
}
if (tensorIndexes.size() != layer->GetNumOutputSlots())
{
throw ParseException(
fmt::format("The number of tensor outputs ({}) does not match the number expected ({})"
" for subgraph:{} operator index:{} {}",
tensorIndexes.size(),
layer->GetNumOutputSlots(),
subgraphIndex,
operatorIndex,
CHECK_LOCATION().AsString()));
}
for (unsigned int slotIndex = 0; slotIndex < layer->GetNumOutputSlots(); ++slotIndex)
{
unsigned int tensorIndex = tensorIndexes[slotIndex];
armnn::IOutputSlot* slot = &(layer->GetOutputSlot(slotIndex));
RegisterProducerOfTensor(subgraphIndex, tensorIndex, slot);
}
}
void TfLiteParserImpl::SetupInputLayerTensorInfos(size_t subgraphIndex)
{
CHECK_SUBGRAPH(m_Model, subgraphIndex);
auto inputs = GetSubgraphInputs(m_Model, subgraphIndex);
for (auto const& tensorIdAndPtr : inputs)
{
auto tensorInfo = ToTensorInfo(tensorIdAndPtr.second);
m_TensorInfos.insert({tensorIdAndPtr.first, tensorInfo});
}
}
void TfLiteParserImpl::SetupInputLayers(size_t subgraphIndex)
{
CHECK_SUBGRAPH(m_Model, subgraphIndex);
auto inputs = GetSubgraphInputs(m_Model, subgraphIndex);
for (auto const& tensorIdAndPtr : inputs)
{
auto bindingId = GenerateLayerBindingId(subgraphIndex, tensorIdAndPtr.first);
IConnectableLayer* layer =
m_Network->AddInputLayer(bindingId, tensorIdAndPtr.second->name.c_str());
auto tensorInfo = ToTensorInfo(tensorIdAndPtr.second);
layer->GetOutputSlot(0).SetTensorInfo(tensorInfo);
RegisterOutputSlots(subgraphIndex,
VIRTUAL_OPERATOR_ID,
layer,
{ static_cast<uint32_t>(tensorIdAndPtr.first) });
}
}
void TfLiteParserImpl::SetupOutputLayers(size_t subgraphIndex)
{
CHECK_SUBGRAPH(m_Model, subgraphIndex);
auto outputs = GetSubgraphOutputs(m_Model, subgraphIndex);
for (auto const& tensorIdAndPtr : outputs)
{
auto bindingId = GenerateLayerBindingId(subgraphIndex, tensorIdAndPtr.first);
IConnectableLayer* layer =
m_Network->AddOutputLayer(bindingId, tensorIdAndPtr.second->name.c_str());
RegisterInputSlots(subgraphIndex,
VIRTUAL_OPERATOR_ID,
layer,
{ static_cast<uint32_t>(tensorIdAndPtr.first) });
}
}
void TfLiteParserImpl::SetupConstantLayerTensorInfos(size_t subgraph)
{
CHECK_SUBGRAPH(m_Model, subgraph);
const auto & subgraphPtr = m_Model->subgraphs[subgraph];
for (unsigned int subgraphIndex = 0; subgraphIndex < m_SubgraphConnections.size(); ++subgraphIndex)
{
for (unsigned int tensorIndex = 0; tensorIndex < m_SubgraphConnections[subgraphIndex].size(); ++tensorIndex)
{
if (m_SubgraphConnections[subgraphIndex][tensorIndex].outputSlot == nullptr &&
m_SubgraphConnections[subgraphIndex][tensorIndex].inputSlots.size() > 0)
{
TensorRawPtr tensorPtr = subgraphPtr->tensors[tensorIndex].get();
armnn::TensorInfo tensorInfo = ToTensorInfo(tensorPtr);
m_TensorInfos.insert({tensorIndex, tensorInfo});
}
}
}
}
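// Tensors that are consumed by at least one layer but produced by none must be constants
// (or explicitly requested constants); a Constant layer is created for each of them.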
void TfLiteParserImpl::SetupConstantLayers(size_t subgraph)
{
CHECK_SUBGRAPH(m_Model, subgraph);
const auto & subgraphPtr = m_Model->subgraphs[subgraph];
for (unsigned int subgraphIndex = 0; subgraphIndex < m_SubgraphConnections.size(); ++subgraphIndex)
{
for (unsigned int tensorIndex = 0; tensorIndex < m_SubgraphConnections[subgraphIndex].size(); ++tensorIndex)
{
if (m_SubgraphConnections[subgraphIndex][tensorIndex].outputSlot == nullptr &&
m_SubgraphConnections[subgraphIndex][tensorIndex].inputSlots.size() > 0)
{
TensorRawPtr tensorPtr = subgraphPtr->tensors[tensorIndex].get();
if (IsConstTensor(tensorPtr))
{
armnn::TensorInfo tensorInfo = ToTensorInfo(tensorPtr);
armnn::DataType dataType = tensorInfo.GetDataType();
if (std::find(m_ConstantsToDequantize.begin(), m_ConstantsToDequantize.end(), tensorPtr->buffer)
!= m_ConstantsToDequantize.end())
{
dataType = DataType::Float32;
}
auto tensorAndData = CreateConstTensorNonPermuted(tensorPtr, tensorInfo, dataType);
std::string layerName = fmt::format("Constant:{}", tensorPtr->name);
IConnectableLayer *layer = m_Network->AddConstantLayer(tensorAndData.first, layerName.c_str());
layer->GetOutputSlot(0).SetTensorInfo(tensorAndData.first.GetInfo());
RegisterOutputSlots(subgraphIndex,
VIRTUAL_OPERATOR_ID,
layer,
{ tensorIndex });
}
else if (ShouldConstantTensorBeCreated(tensorIndex))
{
armnn::TensorInfo tensorInfo = ToTensorInfo(tensorPtr);
armnn::DataType dataType = tensorInfo.GetDataType();
if (std::find(m_ConstantsToDequantize.begin(), m_ConstantsToDequantize.end(), tensorPtr->buffer)
!= m_ConstantsToDequantize.end())
{
dataType = DataType::Float32;
}
// Make sure isConstant flag is set.
tensorInfo.SetConstant();
tensorInfo.SetDataType(dataType);
auto tensorAndData = ConstTensor(tensorInfo, std::vector<uint8_t>(tensorInfo.GetNumBytes()));
std::string layerName = fmt::format("Constant:{}", tensorPtr->name);
IConnectableLayer* layer = m_Network->AddConstantLayer(tensorAndData, layerName.c_str());
layer->GetOutputSlot(0).SetTensorInfo(tensorInfo);
RegisterOutputSlots(subgraphIndex,
VIRTUAL_OPERATOR_ID,
layer,
{tensorIndex});
}
else
{
throw ParseException(
fmt::format("Invalid Tensor: Tensor should be constant. {}",
CHECK_LOCATION().AsString()));
}
}
}
}
}
// example usage: BufferRawPtr bufferPtr = GetBuffer(m_Model, inputs[0]->buffer);
TfLiteParserImpl::BufferRawPtr TfLiteParserImpl::GetBuffer(const ModelPtr& model, size_t bufferIndex)
{
CHECK_BUFFER(model, bufferIndex);
return model->buffers[bufferIndex].get();
}
template<typename T>
std::pair<armnn::ConstTensor, TfLiteParserImpl::SupportedDataStorage>
TfLiteParserImpl::CreateConstTensorAndStoreData(TfLiteParserImpl::BufferRawPtr bufferPtr,
TfLiteParserImpl::TensorRawPtr tensorPtr,
armnn::TensorInfo& tensorInfo,
armnn::Optional<armnn::PermutationVector&> permutationVector)
{
// Make sure isConstant flag is set.
tensorInfo.SetConstant();
auto constData = CreateConstTensorImpl<T>(bufferPtr,
tensorPtr,
tensorInfo,
permutationVector);
TfLiteParserImpl::SupportedDataStorage storage(std::move(constData.second));
return std::make_pair(constData.first, std::move(storage));
}
bool TfLiteParserImpl::ShouldConstantTensorBeCreated(unsigned int tensorIndex)
{
// If the TensorIndex appears in the list of ConstantsToBeCreated then return true
return (std::find(m_ConstantsToBeCreated.begin(), m_ConstantsToBeCreated.end(), tensorIndex)
!= m_ConstantsToBeCreated.end());
}
bool TfLiteParserImpl::IsConstTensor(TensorRawPtr tensorPtr)
{
CHECK_TENSOR_PTR(tensorPtr);
bool isConst = true;
auto buffer = GetBuffer(m_Model, tensorPtr->buffer);
if (buffer->data.size() == 0)
{
isConst = false;
}
return isConst;
}
std::pair<armnn::ConstTensor, TfLiteParserImpl::SupportedDataStorage>
TfLiteParserImpl::CreateConstTensorPermuted(TensorRawPtr tensorPtr,
armnn::TensorInfo& tensorInfo,
armnn::Optional<armnn::PermutationVector&> permutationVector)
{
CHECK_TENSOR_PTR(tensorPtr);
auto bufferPtr = GetBuffer(m_Model, tensorPtr->buffer);
CHECK_BUFFER_SIZE(bufferPtr, tensorInfo, tensorPtr->buffer);
// Make sure isConstant flag is set.
tensorInfo.SetConstant();
switch (tensorInfo.GetDataType())
{
case armnn::DataType::Float32:
return CreateConstTensorAndStoreData<float>(bufferPtr,
tensorPtr,
tensorInfo,
permutationVector);
case armnn::DataType::QAsymmU8:
return CreateConstTensorAndStoreData<uint8_t>(bufferPtr,
tensorPtr,
tensorInfo,
permutationVector);
case armnn::DataType::QSymmS8:
return CreateConstTensorAndStoreData<int8_t>(bufferPtr,
tensorPtr,
tensorInfo,
permutationVector);
case armnn::DataType::QAsymmS8:
return CreateConstTensorAndStoreData<int8_t>(bufferPtr,
tensorPtr,
tensorInfo,
permutationVector);
case armnn::DataType::Signed32:
return CreateConstTensorAndStoreData<int32_t>(bufferPtr,
tensorPtr,
tensorInfo,
permutationVector);
default:
{
std::stringstream errString;
errString << "Unexpected datatype when creating const tensor: "
<< armnn::GetDataTypeName(tensorInfo.GetDataType())
<< " shape:" << tensorInfo.GetShape()
<< CHECK_LOCATION().AsString();
throw ParseException(errString.str());
}
}
}
armnn::ConstTensor TfLiteParserImpl::CreateConstTensorNonPermuted(TensorRawPtr tensorPtr,
armnn::TensorInfo& tensorInfo)
{
CHECK_TENSOR_PTR(tensorPtr);
auto bufferPtr = GetBuffer(m_Model, tensorPtr->buffer);
CHECK_BUFFER_SIZE(bufferPtr, tensorInfo, tensorPtr->buffer);
// Make sure isConstant flag is set.
tensorInfo.SetConstant();
return ConstTensor(tensorInfo, bufferPtr->data.data());
}
std::pair<armnn::ConstTensor, std::unique_ptr<float[]>>
TfLiteParserImpl::CreateConstTensorNonPermuted(TensorRawPtr tensorPtr,
armnn::TensorInfo& tensorInfo,
armnn::DataType inputDataType)
{
CHECK_TENSOR_PTR(tensorPtr);
auto bufferPtr = GetBuffer(m_Model, tensorPtr->buffer);
CHECK_BUFFER_SIZE(bufferPtr, tensorInfo, tensorPtr->buffer);
// Make sure isConstant flag is set.
tensorInfo.SetConstant();
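// If the layer input is Float32 but the constant tensor is not, convert the constant data
// to Float32 so the two data types match.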
if (inputDataType == DataType::Float32 && tensorInfo.GetDataType() != DataType::Float32)
{
try
{
TensorInfo constTensorInfo(tensorInfo.GetShape(), DataType::Float32, 0.0f, 0, true);
std::unique_ptr<float[]> data = armnnUtils::ToFloatArray(bufferPtr->data, tensorInfo);
return std::make_pair(ConstTensor(constTensorInfo, data.get()), std::move(data));
}
catch (InvalidArgumentException&)
{
throw ParseException(
fmt::format("Unsupported input/weights combination: Input {} not supported with Weights {}",
GetDataTypeName(DataType::Float32),
GetDataTypeName(tensorInfo.GetDataType()),
CHECK_LOCATION().AsString()));
}
}
else
{
return std::make_pair(ConstTensor(tensorInfo, bufferPtr->data.data()), std::unique_ptr<float[]>());
}
}
std::pair<armnn::ConstTensor*, std::unique_ptr<float[]>>
TfLiteParserImpl::CreateConstTensorPtr(TensorRawPtr tensorPtr, armnn::TensorInfo& inputTensorInfo)
{
CHECK_TENSOR_PTR(tensorPtr);
armnn::TensorInfo tensorInfo = ToTensorInfo(tensorPtr);
auto bufferPtr = GetBuffer(m_Model, tensorPtr->buffer);
CHECK_BUFFER_SIZE(bufferPtr, tensorInfo, tensorPtr->buffer);
// Make sure isConstant flag is set.
tensorInfo.SetConstant();
if (inputTensorInfo.GetDataType() == DataType::Float32 && tensorInfo.GetDataType() != DataType::Float32)
{
try
{
TensorInfo constTensorInfo(tensorInfo.GetShape(), DataType::Float32, 0.0f, 0, true);
std::unique_ptr<float[]> data = armnnUtils::ToFloatArray(bufferPtr->data, tensorInfo);
return std::make_pair(new ConstTensor(constTensorInfo, data.get()), std::move(data));
}
catch (InvalidArgumentException&)
{
throw ParseException(
fmt::format("Unsupported input/weights combination: Input {} not supported with Weights {}",
GetDataTypeName(DataType::Float32),
GetDataTypeName(tensorInfo.GetDataType()),
CHECK_LOCATION().AsString()));
}
}
else
{
return std::make_pair(new ConstTensor(tensorInfo, bufferPtr->data.data()), std::unique_ptr<float[]>());
}
}
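// Illustrative usage sketch (the file name and tensor name below are placeholders, and the
// default, empty parser options are assumed):
//   ITfLiteParserPtr parser = ITfLiteParser::Create();
//   armnn::INetworkPtr network = parser->CreateNetworkFromBinaryFile("model.tflite");
//   BindingPointInfo inputInfo = parser->GetNetworkInputBindingInfo(0, "input_tensor_name");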
BindingPointInfo TfLiteParserImpl::GetNetworkInputBindingInfo(size_t subgraphId,
const std::string& name) const
{
CHECK_SUBGRAPH(m_Model, subgraphId);
auto inputs = GetSubgraphInputs(m_Model, subgraphId);
for (auto const& input : inputs)
{
if (input.second->name == name)
{
auto bindingId = GenerateLayerBindingId(subgraphId, input.first);
auto inputTensorInfo = ToTensorInfo(input.second);
// Input tensors are always treated as constant tensors during network execution.
inputTensorInfo.SetConstant(true);
return std::make_pair(bindingId, inputTensorInfo);
}
}
std::stringstream bindings;
for (auto const& input : inputs)
{
bindings << "'" << input.second->name << "' ";
}
throw ParseException(
fmt::format("No input binding found for subgraph:{} and name:{}. "
"Possible inputs are: [{}] {}",
subgraphId,
name,
bindings.str(),
CHECK_LOCATION().AsString()));
}
BindingPointInfo TfLiteParserImpl::GetNetworkOutputBindingInfo(size_t subgraphId,
const std::string& name) const
{
CHECK_SUBGRAPH(m_Model, subgraphId);
auto outputs = GetSubgraphOutputs(m_Model, subgraphId);
for (unsigned int i = 0; i < outputs.size(); ++i)
{
auto const output = outputs[i];
if (output.second->name == name)
{
auto bindingId = GenerateLayerBindingId(subgraphId, output.first);
std::vector<unsigned int> shape = m_OverriddenOutputShapes.size() > 0 ?
m_OverriddenOutputShapes[i] : AsUnsignedVector(output.second->shape);
return std::make_pair(bindingId, ToTensorInfo(output.second, shape));
}
}
std::stringstream bindings;
for (auto const& output : outputs)
{
bindings << "'" << output.second->name << "' ";
}
throw ParseException(
fmt::format("No output binding found for subgraph:{} and name:{}. "
"Possible outputs are: [{}] {}",
subgraphId,
name,
bindings.str(),
CHECK_LOCATION().AsString()));
}
size_t TfLiteParserImpl::GetSubgraphCount() const
{
return m_Model->subgraphs.size();
}
std::vector<std::string> TfLiteParserImpl::GetSubgraphInputTensorNames(size_t subgraphId) const
{
CHECK_SUBGRAPH(m_Model, subgraphId);
auto inputs = GetSubgraphInputs(m_Model, subgraphId);
std::vector<std::string> result;
result.reserve(inputs.size());
for (auto const& input : inputs)
{
result.push_back(input.second->name);
}
return result;
}
std::vector<std::string> TfLiteParserImpl::GetSubgraphOutputTensorNames(size_t subgraphId) const
{
CHECK_SUBGRAPH(m_Model, subgraphId);
auto outputs = GetSubgraphOutputs(m_Model, subgraphId);
std::vector<std::string> result;
result.reserve(outputs.size());
for (auto const& output : outputs)
{
result.push_back(output.second->name);
}
return result;
}
const std::string TfLiteParserImpl::GetVersion()
{
return TFLITE_PARSER_VERSION;
}
TfLiteParserImpl::SupportedDataStorage::SupportedDataStorage(std::unique_ptr<float[]>&& data)
: m_FloatData(std::move(data))
, m_Uint8Data(nullptr)
, m_Int8Data(nullptr)
, m_Int32Data(nullptr)
{
}
TfLiteParserImpl::SupportedDataStorage::SupportedDataStorage(std::unique_ptr<uint8_t[]>&& data)
: m_FloatData(nullptr)
, m_Uint8Data(std::move(data))
, m_Int8Data(nullptr)
, m_Int32Data(nullptr)
{
}
TfLiteParserImpl::SupportedDataStorage::SupportedDataStorage(std::unique_ptr<int8_t[]>&& data)
: m_FloatData(nullptr)
, m_Uint8Data(nullptr)
, m_Int8Data(std::move(data))
, m_Int32Data(nullptr)
{
}
TfLiteParserImpl::SupportedDataStorage::SupportedDataStorage(std::unique_ptr<int32_t[]>&& data)
: m_FloatData(nullptr)
, m_Uint8Data(nullptr)
, m_Int8Data(nullptr)
, m_Int32Data(std::move(data))
{
}
} // armnnTfLiteParser