//
// Copyright © 2020 Arm Ltd and Contributors. All rights reserved.
// SPDX-License-Identifier: MIT
//

#pragma once

#include <armnn_delegate.hpp>

#include <flatbuffers/flatbuffers.h>
#include <tensorflow/lite/interpreter.h>
#include <tensorflow/lite/kernels/register.h>
#include <tensorflow/lite/model.h>
#include <tensorflow/lite/schema/schema_generated.h>
#include <tensorflow/lite/version.h>

#include <doctest/doctest.h>

namespace
{

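// Builds a FlatBuffer model containing a single QUANTIZE or DEQUANTIZE
// operator with one input and one output tensor, and returns the
// serialised model as a byte vector.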
std::vector<char> CreateQuantizationTfLiteModel(tflite::BuiltinOperator quantizationOperatorCode,
                                                tflite::TensorType inputTensorType,
                                                tflite::TensorType outputTensorType,
                                                const std::vector<int32_t>& inputTensorShape,
                                                const std::vector<int32_t>& outputTensorShape,
                                                float quantScale = 1.0f,
                                                int quantOffset = 0)
{
    using namespace tflite;
    flatbuffers::FlatBufferBuilder flatBufferBuilder;

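    // Buffer 0 is the empty buffer reserved by the TfLite schema;
    // both tensors below reference it, as they hold no constant data.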
    std::vector<flatbuffers::Offset<tflite::Buffer>> buffers;
    buffers.push_back(CreateBuffer(flatBufferBuilder, flatBufferBuilder.CreateVector({})));

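    // Per-tensor quantization parameters, shared by the input and output tensors.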
    auto quantizationParameters =
        CreateQuantizationParameters(flatBufferBuilder,
                                     0,
                                     0,
                                     flatBufferBuilder.CreateVector<float>({ quantScale }),
                                     flatBufferBuilder.CreateVector<int64_t>({ quantOffset }),
                                     QuantizationDetails_CustomQuantization);

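    // Tensor 0 is the operator input, tensor 1 the operator output.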
    std::array<flatbuffers::Offset<Tensor>, 2> tensors;
    tensors[0] = CreateTensor(flatBufferBuilder,
                              flatBufferBuilder.CreateVector<int32_t>(inputTensorShape.data(),
                                                                      inputTensorShape.size()),
                              inputTensorType,
                              0,
                              flatBufferBuilder.CreateString("input"),
                              quantizationParameters);
    tensors[1] = CreateTensor(flatBufferBuilder,
                              flatBufferBuilder.CreateVector<int32_t>(outputTensorShape.data(),
                                                                      outputTensorShape.size()),
                              outputTensorType,
                              0,
                              flatBufferBuilder.CreateString("output"),
                              quantizationParameters);

    // Create the operator, selecting the builtin options that match the operator code.
    tflite::BuiltinOptions operatorBuiltinOptionsType = tflite::BuiltinOptions_NONE;
    flatbuffers::Offset<void> operatorBuiltinOptions = 0;
    switch (quantizationOperatorCode)
    {
        case BuiltinOperator_QUANTIZE:
        {
            operatorBuiltinOptionsType = BuiltinOptions_QuantizeOptions;
            operatorBuiltinOptions = CreateQuantizeOptions(flatBufferBuilder).Union();
            break;
        }
        case BuiltinOperator_DEQUANTIZE:
        {
            operatorBuiltinOptionsType = BuiltinOptions_DequantizeOptions;
            operatorBuiltinOptions = CreateDequantizeOptions(flatBufferBuilder).Union();
            break;
        }
        default:
            break;
    }

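    // The operator reads from tensor 0 and writes to tensor 1.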
    const std::vector<int32_t> operatorInputs{0};
    const std::vector<int32_t> operatorOutputs{1};
    flatbuffers::Offset<Operator> quantizationOperator =
        CreateOperator(flatBufferBuilder,
                       0,
                       flatBufferBuilder.CreateVector<int32_t>(operatorInputs.data(), operatorInputs.size()),
                       flatBufferBuilder.CreateVector<int32_t>(operatorOutputs.data(), operatorOutputs.size()),
                       operatorBuiltinOptionsType,
                       operatorBuiltinOptions);

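    // Wrap the single operator in a subgraph whose inputs and outputs
    // are the same tensors as the operator's.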
    const std::vector<int> subgraphInputs{0};
    const std::vector<int> subgraphOutputs{1};
    flatbuffers::Offset<SubGraph> subgraph =
        CreateSubGraph(flatBufferBuilder,
                       flatBufferBuilder.CreateVector(tensors.data(), tensors.size()),
                       flatBufferBuilder.CreateVector<int32_t>(subgraphInputs.data(), subgraphInputs.size()),
                       flatBufferBuilder.CreateVector<int32_t>(subgraphOutputs.data(), subgraphOutputs.size()),
                       flatBufferBuilder.CreateVector(&quantizationOperator, 1));

    flatbuffers::Offset<flatbuffers::String> modelDescription =
        flatBufferBuilder.CreateString("ArmnnDelegate: Quantization Operator Model");
    flatbuffers::Offset<OperatorCode> operatorCode = CreateOperatorCode(flatBufferBuilder, quantizationOperatorCode);

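    // Assemble the model: one operator code, one subgraph and one (empty) buffer.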
    flatbuffers::Offset<Model> flatbufferModel =
        CreateModel(flatBufferBuilder,
                    TFLITE_SCHEMA_VERSION,
                    flatBufferBuilder.CreateVector(&operatorCode, 1),
                    flatBufferBuilder.CreateVector(&subgraph, 1),
                    modelDescription,
                    flatBufferBuilder.CreateVector(buffers.data(), buffers.size()));

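    // Serialise the model and copy it out of the builder's internal buffer.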
    flatBufferBuilder.Finish(flatbufferModel);

    return std::vector<char>(flatBufferBuilder.GetBufferPointer(),
                             flatBufferBuilder.GetBufferPointer() + flatBufferBuilder.GetSize());
}

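// Builds the single-operator model above, runs it on a reference TfLite
// interpreter and on an interpreter using the ArmNN delegate, and checks
// that both produce the expected output values.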
template <typename InputT, typename OutputT>
void QuantizationTest(tflite::BuiltinOperator quantizeOperatorCode,
                      tflite::TensorType inputTensorType,
                      tflite::TensorType outputTensorType,
                      std::vector<armnn::BackendId>& backends,
                      std::vector<int32_t>& inputShape,
                      std::vector<int32_t>& outputShape,
                      std::vector<InputT>& inputValues,
                      std::vector<OutputT>& expectedOutputValues,
                      float quantScale = 1.0f,
                      int quantOffset = 0)
{
    using namespace tflite;
    std::vector<char> modelBuffer = CreateQuantizationTfLiteModel(quantizeOperatorCode,
                                                                  inputTensorType,
                                                                  outputTensorType,
                                                                  inputShape,
                                                                  outputShape,
                                                                  quantScale,
                                                                  quantOffset);

    const Model* tfLiteModel = GetModel(modelBuffer.data());

    // Create two TfLite interpreters: one that will run with the ArmNN delegate
    // and one that runs on the reference TfLite kernels.
    std::unique_ptr<Interpreter> armnnDelegateInterpreter;
    CHECK(InterpreterBuilder(tfLiteModel, ::tflite::ops::builtin::BuiltinOpResolver())
              (&armnnDelegateInterpreter) == kTfLiteOk);
    CHECK(armnnDelegateInterpreter != nullptr);
    CHECK(armnnDelegateInterpreter->AllocateTensors() == kTfLiteOk);

    std::unique_ptr<Interpreter> tfLiteInterpreter;
    CHECK(InterpreterBuilder(tfLiteModel, ::tflite::ops::builtin::BuiltinOpResolver())
              (&tfLiteInterpreter) == kTfLiteOk);
    CHECK(tfLiteInterpreter != nullptr);
    CHECK(tfLiteInterpreter->AllocateTensors() == kTfLiteOk);

    // Create the ArmNN Delegate
    armnnDelegate::DelegateOptions delegateOptions(backends);
    std::unique_ptr<TfLiteDelegate, decltype(&armnnDelegate::TfLiteArmnnDelegateDelete)>
        theArmnnDelegate(armnnDelegate::TfLiteArmnnDelegateCreate(delegateOptions),
                         armnnDelegate::TfLiteArmnnDelegateDelete);
    CHECK(theArmnnDelegate != nullptr);

    // Modify armnnDelegateInterpreter to use the ArmNN delegate
    CHECK(armnnDelegateInterpreter->ModifyGraphWithDelegate(theArmnnDelegate.get()) == kTfLiteOk);

    // Set input data on both interpreters
    auto tfLiteDelegateInputId = tfLiteInterpreter->inputs()[0];
    auto tfLiteDelegateInputData = tfLiteInterpreter->typed_tensor<InputT>(tfLiteDelegateInputId);
    for (unsigned int i = 0; i < inputValues.size(); ++i)
    {
        tfLiteDelegateInputData[i] = inputValues[i];
    }

    auto armnnDelegateInputId = armnnDelegateInterpreter->inputs()[0];
    auto armnnDelegateInputData = armnnDelegateInterpreter->typed_tensor<InputT>(armnnDelegateInputId);
    for (unsigned int i = 0; i < inputValues.size(); ++i)
    {
        armnnDelegateInputData[i] = inputValues[i];
    }

    // Run inference on both interpreters (EnqueueWorkload on the ArmNN side)
    CHECK(tfLiteInterpreter->Invoke() == kTfLiteOk);
    CHECK(armnnDelegateInterpreter->Invoke() == kTfLiteOk);

    // Compare output data
    auto tfLiteDelegateOutputId = tfLiteInterpreter->outputs()[0];
    auto tfLiteDelegateOutputData = tfLiteInterpreter->typed_tensor<OutputT>(tfLiteDelegateOutputId);
    auto armnnDelegateOutputId = armnnDelegateInterpreter->outputs()[0];
    auto armnnDelegateOutputData = armnnDelegateInterpreter->typed_tensor<OutputT>(armnnDelegateOutputId);

    for (size_t i = 0; i < expectedOutputValues.size(); i++)
    {
        CHECK(expectedOutputValues[i] == armnnDelegateOutputData[i]);
        CHECK(tfLiteDelegateOutputData[i] == expectedOutputValues[i]);
        CHECK(tfLiteDelegateOutputData[i] == armnnDelegateOutputData[i]);
    }
}
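
// Example usage, a sketch with illustrative values (assumes the CpuRef
// backend is available; quantized = round(value / scale) + offset):
//
//     std::vector<armnn::BackendId> backends = { armnn::Compute::CpuRef };
//     std::vector<int32_t> shape { 2, 4 };
//     std::vector<float>   input    { 0.5f, 1.0f, 1.5f, 2.0f, 2.5f, 3.0f, 3.5f, 4.0f };
//     std::vector<uint8_t> expected { 1, 2, 3, 4, 5, 6, 7, 8 };
//     QuantizationTest<float, uint8_t>(tflite::BuiltinOperator_QUANTIZE,
//                                      ::tflite::TensorType_FLOAT32,
//                                      ::tflite::TensorType_UINT8,
//                                      backends, shape, shape, input, expected,
//                                      0.5f, 0);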

} // anonymous namespace