blob: 3fc6818b0d4150600dea91b9babb2636d884f46d [file] [log] [blame]
telsoa014fcda012018-03-09 14:13:49 +00001//
2// Copyright © 2017 Arm Ltd. All rights reserved.
David Beckecb56cd2018-09-05 12:52:57 +01003// SPDX-License-Identifier: MIT
telsoa014fcda012018-03-09 14:13:49 +00004//
5#pragma once
6
7#include <armnn/Tensor.hpp>
8#include <armnn/DescriptorsFwd.hpp>
9
10#include <arm_compute/core/ITensor.h>
11#include <arm_compute/core/TensorInfo.h>
surmeh013537c2c2018-05-18 16:31:43 +010012#include <arm_compute/core/Types.h>
Sadik Armaganf4464322018-12-20 16:19:12 +000013#include <arm_compute/core/Size2D.h>
telsoa014fcda012018-03-09 14:13:49 +000014
Mike Kelly0a08ec62019-07-25 08:39:31 +010015#include <Half.hpp>
16
telsoa014fcda012018-03-09 14:13:49 +000017#include <boost/cast.hpp>
18
19namespace armnn
20{
21class ITensorHandle;
22
23namespace armcomputetensorutils
24{
25
telsoa01c577f2c2018-08-31 09:22:23 +010026/// Utility function to map an armnn::DataType to corresponding arm_compute::DataType.
telsoa014fcda012018-03-09 14:13:49 +000027arm_compute::DataType GetArmComputeDataType(armnn::DataType dataType);
28
Matthew Benthamfd899962018-12-31 15:49:42 +000029/// Utility function used to set up an arm_compute::Coordinates from a vector of ArmNN Axes for reduction functions
30arm_compute::Coordinates BuildArmComputeReductionCoordinates(size_t inputDimensions,
31 unsigned int originalInputRank,
32 const std::vector<unsigned int>& armnnAxes);
33
telsoa01c577f2c2018-08-31 09:22:23 +010034/// Utility function used to setup an arm_compute::TensorShape object from an armnn::TensorShape.
telsoa014fcda012018-03-09 14:13:49 +000035arm_compute::TensorShape BuildArmComputeTensorShape(const armnn::TensorShape& tensorShape);
36
37/// Utility function used to setup an arm_compute::ITensorInfo object whose dimensions are based on the given
telsoa01c577f2c2018-08-31 09:22:23 +010038/// armnn::ITensorInfo.
telsoa014fcda012018-03-09 14:13:49 +000039arm_compute::TensorInfo BuildArmComputeTensorInfo(const armnn::TensorInfo& tensorInfo);
40
/// Utility function used to setup an arm_compute::TensorInfo object whose dimensions and data layout
/// are based on the given armnn::TensorInfo and armnn::DataLayout.
44arm_compute::TensorInfo BuildArmComputeTensorInfo(const armnn::TensorInfo& tensorInfo,
45 armnn::DataLayout dataLayout);
46
/// Utility function used to convert an armnn::DataLayout to the corresponding arm_compute::DataLayout.
49arm_compute::DataLayout ConvertDataLayout(armnn::DataLayout dataLayout);
50
/// Utility function used to setup an arm_compute::PoolingLayerInfo object from an
/// armnn::Pooling2dDescriptor and an optional fpMixedPrecision flag.
54arm_compute::PoolingLayerInfo BuildArmComputePoolingLayerInfo(const Pooling2dDescriptor& descriptor,
55 bool fpMixedPrecision = false);
telsoa014fcda012018-03-09 14:13:49 +000056
telsoa01c577f2c2018-08-31 09:22:23 +010057/// Utility function to setup an arm_compute::NormalizationLayerInfo object from an armnn::NormalizationDescriptor.
telsoa014fcda012018-03-09 14:13:49 +000058arm_compute::NormalizationLayerInfo BuildArmComputeNormalizationLayerInfo(const NormalizationDescriptor& desc);
59
telsoa01c577f2c2018-08-31 09:22:23 +010060/// Utility function used to setup an arm_compute::PermutationVector object from an armnn::PermutationVector.
telsoa014fcda012018-03-09 14:13:49 +000061arm_compute::PermutationVector BuildArmComputePermutationVector(const armnn::PermutationVector& vector);
62
Sadik Armaganf4464322018-12-20 16:19:12 +000063/// Utility function used to setup an arm_compute::Size2D object from width and height values.
64arm_compute::Size2D BuildArmComputeSize2D(const unsigned int width, const unsigned int height);
65
Mike Kelly0a08ec62019-07-25 08:39:31 +010066/// Gets the appropriate PixelValue for the input DataType
67arm_compute::PixelValue GetPixelValue(arm_compute::ITensor& input, float pixelValue);
68
telsoa01c577f2c2018-08-31 09:22:23 +010069/// Utility function used to setup an arm_compute::PadStrideInfo object from an armnn layer descriptor.
surmeh013537c2c2018-05-18 16:31:43 +010070template <typename Descriptor>
71arm_compute::PadStrideInfo BuildArmComputePadStrideInfo(const Descriptor &descriptor)
72{
73 return arm_compute::PadStrideInfo(descriptor.m_StrideX,
74 descriptor.m_StrideY,
75 descriptor.m_PadLeft,
76 descriptor.m_PadRight,
77 descriptor.m_PadTop,
78 descriptor.m_PadBottom,
79 arm_compute::DimensionRoundingType::FLOOR);
80}
81
telsoa014fcda012018-03-09 14:13:49 +000082/// Sets up the given ArmCompute tensor's dimensions based on the given ArmNN tensor.
83template <typename Tensor>
84void BuildArmComputeTensor(Tensor& tensor, const armnn::TensorInfo& tensorInfo)
85{
86 tensor.allocator()->init(BuildArmComputeTensorInfo(tensorInfo));
87}
88
Francis Murtagh351d13d2018-09-24 15:01:18 +010089/// Sets up the given ArmCompute tensor's dimensions based on the given ArmNN tensor.
90template <typename Tensor>
91void BuildArmComputeTensor(Tensor& tensor, const armnn::TensorInfo& tensorInfo, DataLayout dataLayout)
92{
93 tensor.allocator()->init(BuildArmComputeTensorInfo(tensorInfo, dataLayout));
94}
95
/// Allocates backing storage for the given ArmCompute tensor via its allocator.
/// The tensor's info must already have been initialised (see BuildArmComputeTensor).
template <typename Tensor>
void InitialiseArmComputeTensorEmpty(Tensor& tensor)
{
    auto* allocator = tensor.allocator();
    allocator->allocate();
}
101
/// Utility function to free unused tensors after a workload is configured and prepared.
/// Releases the tensor only when it exists and ACL reports it is no longer referenced.
template <typename Tensor>
void FreeTensorIfUnused(std::unique_ptr<Tensor>& tensor)
{
    if (!tensor)
    {
        return;
    }
    if (!tensor->is_used())
    {
        tensor.reset();
    }
}
111
telsoa014fcda012018-03-09 14:13:49 +0000112// Helper function to obtain byte offset into tensor data
113inline size_t GetTensorOffset(const arm_compute::ITensorInfo& info,
Matthew Jacksondba634f2019-08-15 15:14:18 +0100114 uint32_t depthIndex,
telsoa014fcda012018-03-09 14:13:49 +0000115 uint32_t batchIndex,
116 uint32_t channelIndex,
117 uint32_t y,
118 uint32_t x)
119{
120 arm_compute::Coordinates coords;
Matthew Jacksondba634f2019-08-15 15:14:18 +0100121 coords.set(4, static_cast<int>(depthIndex));
telsoa01c577f2c2018-08-31 09:22:23 +0100122 coords.set(3, static_cast<int>(batchIndex));
123 coords.set(2, static_cast<int>(channelIndex));
124 coords.set(1, static_cast<int>(y));
125 coords.set(0, static_cast<int>(x));
Jammy Zhoud80cc0c2019-10-21 16:44:40 +0800126 return boost::numeric_cast<size_t>(info.offset_element_in_bytes(coords));
telsoa014fcda012018-03-09 14:13:49 +0000127}
128
telsoa01c577f2c2018-08-31 09:22:23 +0100129// Helper function to obtain element offset into data buffer representing tensor data (assuming no strides).
telsoa014fcda012018-03-09 14:13:49 +0000130inline size_t GetLinearBufferOffset(const arm_compute::ITensorInfo& info,
Matthew Jacksondba634f2019-08-15 15:14:18 +0100131 uint32_t depthIndex,
telsoa014fcda012018-03-09 14:13:49 +0000132 uint32_t batchIndex,
133 uint32_t channelIndex,
134 uint32_t y,
135 uint32_t x)
136{
137 const arm_compute::TensorShape& shape = info.tensor_shape();
telsoa01c577f2c2018-08-31 09:22:23 +0100138 uint32_t width = static_cast<uint32_t>(shape[0]);
139 uint32_t height = static_cast<uint32_t>(shape[1]);
140 uint32_t numChannels = static_cast<uint32_t>(shape[2]);
Matthew Jacksondba634f2019-08-15 15:14:18 +0100141 uint32_t numBatches = static_cast<uint32_t>(shape[3]);
142 return (((depthIndex * numBatches + batchIndex) * numChannels + channelIndex) * height + y) * width + x;
telsoa014fcda012018-03-09 14:13:49 +0000143}
144
145template <typename T>
146void CopyArmComputeITensorData(const arm_compute::ITensor& srcTensor, T* dstData)
147{
telsoa01c577f2c2018-08-31 09:22:23 +0100148 // If MaxNumOfTensorDimensions is increased, this loop will need fixing.
Matthew Jacksondba634f2019-08-15 15:14:18 +0100149 static_assert(MaxNumOfTensorDimensions == 5, "Please update CopyArmComputeITensorData");
telsoa014fcda012018-03-09 14:13:49 +0000150 {
151 const arm_compute::ITensorInfo& info = *srcTensor.info();
152 const arm_compute::TensorShape& shape = info.tensor_shape();
153 const uint8_t* const bufferPtr = srcTensor.buffer();
telsoa01c577f2c2018-08-31 09:22:23 +0100154 uint32_t width = static_cast<uint32_t>(shape[0]);
155 uint32_t height = static_cast<uint32_t>(shape[1]);
156 uint32_t numChannels = static_cast<uint32_t>(shape[2]);
157 uint32_t numBatches = static_cast<uint32_t>(shape[3]);
Matthew Jacksondba634f2019-08-15 15:14:18 +0100158 uint32_t depth = static_cast<uint32_t>(shape[4]);
telsoa014fcda012018-03-09 14:13:49 +0000159
Matthew Jacksondba634f2019-08-15 15:14:18 +0100160 for (unsigned int depthIndex = 0; depthIndex < depth; ++depthIndex)
telsoa014fcda012018-03-09 14:13:49 +0000161 {
Matthew Jacksondba634f2019-08-15 15:14:18 +0100162 for (unsigned int batchIndex = 0; batchIndex < numBatches; ++batchIndex)
telsoa014fcda012018-03-09 14:13:49 +0000163 {
Matthew Jacksondba634f2019-08-15 15:14:18 +0100164 for (unsigned int channelIndex = 0; channelIndex < numChannels; ++channelIndex)
telsoa014fcda012018-03-09 14:13:49 +0000165 {
Matthew Jacksondba634f2019-08-15 15:14:18 +0100166 for (unsigned int y = 0; y < height; ++y)
167 {
168 // Copies one row from arm_compute tensor buffer to linear memory buffer.
169 // A row is the largest contiguous region we can copy, as the tensor data may be using strides.
170 memcpy(
171 dstData + GetLinearBufferOffset(info, depthIndex, batchIndex, channelIndex, y, 0),
172 bufferPtr + GetTensorOffset(info, depthIndex, batchIndex, channelIndex, y, 0),
173 width * sizeof(T));
174 }
telsoa014fcda012018-03-09 14:13:49 +0000175 }
176 }
177 }
178 }
179}
180
181template <typename T>
182void CopyArmComputeITensorData(const T* srcData, arm_compute::ITensor& dstTensor)
183{
telsoa01c577f2c2018-08-31 09:22:23 +0100184 // If MaxNumOfTensorDimensions is increased, this loop will need fixing.
Matthew Jacksondba634f2019-08-15 15:14:18 +0100185 static_assert(MaxNumOfTensorDimensions == 5, "Please update CopyArmComputeITensorData");
telsoa014fcda012018-03-09 14:13:49 +0000186 {
187 const arm_compute::ITensorInfo& info = *dstTensor.info();
188 const arm_compute::TensorShape& shape = info.tensor_shape();
189 uint8_t* const bufferPtr = dstTensor.buffer();
telsoa01c577f2c2018-08-31 09:22:23 +0100190 uint32_t width = static_cast<uint32_t>(shape[0]);
191 uint32_t height = static_cast<uint32_t>(shape[1]);
192 uint32_t numChannels = static_cast<uint32_t>(shape[2]);
193 uint32_t numBatches = static_cast<uint32_t>(shape[3]);
Matthew Jacksondba634f2019-08-15 15:14:18 +0100194 uint32_t depth = static_cast<uint32_t>(shape[4]);
telsoa014fcda012018-03-09 14:13:49 +0000195
Matthew Jacksondba634f2019-08-15 15:14:18 +0100196 for (unsigned int depthIndex = 0; depthIndex < depth; ++depthIndex)
telsoa014fcda012018-03-09 14:13:49 +0000197 {
Matthew Jacksondba634f2019-08-15 15:14:18 +0100198 for (unsigned int batchIndex = 0; batchIndex < numBatches; ++batchIndex)
telsoa014fcda012018-03-09 14:13:49 +0000199 {
Matthew Jacksondba634f2019-08-15 15:14:18 +0100200 for (unsigned int channelIndex = 0; channelIndex < numChannels; ++channelIndex)
telsoa014fcda012018-03-09 14:13:49 +0000201 {
Matthew Jacksondba634f2019-08-15 15:14:18 +0100202 for (unsigned int y = 0; y < height; ++y)
203 {
204 // Copies one row from linear memory buffer to arm_compute tensor buffer.
205 // A row is the largest contiguous region we can copy, as the tensor data may be using strides.
206 memcpy(
207 bufferPtr + GetTensorOffset(info, depthIndex, batchIndex, channelIndex, y, 0),
208 srcData + GetLinearBufferOffset(info, depthIndex, batchIndex, channelIndex, y, 0),
209 width * sizeof(T));
210 }
telsoa014fcda012018-03-09 14:13:49 +0000211 }
212 }
213 }
214 }
215}
216
telsoa01c577f2c2018-08-31 09:22:23 +0100217/// Construct a TensorShape object from an ArmCompute object based on arm_compute::Dimensions.
218/// \tparam ArmComputeType Any type that implements the Dimensions interface
219/// \tparam T Shape value type
220/// \param shapelike An ArmCompute object that implements the Dimensions interface
221/// \param initial A default value to initialise the shape with
222/// \return A TensorShape object filled from the Acl shapelike object.
223template<typename ArmComputeType, typename T>
224TensorShape GetTensorShape(const ArmComputeType& shapelike, T initial)
225{
226 std::vector<unsigned int> s(MaxNumOfTensorDimensions, initial);
227 for (unsigned int i=0; i < shapelike.num_dimensions(); ++i)
228 {
229 s[(shapelike.num_dimensions()-1)-i] = boost::numeric_cast<unsigned int>(shapelike[i]);
230 }
231 return TensorShape(boost::numeric_cast<unsigned int>(shapelike.num_dimensions()), s.data());
232};
233
234/// Get the strides from an ACL strides object
235inline TensorShape GetStrides(const arm_compute::Strides& strides)
236{
237 return GetTensorShape(strides, 0U);
238}
239
240/// Get the shape from an ACL shape object
241inline TensorShape GetShape(const arm_compute::TensorShape& shape)
242{
243 return GetTensorShape(shape, 1U);
244}
245
Aron Virginas-Tar710f6642019-11-27 14:48:32 +0000246bool IsQuantMultiplierSupported(const TensorInfo& input,
247 const TensorInfo& output,
248 const TensorInfo& weights);
249
telsoa014fcda012018-03-09 14:13:49 +0000250} // namespace armcomputetensorutils
251} // namespace armnn