Blame - src/backends/neon/workloads/NeonDepthwiseConvolutionWorkload.cpp - ml/armnn

2018-03-09 14:13:49 +0000

[diff] [blame]

1

//

2

David Beck

ecb56cd

2018-09-05 12:52:57 +0100

[diff] [blame]

3

// SPDX-License-Identifier: MIT

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

4

//

5

Nattapat Chaimanowong

2018-10-17 11:12:19 +0100

[diff] [blame]

6

#include "NeonDepthwiseConvolutionWorkload.hpp"

7

Matthew Bentham

d80a712

2019-01-08 17:52:37 +0000

[diff] [blame]

8

#include "NeonWorkloadUtils.hpp"

9

10

#include <DataLayoutIndexed.hpp>

Aron Virginas-Tar

c9cc804

2018-11-01 16:15:57 +0000

[diff] [blame]

11

#include <aclCommon/ArmComputeTensorUtils.hpp>

12

#include <neon/NeonLayerSupport.hpp>

13

#include <backendsCommon/CpuTensorHandle.hpp>

Matteo Martincigh

2018-12-18 09:26:39 +0000

[diff] [blame]

14

#include <backendsCommon/WorkloadUtils.hpp>

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

15

Matthew Bentham

d80a712

2019-01-08 17:52:37 +0000

[diff] [blame]

16

#include <arm_compute/runtime/NEON/functions/NEDepthwiseConvolutionLayer.h>

17

18

using namespace armnnUtils;

19

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

20

namespace armnn

21

{

Nattapat Chaimanowong

2018-10-17 11:12:19 +0100

[diff] [blame]

22

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

23

using namespace armcomputetensorutils;

24

Nattapat Chaimanowong

2018-10-17 11:12:19 +0100

[diff] [blame]

25

/// Asks the Arm Compute Library whether its NEON depthwise convolution accepts this configuration.
///
/// @param input      Input tensor info.
/// @param output     Output tensor info.
/// @param descriptor Layer parameters; supplies the data layout, bias flag, dilation and pad/stride values.
/// @param weights    Weight tensor info in ArmNN's [ M, I, H, W ] format.
/// @param biases     Bias tensor info; asserted to hold a value when descriptor.m_BiasEnabled is set.
/// @return The status produced by arm_compute::NEDepthwiseConvolutionLayer::validate.
arm_compute::Status NeonDepthwiseConvolutionWorkloadValidate(const TensorInfo& input,
                                                             const TensorInfo& output,
                                                             const DepthwiseConvolution2dDescriptor& descriptor,
                                                             const TensorInfo& weights,
                                                             const Optional<TensorInfo>& biases)
{
    const auto& layout = descriptor.m_DataLayout;

    const arm_compute::TensorInfo aclInputInfo  = BuildArmComputeTensorInfo(input, layout);
    const arm_compute::TensorInfo aclOutputInfo = BuildArmComputeTensorInfo(output, layout);

    // ArmNN's weight format is [ M, I, H, W ], so the depth multiplier is the first dimension
    const unsigned int aclDepthMultiplier = weights.GetShape()[0];

    // The weight format is converted from ArmNN's [ M, I, H, W ] (which does NOT depend on the data layout)
    // to [ 1, H, W, I * M ] (NHWC) or [ 1, I * M, H, W ] (NCHW), as required by the compute library,
    // and then described in the compute library's own tensor info type
    const TensorInfo weightsPermuted = ConvertWeightTensorInfoFromArmnnToAcl(weights, layout);
    const arm_compute::TensorInfo aclWeightsInfo = BuildArmComputeTensorInfo(weightsPermuted, layout);

    // The bias info is only populated, and only passed on, when the descriptor enables bias
    arm_compute::TensorInfo aclBiasesInfo;
    if (descriptor.m_BiasEnabled)
    {
        BOOST_ASSERT(biases.has_value());

        aclBiasesInfo = BuildArmComputeTensorInfo(biases.value(), layout);
    }
    arm_compute::TensorInfo* const optionalAclBiasesInfo = descriptor.m_BiasEnabled ? &aclBiasesInfo : nullptr;

    const arm_compute::PadStrideInfo aclPadStrideInfo = BuildArmComputePadStrideInfo(descriptor);
    const arm_compute::Size2D aclDilationInfo =
        BuildArmComputeSize2D(descriptor.m_DilationX, descriptor.m_DilationY);

    return arm_compute::NEDepthwiseConvolutionLayer::validate(&aclInputInfo,
                                                              &aclWeightsInfo,
                                                              optionalAclBiasesInfo,
                                                              &aclOutputInfo,
                                                              aclPadStrideInfo,
                                                              aclDepthMultiplier,
                                                              arm_compute::ActivationLayerInfo(),
                                                              aclDilationInfo);
}

68

69

/// Creates and configures the Arm Compute Library depthwise convolution function for this workload.
///
/// The weights are permuted from ArmNN's [ M, I, H, W ] format into the format the compute library
/// requires, the function is configured (the 3x3 variant when the kernel is 3x3), the weight and
/// optional bias tensors are filled, and finally prepare() and FreeUnusedTensors() are called.
///
/// @param descriptor Queue descriptor forwarded to BaseWorkload and read back through m_Data.
/// @param info       Workload info forwarded to BaseWorkload.
NeonDepthwiseConvolutionWorkload::NeonDepthwiseConvolutionWorkload(
    const DepthwiseConvolution2dQueueDescriptor& descriptor,
    const WorkloadInfo& info)
    : BaseWorkload<DepthwiseConvolution2dQueueDescriptor>(descriptor, info)
{
    const auto& params = m_Data.m_Parameters;

    // ArmNN's weight format is [ M, I, H, W ]
    const auto& weightInfo = m_Data.m_Weight->GetTensorInfo();

    // Scratch storage that receives the swizzled copy of the weight tensor
    std::unique_ptr<unsigned char[]> permuteBuffer(new unsigned char[weightInfo.GetNumBytes()]);

    // The weight format is converted from ArmNN's [ M, I, H, W ] (which does NOT depend on the data layout)
    // to [ 1, H, W, I * M ] (NHWC) or [ 1, I * M, H, W ] (NCHW), as required by the compute library
    ConstTensor weightPermuted =
        ConvertWeightTensorFromArmnnToAcl(m_Data.m_Weight, params.m_DataLayout, permuteBuffer.get());

    // Describe the permuted weights as a compute library tensor
    m_KernelTensor = std::make_unique<arm_compute::Tensor>();
    BuildArmComputeTensor(*m_KernelTensor, weightPermuted.GetInfo(), params.m_DataLayout);

    if (params.m_BiasEnabled)
    {
        m_BiasTensor = std::make_unique<arm_compute::Tensor>();
        BuildArmComputeTensor(*m_BiasTensor, m_Data.m_Bias->GetTensorInfo(), params.m_DataLayout);
    }

    arm_compute::PadStrideInfo padStrideInfo(params.m_StrideX,
                                             params.m_StrideY,
                                             params.m_PadLeft,
                                             params.m_PadRight,
                                             params.m_PadTop,
                                             params.m_PadBottom,
                                             arm_compute::DimensionRoundingType::FLOOR);

    const arm_compute::Size2D aclDilationInfo = BuildArmComputeSize2D(params.m_DilationX, params.m_DilationY);

    m_Data.ValidateInputsOutputs("NeonDepthwiseConvolutionWorkload", 1, 1);

    arm_compute::ITensor& input  = static_cast<INeonTensorHandle*>(m_Data.m_Inputs[0])->GetTensor();
    arm_compute::ITensor& output = static_cast<INeonTensorHandle*>(m_Data.m_Outputs[0])->GetTensor();

    // Both tensors are tagged with the data layout requested by the descriptor
    const arm_compute::DataLayout aclDataLayout = ConvertDataLayout(params.m_DataLayout);
    input.info()->set_data_layout(aclDataLayout);
    output.info()->set_data_layout(aclDataLayout);

    // With the [ M, I, H, W ] format, dimension 0 is the depth multiplier and dimensions 2 and 3
    // are the kernel height and width
    const auto& weightShape = weightInfo.GetShape();
    const unsigned int depthMultiplier = weightShape[0];

    // A 3x3 kernel selects the dedicated 3x3 function; anything else uses the generic one
    const bool use3x3Optimisation = (weightShape[2] == 3) && (weightShape[3] == 3);
    if (use3x3Optimisation)
    {
        m_pDepthwiseConvolutionLayer = std::make_unique<arm_compute::NEDepthwiseConvolutionLayer3x3>();
        auto& layer3x3 =
            static_cast<arm_compute::NEDepthwiseConvolutionLayer3x3&>(*m_pDepthwiseConvolutionLayer);
        layer3x3.configure(&input,
                           m_KernelTensor.get(),
                           m_BiasTensor.get(),
                           &output,
                           padStrideInfo,
                           depthMultiplier,
                           arm_compute::ActivationLayerInfo(),
                           aclDilationInfo);
    }
    else
    {
        m_pDepthwiseConvolutionLayer = std::make_unique<arm_compute::NEDepthwiseConvolutionLayer>();
        auto& genericLayer =
            static_cast<arm_compute::NEDepthwiseConvolutionLayer&>(*m_pDepthwiseConvolutionLayer);
        genericLayer.configure(&input,
                               m_KernelTensor.get(),
                               m_BiasTensor.get(),
                               &output,
                               padStrideInfo,
                               depthMultiplier,
                               arm_compute::ActivationLayerInfo(),
                               aclDilationInfo);
    }

    BOOST_ASSERT(m_pDepthwiseConvolutionLayer);

    // NOTE(review): the tensor data is filled only after configure(), as in the original ordering;
    // presumably the compute library requires this - confirm before reordering
    ScopedCpuTensorHandle weightsPermutedHandle(weightPermuted);
    InitializeArmComputeTensorData(*m_KernelTensor, &weightsPermutedHandle);

    if (params.m_BiasEnabled)
    {
        InitializeArmComputeTensorData(*m_BiasTensor, m_Data.m_Bias);
    }

    m_pDepthwiseConvolutionLayer->prepare();
    FreeUnusedTensors();
}

165

Nattapat Chaimanowong

2018-10-17 11:12:19 +0100

[diff] [blame]

166

void NeonDepthwiseConvolutionWorkload::Execute() const

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

167

{

Nattapat Chaimanowong

2018-10-17 11:12:19 +0100

[diff] [blame]

168

ARMNN_SCOPED_PROFILING_EVENT_NEON("NeonDepthwiseConvolutionWorkload_Execute");

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

169

BOOST_ASSERT(m_pDepthwiseConvolutionLayer);

170

171

m_pDepthwiseConvolutionLayer->run();

172

}

173

Nattapat Chaimanowong

2018-10-17 11:12:19 +0100

[diff] [blame]

174

void NeonDepthwiseConvolutionWorkload::FreeUnusedTensors()

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

175

{

176

FreeTensorIfUnused(m_KernelTensor);

177

FreeTensorIfUnused(m_BiasTensor);

178

}

179

telsoa01