Blame - src/backends/neon/workloads/NeonDepthwiseConvolutionWorkload.cpp - ml/armnn

2018-03-09 14:13:49 +0000

[diff] [blame]

1

//

2

David Beck

ecb56cd

2018-09-05 12:52:57 +0100

[diff] [blame]

3

// SPDX-License-Identifier: MIT

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

4

//

5

Nattapat Chaimanowong

2018-10-17 11:12:19 +0100

[diff] [blame]

6

#include "NeonDepthwiseConvolutionWorkload.hpp"

7

Matthew Bentham

d80a712

2019-01-08 17:52:37 +0000

[diff] [blame]

8

#include "NeonWorkloadUtils.hpp"

9

Matteo Martincigh

e011d20

2019-11-28 11:35:47 +0000

[diff] [blame]

10

#include <armnnUtils/DataLayoutIndexed.hpp>

11

Aron Virginas-Tar

c9cc804

2018-11-01 16:15:57 +0000

[diff] [blame]

12

#include <aclCommon/ArmComputeTensorUtils.hpp>

Mike Kelly

2020-11-12 10:58:48 +0000

[diff] [blame]

13

#include <aclCommon/ArmComputeUtils.hpp>

Matteo Martincigh

e011d20

2019-11-28 11:35:47 +0000

[diff] [blame]

14

Aron Virginas-Tar

c9cc804

2018-11-01 16:15:57 +0000

[diff] [blame]

15

#include <neon/NeonLayerSupport.hpp>

Matteo Martincigh

e011d20

2019-11-28 11:35:47 +0000

[diff] [blame]

16

James Conroy

1f58f03

2021-04-27 17:13:27 +0100

[diff] [blame]

17

#include <backendsCommon/TensorHandle.hpp>

Matteo Martincigh

2018-12-18 09:26:39 +0000

[diff] [blame]

18

#include <backendsCommon/WorkloadUtils.hpp>

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

19

Matthew Bentham

d80a712

2019-01-08 17:52:37 +0000

[diff] [blame]

20

#include <arm_compute/runtime/NEON/functions/NEDepthwiseConvolutionLayer.h>

21

22

using namespace armnnUtils;

23

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

24

namespace armnn

25

{

Nattapat Chaimanowong

2018-10-17 11:12:19 +0100

[diff] [blame]

26

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

27

using namespace armcomputetensorutils;

28

Nattapat Chaimanowong

2018-10-17 11:12:19 +0100

[diff] [blame]

29

// Asks the Arm Compute Library whether NEDepthwiseConvolutionLayer supports the given configuration.
//
// input / output       : tensor infos, converted to ACL tensor infos using descriptor.m_DataLayout.
// descriptor           : supplies the data layout, bias flag, pad/stride settings and dilation.
// weights              : weight tensor info in ArmNN's [ M, I, H, W ] format.
// biases               : must hold a value when descriptor.m_BiasEnabled is set.
// activationDescriptor : forwarded to ConvertActivationDescriptorToAclActivationLayerInfo
//                        (NOTE(review): presumably may be null for "no fused activation" - confirm).
//
// Returns the status produced by NEDepthwiseConvolutionLayer::validate, or a RUNTIME_ERROR status when
// bias is enabled but no bias info was supplied.
arm_compute::Status NeonDepthwiseConvolutionWorkloadValidate(const TensorInfo& input,
                                                             const TensorInfo& output,
                                                             const DepthwiseConvolution2dDescriptor& descriptor,
                                                             const TensorInfo& weights,
                                                             const Optional<TensorInfo>& biases,
                                                             const ActivationDescriptor* activationDescriptor)
{
    const arm_compute::TensorInfo aclInputInfo  = BuildArmComputeTensorInfo(input,  descriptor.m_DataLayout);
    const arm_compute::TensorInfo aclOutputInfo = BuildArmComputeTensorInfo(output, descriptor.m_DataLayout);

    // ArmNN's weight format is [ M, I, H, W ]
    const unsigned int aclDepthMultiplier = weights.GetShape()[0];

    // Convert the weight format from ArmNN's [ M, I, H, W ] (does NOT depend on the data layout) to either
    // [ 1, H, W, I * M ] (if NHWC) or [ 1, I * M, H, W ] (if NCHW), as required by the compute library
    TensorInfo weightsPermuted = ConvertWeightTensorInfoFromArmnnToAcl(weights, descriptor.m_DataLayout);

    // Convert the weights into the compute library format
    const arm_compute::TensorInfo aclWeightsInfo = BuildArmComputeTensorInfo(weightsPermuted, descriptor.m_DataLayout);

    arm_compute::TensorInfo aclBiasesInfo;
    arm_compute::TensorInfo* optionalAclBiasesInfo = nullptr;

    if (descriptor.m_BiasEnabled)
    {
        // Report the inconsistency through the returned status rather than relying on an assertion:
        // if the assertion is compiled out, biases.value() would be called on an empty Optional.
        if (!biases.has_value())
        {
            return arm_compute::Status{arm_compute::ErrorCode::RUNTIME_ERROR,
                                       "NeonDepthwiseConvolutionWorkloadValidate: bias is enabled but no bias "
                                       "tensor info was provided."};
        }

        aclBiasesInfo = BuildArmComputeTensorInfo(biases.value(), descriptor.m_DataLayout);
        optionalAclBiasesInfo = &aclBiasesInfo;
    }

    arm_compute::PadStrideInfo aclPadStrideInfo = BuildArmComputePadStrideInfo(descriptor);
    const arm_compute::Size2D aclDilationInfo = BuildArmComputeSize2D(
        descriptor.m_DilationX, descriptor.m_DilationY);

    const arm_compute::ActivationLayerInfo activationInfo = ConvertActivationDescriptorToAclActivationLayerInfo(
        activationDescriptor);

    return arm_compute::NEDepthwiseConvolutionLayer::validate(&aclInputInfo,
                                                              &aclWeightsInfo,
                                                              optionalAclBiasesInfo,
                                                              &aclOutputInfo,
                                                              aclPadStrideInfo,
                                                              aclDepthMultiplier,
                                                              activationInfo,
                                                              aclDilationInfo);
}

76

77

// Sets up the workload: permutes the weights into the compute library layout, describes the kernel and
// (optional) bias tensors, configures an NEDepthwiseConvolutionLayer, copies the constant data across,
// then calls prepare() and FreeUnusedTensors().
NeonDepthwiseConvolutionWorkload::NeonDepthwiseConvolutionWorkload(
    const DepthwiseConvolution2dQueueDescriptor& descriptor,
    const WorkloadInfo& info)
    : BaseWorkload<DepthwiseConvolution2dQueueDescriptor>(descriptor, info)
{
    // The weights arrive in ArmNN's [ M, I, H, W ] format
    auto& armnnWeightInfo = m_Data.m_Weight->GetTensorInfo();

    // Scratch storage that receives the swizzled copy of the weights
    std::unique_ptr<unsigned char[]> swizzleScratch(new unsigned char[armnnWeightInfo.GetNumBytes()]);

    // ArmNN's [ M, I, H, W ] weights (independent of the data layout) become [ 1, H, W, I * M ] for NHWC
    // or [ 1, I * M, H, W ] for NCHW, which is what the compute library expects
    ConstTensor aclLayoutWeights = ConvertWeightTensorFromArmnnToAcl(m_Data.m_Weight,
                                                                     m_Data.m_Parameters.m_DataLayout,
                                                                     swizzleScratch.get());

    // Describe the kernel tensor using the permuted weight info
    m_KernelTensor = std::make_unique<arm_compute::Tensor>();
    BuildArmComputeTensor(*m_KernelTensor, aclLayoutWeights.GetInfo(), m_Data.m_Parameters.m_DataLayout);

    if (m_Data.m_Parameters.m_BiasEnabled)
    {
        m_BiasTensor = std::make_unique<arm_compute::Tensor>();
        BuildArmComputeTensor(*m_BiasTensor, m_Data.m_Bias->GetTensorInfo(), m_Data.m_Parameters.m_DataLayout);
    }

    const arm_compute::Size2D dilation = BuildArmComputeSize2D(m_Data.m_Parameters.m_DilationX,
                                                               m_Data.m_Parameters.m_DilationY);

    // Exactly one input and one output are expected
    m_Data.ValidateInputsOutputs("NeonDepthwiseConvolutionWorkload", 1, 1);

    IAclTensorHandle* srcHandle = static_cast<IAclTensorHandle*>(m_Data.m_Inputs[0]);
    IAclTensorHandle* dstHandle = static_cast<IAclTensorHandle*>(m_Data.m_Outputs[0]);

    arm_compute::ITensor& src = srcHandle->GetTensor();
    arm_compute::ITensor& dst = dstHandle->GetTensor();

    // Input and output share the data layout requested by the descriptor
    const arm_compute::DataLayout layout = ConvertDataLayout(m_Data.m_Parameters.m_DataLayout);
    src.info()->set_data_layout(layout);
    dst.info()->set_data_layout(layout);

    // The depth multiplier is the leading (M) dimension of the ArmNN weight shape
    const unsigned int multiplier = armnnWeightInfo.GetShape()[0];

    arm_compute::PadStrideInfo padStride = BuildArmComputePadStrideInfo(m_Data.m_Parameters);

    const arm_compute::ActivationLayerInfo fusedActivation = ConvertAdditionalInfoToAclActivationLayerInfo(descriptor);

    // Configure through a pointer of the concrete type, then hand ownership to the member
    auto depthwiseLayer = std::make_unique<arm_compute::NEDepthwiseConvolutionLayer>();
    depthwiseLayer->configure(&src,
                              m_KernelTensor.get(),
                              m_BiasTensor.get(),
                              &dst,
                              padStride,
                              multiplier,
                              fusedActivation,
                              dilation);
    m_pDepthwiseConvolutionLayer = std::move(depthwiseLayer);

    ARMNN_ASSERT(m_pDepthwiseConvolutionLayer);

    // Copy the constant data across only after configure() has run
    ScopedTensorHandle permutedWeightsHandle(aclLayoutWeights);
    InitializeArmComputeTensorData(*m_KernelTensor, &permutedWeightsHandle);

    if (m_Data.m_Parameters.m_BiasEnabled)
    {
        InitializeArmComputeTensorData(*m_BiasTensor, m_Data.m_Bias);
    }

    m_pDepthwiseConvolutionLayer->prepare();
    FreeUnusedTensors();
}

150

Nattapat Chaimanowong

2018-10-17 11:12:19 +0100

[diff] [blame]

151

void NeonDepthwiseConvolutionWorkload::Execute() const

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

152

{

Nattapat Chaimanowong

2018-10-17 11:12:19 +0100

[diff] [blame]

153

ARMNN_SCOPED_PROFILING_EVENT_NEON("NeonDepthwiseConvolutionWorkload_Execute");

Narumol Prangnawarat

ac2770a

2020-04-01 16:51:23 +0100

[diff] [blame]

154

ARMNN_ASSERT(m_pDepthwiseConvolutionLayer);

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

155

156

m_pDepthwiseConvolutionLayer->run();

157

}

158

Nattapat Chaimanowong

2018-10-17 11:12:19 +0100

[diff] [blame]

159

void NeonDepthwiseConvolutionWorkload::FreeUnusedTensors()

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

160

{

161

FreeTensorIfUnused(m_KernelTensor);

162

FreeTensorIfUnused(m_BiasTensor);

163

}

164

telsoa01