Blame - src/backends/neon/workloads/NeonDepthwiseConvolutionWorkload.cpp - ml/armnn

2018-03-09 14:13:49 +0000

[diff] [blame]

1

//

Mike Kelly

ec67a0f

2022-11-25 13:55:24 +0000

[diff] [blame^]

2

David Beck

ecb56cd

2018-09-05 12:52:57 +0100

[diff] [blame]

3

// SPDX-License-Identifier: MIT

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

4

//

5

Nattapat Chaimanowong

2018-10-17 11:12:19 +0100

[diff] [blame]

6

#include "NeonDepthwiseConvolutionWorkload.hpp"

7

Matthew Bentham

d80a712

2019-01-08 17:52:37 +0000

[diff] [blame]

8

#include "NeonWorkloadUtils.hpp"

9

Matteo Martincigh

e011d20

2019-11-28 11:35:47 +0000

[diff] [blame]

10

#include <armnnUtils/DataLayoutIndexed.hpp>

11

Aron Virginas-Tar

c9cc804

2018-11-01 16:15:57 +0000

[diff] [blame]

12

#include <aclCommon/ArmComputeTensorUtils.hpp>

Mike Kelly

2020-11-12 10:58:48 +0000

[diff] [blame]

13

#include <aclCommon/ArmComputeUtils.hpp>

Matteo Martincigh

e011d20

2019-11-28 11:35:47 +0000

[diff] [blame]

14

Aron Virginas-Tar

c9cc804

2018-11-01 16:15:57 +0000

[diff] [blame]

15

#include <neon/NeonLayerSupport.hpp>

Matteo Martincigh

e011d20

2019-11-28 11:35:47 +0000

[diff] [blame]

16

Colm Donelan

0c47974

2021-12-10 12:43:54 +0000

[diff] [blame]

17

#include <armnn/backends/TensorHandle.hpp>

Matteo Martincigh

2018-12-18 09:26:39 +0000

[diff] [blame]

18

#include <backendsCommon/WorkloadUtils.hpp>

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

19

Matthew Bentham

d80a712

2019-01-08 17:52:37 +0000

[diff] [blame]

20

#include <arm_compute/runtime/NEON/functions/NEDepthwiseConvolutionLayer.h>

21

22

using namespace armnnUtils;

23

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

24

namespace armnn

25

{

Nattapat Chaimanowong

2018-10-17 11:12:19 +0100

[diff] [blame]

26

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

27

using namespace armcomputetensorutils;

28

Nattapat Chaimanowong

2018-10-17 11:12:19 +0100

[diff] [blame]

29

/// Asks the Arm Compute Library whether NEDepthwiseConvolutionLayer can run the given configuration.
///
/// @param input                Tensor info of the layer input.
/// @param output               Tensor info of the layer output.
/// @param descriptor           Depthwise convolution parameters (data layout, bias flag, dilation, ...).
/// @param weights              Tensor info of the weights, in ArmNN's [1, H, W, C] depthwise format.
/// @param biases               Optional tensor info of the bias; read only when descriptor.m_BiasEnabled is set.
/// @param activationDescriptor Optional fused activation, forwarded to
///                             ConvertActivationDescriptorToAclActivationLayerInfo.
/// @return The status returned by arm_compute::NEDepthwiseConvolutionLayer::validate, or a RUNTIME_ERROR
///         status when bias is enabled and the bias tensor is not constant.
arm_compute::Status NeonDepthwiseConvolutionWorkloadValidate(const TensorInfo& input,
                                                             const TensorInfo& output,
                                                             const DepthwiseConvolution2dDescriptor& descriptor,
                                                             const TensorInfo& weights,
                                                             const Optional<TensorInfo>& biases,
                                                             const ActivationDescriptor* activationDescriptor)
{
    const auto& dataLayout = descriptor.m_DataLayout;

    const arm_compute::TensorInfo inputInfoAcl  = BuildArmComputeTensorInfo(input, dataLayout);
    const arm_compute::TensorInfo outputInfoAcl = BuildArmComputeTensorInfo(output, dataLayout);

    // Weight layouts:
    //   ArmNN: always [1, H, W, C], whatever the input/output layout is.
    //   ACL:   [1, H, W, C] when input/output are [N, H, W, C] (identical to ArmNN),
    //          [1, C, H, W] when input/output are [N, C, H, W].
    //
    // For [N, C, H, W] the ArmNN weights therefore need permuting before ACL can use them. The
    // PermuteDepthwiseConv2dWeights backend optimization does that for the real tensors, but it has not
    // been performed yet at this point, so the weights TensorInfo is permuted here instead.
    TensorInfo permutedWeights;
    unsigned int depthMultiplier;
    std::tie(permutedWeights, depthMultiplier) = Convert1HWOTensorInfoToAcl(weights, input, dataLayout);

    // Translate the (permuted) weights info into its compute library counterpart.
    arm_compute::TensorInfo weightsInfoAcl = BuildArmComputeTensorInfo(permutedWeights, dataLayout);
    weightsInfoAcl.set_are_values_constant(weights.IsConstant());

    // The bias info is handed to ACL by pointer; it stays null when bias is disabled.
    arm_compute::TensorInfo biasInfoAcl;
    arm_compute::TensorInfo* biasInfoAclPtr = nullptr;
    if (descriptor.m_BiasEnabled)
    {
        ARMNN_ASSERT(biases.has_value());
        const TensorInfo& biasInfo = biases.value();

        // Same for bias as weights. We don't currently support non const.
        if (!biasInfo.IsConstant())
        {
            return arm_compute::Status{arm_compute::ErrorCode::RUNTIME_ERROR,
                                       "ArmNN NeonDepthwiseConv2dWorkload does not support non constant bias."};
        }

        biasInfoAcl = BuildArmComputeTensorInfo(biasInfo, dataLayout);
        biasInfoAcl.set_are_values_constant(biasInfo.IsConstant());
        biasInfoAclPtr = &biasInfoAcl;
    }

    arm_compute::PadStrideInfo padStrideInfoAcl = BuildArmComputePadStrideInfo(descriptor);
    const arm_compute::Size2D dilationAcl =
        BuildArmComputeSize2D(descriptor.m_DilationX, descriptor.m_DilationY);
    const arm_compute::ActivationLayerInfo activationInfoAcl =
        ConvertActivationDescriptorToAclActivationLayerInfo(activationDescriptor);

    return arm_compute::NEDepthwiseConvolutionLayer::validate(&inputInfoAcl,
                                                              &weightsInfoAcl,
                                                              biasInfoAclPtr,
                                                              &outputInfoAcl,
                                                              padStrideInfoAcl,
                                                              depthMultiplier,
                                                              activationInfoAcl,
                                                              dilationAcl);
}

88

89

/// Creates, configures and prepares the ACL NEDepthwiseConvolutionLayer for this workload.
///
/// Inputs are read from the queue descriptor as: [0] input, [1] weights and, when
/// m_Parameters.m_BiasEnabled is set, [2] bias. Output [0] receives the result.
///
/// @param descriptor Queue descriptor carrying the tensor handles and the depthwise convolution parameters.
/// @param info       Workload info; its tensor infos are copied into the profiling details.
NeonDepthwiseConvolutionWorkload::NeonDepthwiseConvolutionWorkload(
    const DepthwiseConvolution2dQueueDescriptor& descriptor,
    const WorkloadInfo& info)
    : NeonBaseWorkload<DepthwiseConvolution2dQueueDescriptor>(descriptor, info)
{
    // Check the number of inputs/outputs BEFORE indexing m_Inputs / m_Outputs, so that a malformed
    // descriptor is reported by ValidateInputsOutputs instead of causing an out-of-range access below.
    const uint32_t numInputs = m_Data.m_Parameters.m_BiasEnabled ? 3 : 2;
    m_Data.ValidateInputsOutputs("NeonDepthwiseConvolutionWorkload", numInputs, 1);

    arm_compute::ITensor& input   = PolymorphicDowncast<IAclTensorHandle*>(m_Data.m_Inputs[0])->GetTensor();
    arm_compute::ITensor& output  = PolymorphicDowncast<IAclTensorHandle*>(m_Data.m_Outputs[0])->GetTensor();
    arm_compute::ITensor& weights = PolymorphicDowncast<IAclTensorHandle*>(m_Data.m_Inputs[1])->GetTensor();
    arm_compute::ITensor* biasesPtr = nullptr;
    if (m_Data.m_Parameters.m_BiasEnabled)
    {
        biasesPtr = &PolymorphicDowncast<IAclTensorHandle*>(m_Data.m_Inputs[2])->GetTensor();
    }

    arm_compute::ITensorInfo* weightsInfo = weights.info();
    arm_compute::ITensorInfo* inputInfo   = input.info();
    auto weightsShape = weightsInfo->tensor_shape();
    auto inputShape   = inputInfo->tensor_shape();

    // The PermuteDepthwiseConv2dWeights backend optimization has been performed,
    // converting weights to have the same data layout as input.
    unsigned int depthMultiplier =
        ComputeDepthwiseConv2dDepthMultiplier(m_Data.m_Parameters.m_DataLayout, weightsShape, inputShape);

    const arm_compute::Size2D aclDilationInfo = BuildArmComputeSize2D(
        m_Data.m_Parameters.m_DilationX, m_Data.m_Parameters.m_DilationY);

    // Tag every tensor with the ACL equivalent of the descriptor's data layout before configuring.
    arm_compute::DataLayout aclDataLayout = ConvertDataLayout(m_Data.m_Parameters.m_DataLayout);
    input.info()->set_data_layout(aclDataLayout);
    weights.info()->set_data_layout(aclDataLayout);
    output.info()->set_data_layout(aclDataLayout);

    arm_compute::PadStrideInfo padStrideInfo = BuildArmComputePadStrideInfo(m_Data.m_Parameters);

    const arm_compute::ActivationLayerInfo activationInfo = ConvertAdditionalInfoToAclActivationLayerInfo(descriptor);

    // The member is accessed through a cast to the concrete layer type so that configure() can be called.
    m_pDepthwiseConvolutionLayer = std::make_unique<arm_compute::NEDepthwiseConvolutionLayer>();
    static_cast<arm_compute::NEDepthwiseConvolutionLayer*>(
        m_pDepthwiseConvolutionLayer.get())->configure(&input,
                                                       &weights,
                                                       biasesPtr,
                                                       &output,
                                                       padStrideInfo,
                                                       depthMultiplier,
                                                       activationInfo,
                                                       aclDilationInfo);

    // Add details for profiling output
    WorkloadInfo detailsInfo;

    detailsInfo.m_InputTensorInfos  = info.m_InputTensorInfos;
    detailsInfo.m_OutputTensorInfos = info.m_OutputTensorInfos;
    detailsInfo.m_WeightsTensorInfo = armnn::Optional<armnn::TensorInfo>(info.m_InputTensorInfos[1]);
    if (descriptor.m_Parameters.m_BiasEnabled)
    {
        detailsInfo.m_BiasTensorInfo = armnn::Optional<armnn::TensorInfo>(info.m_InputTensorInfos[2]);
    }

    // Report Profiling Details
    ARMNN_REPORT_PROFILING_WORKLOAD_DESC("NeonDepthwiseConvolution2dWorkload_Construct",
                                         descriptor.m_Parameters,
                                         detailsInfo,
                                         GetGuid());

    ARMNN_ASSERT(m_pDepthwiseConvolutionLayer);

    m_pDepthwiseConvolutionLayer->prepare();
}

160

Nattapat Chaimanowong

2018-10-17 11:12:19 +0100

[diff] [blame]

161

void NeonDepthwiseConvolutionWorkload::Execute() const

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

162

{

Cathal Corbett

2022-05-11 20:12:17 +0100

[diff] [blame]

163

ARMNN_SCOPED_PROFILING_EVENT_NEON_GUID("NeonDepthwiseConvolutionWorkload_Execute", GetGuid());

Narumol Prangnawarat

ac2770a

2020-04-01 16:51:23 +0100

[diff] [blame]

164

ARMNN_ASSERT(m_pDepthwiseConvolutionLayer);

telsoa01

2018-03-09 14:13:49 +0000

[diff] [blame]

165

166

m_pDepthwiseConvolutionLayer->run();

167

}

168

telsoa01