Blame - src/backends/cl/workloads/ClDepthwiseConvolutionWorkload.cpp - ml/armnn

2018-08-31 09:22:23 +0100

[diff] [blame]

1

//

Teresa Charlin

588cbdf

2022-01-19 15:55:37 +0000

[diff] [blame]

2

David Beck

ecb56cd

2018-09-05 12:52:57 +0100

[diff] [blame]

3

// SPDX-License-Identifier: MIT

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

4

//

5

Matthew Bentham

2018-10-08 09:38:55 +0100

[diff] [blame]

6

#include "ClDepthwiseConvolutionWorkload.hpp"

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

7

Aron Virginas-Tar

d4f0fea

2019-04-09 14:08:06 +0100

[diff] [blame]

8

#include <ResolveType.hpp>

Matthew Bentham

2018-10-08 09:38:55 +0100

[diff] [blame]

9

#include "ClWorkloadUtils.hpp"

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

10

Mike Kelly

2020-11-12 10:58:48 +0000

[diff] [blame]

11

#include <armnn/Exceptions.hpp>

Aron Virginas-Tar

c9cc804

2018-11-01 16:15:57 +0000

[diff] [blame]

12

#include <aclCommon/ArmComputeUtils.hpp>

13

#include <aclCommon/ArmComputeTensorUtils.hpp>

14

#include <cl/ClTensorHandle.hpp>

Colm Donelan

0c47974

2021-12-10 12:43:54 +0000

[diff] [blame]

15

#include <armnn/backends/TensorHandle.hpp>

Matteo Martincigh

2018-12-18 09:26:39 +0000

[diff] [blame]

16

#include <backendsCommon/WorkloadUtils.hpp>

Colm Donelan

0c47974

2021-12-10 12:43:54 +0000

[diff] [blame]

17

#include <armnn/backends/WorkloadData.hpp>

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

18

Matthew Bentham

2018-10-08 09:38:55 +0100

[diff] [blame]

19

#include <arm_compute/runtime/CL/functions/CLDepthwiseConvolutionLayer.h>

20

telsoa01

2018-08-31 09:22:23 +0100

[diff] [blame]

namespace armnn

{

using namespace armcomputetensorutils;

25

26

/// Asks the Arm Compute Library whether CLDepthwiseConvolutionLayer accepts the given configuration.
///
/// @param input                Input tensor info.
/// @param output               Output tensor info.
/// @param descriptor           Depthwise convolution parameters (data layout, padding/stride, dilation, bias flag).
/// @param weights              Weights tensor info in the ArmNN [1, H, W, C] format.
/// @param biases               Bias tensor info; must hold a value when descriptor.m_BiasEnabled is set.
/// @param activationDescriptor Fused activation description, passed on to
///                             ConvertActivationDescriptorToAclActivationLayerInfo.
/// @return The status reported by arm_compute::CLDepthwiseConvolutionLayer::validate, or a RUNTIME_ERROR status
///         when bias is enabled but is either missing or not constant.
arm_compute::Status ClDepthwiseConvolutionWorkloadValidate(const TensorInfo& input,
                                                           const TensorInfo& output,
                                                           const DepthwiseConvolution2dDescriptor& descriptor,
                                                           const TensorInfo& weights,
                                                           const Optional<TensorInfo>& biases,
                                                           const ActivationDescriptor* activationDescriptor)
{
    const arm_compute::TensorInfo aclInputInfo  = BuildArmComputeTensorInfo(input,  descriptor.m_DataLayout);
    const arm_compute::TensorInfo aclOutputInfo = BuildArmComputeTensorInfo(output, descriptor.m_DataLayout);

    // ArmNN format for weights for depthwise is [1, H, W, C] independently of the input/output layout
    //
    // ACL format for weights for depthwise is:
    // - [1, H, W, C] for [N, H, W, C] input/output layout (matches with ArmNN)
    // - [1, C, H, W] for [N, C, H, W] input/output layout
    //
    // Therefore ArmNN weights have to be permuted when input/output layout is [N, C, H, W] to pass them to ACL.
    // The PermuteDepthwiseConv2dWeights backend optimization takes care of this, but it has not been performed yet,
    // so we do the permute here for the TensorInfo weights.
    unsigned int aclDepthMultiplier;
    TensorInfo weightsPermuted;
    std::tie(weightsPermuted, aclDepthMultiplier) =
        Convert1HWOTensorInfoToAcl(weights, input, descriptor.m_DataLayout);

    // Convert the weights into the compute library format
    arm_compute::TensorInfo aclWeightsInfo = BuildArmComputeTensorInfo(weightsPermuted, descriptor.m_DataLayout);
    aclWeightsInfo.set_are_values_constant(weights.IsConstant());

    arm_compute::TensorInfo aclBiasesInfo;
    arm_compute::TensorInfo* optionalAclBiasesInfo = nullptr;
    if (descriptor.m_BiasEnabled)
    {
        // Report a missing bias through the returned Status rather than an assert, so the check does not
        // depend on assertions being enabled in the build.
        if (!biases.has_value())
        {
            return arm_compute::Status{arm_compute::ErrorCode::RUNTIME_ERROR,
                                       "ArmNN ClDepthwiseConv2dWorkload: bias is enabled but no bias "
                                       "tensor info was provided."};
        }

        // Non-constant bias is not currently supported by this workload.
        if (!biases.value().IsConstant())
        {
            return arm_compute::Status{arm_compute::ErrorCode::RUNTIME_ERROR,
                                       "ArmNN ClDepthwiseConv2dWorkload does not support non constant bias."};
        }

        aclBiasesInfo = BuildArmComputeTensorInfo(biases.value(), descriptor.m_DataLayout);
        aclBiasesInfo.set_are_values_constant(biases.value().IsConstant());
        optionalAclBiasesInfo = &aclBiasesInfo;
    }

    const arm_compute::PadStrideInfo aclPadStrideInfo = BuildArmComputePadStrideInfo(descriptor);
    const arm_compute::Size2D aclDilationInfo = BuildArmComputeSize2D(
            descriptor.m_DilationX,
            descriptor.m_DilationY);

    const arm_compute::ActivationLayerInfo activationInfo = ConvertActivationDescriptorToAclActivationLayerInfo(
            activationDescriptor);

    return arm_compute::CLDepthwiseConvolutionLayer::validate(&aclInputInfo,
                                                              &aclWeightsInfo,
                                                              optionalAclBiasesInfo,
                                                              &aclOutputInfo,
                                                              aclPadStrideInfo,
                                                              aclDepthMultiplier,
                                                              activationInfo,
                                                              aclDilationInfo);
}

87

Matthew Bentham

2018-10-08 09:38:55 +0100

[diff] [blame]

88

/// Builds and configures the ACL CLDepthwiseConvolutionLayer for this workload.
///
/// @param descriptor       Queue descriptor carrying the convolution parameters and tensor handles.
/// @param info             Workload info; its input/output tensor infos are reported for profiling.
/// @param clCompileContext Compile context handed to the ACL layer's configure() call.
ClDepthwiseConvolutionWorkload::ClDepthwiseConvolutionWorkload(
    const DepthwiseConvolution2dQueueDescriptor& descriptor,
    const WorkloadInfo& info,
    const arm_compute::CLCompileContext& clCompileContext)
    : ClBaseWorkload<DepthwiseConvolution2dQueueDescriptor>(descriptor, info)
{
    // Gather the tensor infos that accompany the profiling report.
    WorkloadInfo profilingDetails;
    profilingDetails.m_InputTensorInfos  = info.m_InputTensorInfos;
    profilingDetails.m_OutputTensorInfos = info.m_OutputTensorInfos;
    profilingDetails.m_WeightsTensorInfo =
        armnn::Optional<armnn::TensorInfo>(descriptor.m_Weight->GetTensorInfo());
    if (descriptor.m_Parameters.m_BiasEnabled)
    {
        profilingDetails.m_BiasTensorInfo =
            armnn::Optional<armnn::TensorInfo>(descriptor.m_Bias->GetTensorInfo());
    }

    // Report Profiling Details
    ARMNN_REPORT_PROFILING_WORKLOAD_DESC("ClDepthwiseConvolutionWorkload_Construct",
                                         descriptor.m_Parameters,
                                         profilingDetails,
                                         GetGuid());

    m_Data.ValidateInputsOutputs("ClDepthwiseConv2dWorkload", descriptor.m_Parameters.GetNumInputs(), 1);

    const auto& params = m_Data.m_Parameters;

    // Input 0 is the data tensor and input 1 the weights; the bias, when enabled, is input 2.
    arm_compute::ICLTensor& inputTensor =
        PolymorphicDowncast<IClTensorHandle*>(m_Data.m_Inputs[0])->GetTensor();
    arm_compute::ICLTensor& outputTensor =
        PolymorphicDowncast<IClTensorHandle*>(m_Data.m_Outputs[0])->GetTensor();
    arm_compute::ICLTensor& weightsTensor =
        PolymorphicDowncast<IClTensorHandle*>(m_Data.m_Inputs[1])->GetTensor();

    // The PermuteDepthwiseConv2dWeights backend optimization has been performed,
    // converting weights to have the same data layout as input.
    auto weightsShape = weightsTensor.info()->tensor_shape();
    auto inputShape   = inputTensor.info()->tensor_shape();
    unsigned int depthMultiplier =
        ComputeDepthwiseConv2dDepthMultiplier(params.m_DataLayout, weightsShape, inputShape);

    arm_compute::ICLTensor* biasTensor = params.m_BiasEnabled
        ? &PolymorphicDowncast<IClTensorHandle*>(m_Data.m_Inputs[2])->GetTensor()
        : nullptr;

    const arm_compute::Size2D dilation = BuildArmComputeSize2D(params.m_DilationX, params.m_DilationY);

    // Stamp the ACL data layout onto the input, weights and output tensor infos.
    arm_compute::DataLayout aclLayout = ConvertDataLayout(params.m_DataLayout);
    inputTensor.info()->set_data_layout(aclLayout);
    weightsTensor.info()->set_data_layout(aclLayout);
    outputTensor.info()->set_data_layout(aclLayout);

    arm_compute::PadStrideInfo padStride = BuildArmComputePadStrideInfo(params);

    const arm_compute::ActivationLayerInfo fusedActivation =
        ConvertAdditionalInfoToAclActivationLayerInfo(descriptor);

    m_DepthwiseConvolutionLayer = std::make_unique<arm_compute::CLDepthwiseConvolutionLayer>();

    {
        ARMNN_SCOPED_PROFILING_EVENT(Compute::Undefined, "ClDepthwiseConvolutionWorkload_configure");
        auto* aclLayer =
            static_cast<arm_compute::CLDepthwiseConvolutionLayer*>(m_DepthwiseConvolutionLayer.get());
        aclLayer->configure(clCompileContext,
                            &inputTensor,
                            &weightsTensor,
                            biasTensor,
                            &outputTensor,
                            padStride,
                            depthMultiplier,
                            fusedActivation,
                            dilation);
    }

    ARMNN_ASSERT(m_DepthwiseConvolutionLayer);
}

162

Matthew Bentham

2018-10-08 09:38:55 +0100

[diff] [blame]

163

void ClDepthwiseConvolutionWorkload::Execute() const

164

{

Cathal Corbett

2022-05-11 20:12:17 +0100

[diff] [blame]

165

ARMNN_SCOPED_PROFILING_EVENT_CL_GUID("ClDepthwiseConvolutionWorkload_Execute", GetGuid());

Narumol Prangnawarat

ac2770a

2020-04-01 16:51:23 +0100

[diff] [blame]

166

ARMNN_ASSERT(m_DepthwiseConvolutionLayer);

Matthew Bentham

2018-10-08 09:38:55 +0100

[diff] [blame]

167

Aron Virginas-Tar

a8e06ed

2018-10-19 16:46:15 +0100

[diff] [blame]

168

RunClFunction(*m_DepthwiseConvolutionLayer, CHECK_LOCATION());

Matthew Bentham

2018-10-08 09:38:55 +0100

[diff] [blame]

169

}

telsoa01