//
// Copyright © 2024 Arm Ltd and Contributors. All rights reserved.
// SPDX-License-Identifier: MIT
//

#include "GpuFsaConvolution2d.hpp"

#include <armnn/Types.hpp>

#include <aclCommon/ArmComputeTensorUtils.hpp>

#include <arm_compute/core/ITensorInfo.h>
#include <arm_compute/core/TensorInfo.h>
#include <arm_compute/core/TensorShape.h>
#include <arm_compute/core/CL/CLKernelLibrary.h>
#include <arm_compute/core/CL/CLCompileContext.h>

#include <arm_compute/dynamic_fusion/runtime/gpu/cl/ClWorkloadRuntime.h>
#include <arm_compute/dynamic_fusion/sketch/gpu/GpuWorkloadContext.h>
#include <arm_compute/dynamic_fusion/sketch/gpu/operators/GpuConv2d.h>
#include <arm_compute/dynamic_fusion/sketch/gpu/operators/GpuOutput.h>

#include <vector>
#include <iostream>

namespace armnn
{

using namespace armcomputetensorutils;

arm_compute::Status GpuFsaConvolution2dValidate(const TensorInfo& input,
                                                const Convolution2dDescriptor& descriptor,
                                                const TensorInfo& weights,
                                                const Optional<TensorInfo>& biases)
{
    // Create a new workload sketch, for validation purposes
    auto compileCtx = arm_compute::CLKernelLibrary::get().get_compile_context();
    auto workloadContext = GpuWorkloadContext(&compileCtx);
    GpuWorkloadSketch sketch{ &workloadContext };

    // Build and create tensor infos using the sketch
    const arm_compute::TensorInfo aclInputInfo = BuildArmComputeTensorInfo(input, descriptor.m_DataLayout);
    arm_compute::TensorInfo aclWeightsInfo = BuildArmComputeTensorInfo(weights, descriptor.m_DataLayout);
    aclWeightsInfo.set_are_values_constant(weights.IsConstant());

    auto inputInfo = workloadContext.create_tensor_info(aclInputInfo);
    auto weightInfo = workloadContext.create_tensor_info(aclWeightsInfo);

    // Only create the bias tensor info if enabled, otherwise pass nullptr to validate_op
    arm_compute::TensorInfo aclBiasInfo;
    arm_compute::ITensorInfo* biasSketchInfoPtr = nullptr;

    if (descriptor.m_BiasEnabled)
    {
        if (!biases.has_value())
        {
            throw InvalidArgumentException("GpuFsaConvolution2d::ValidateOp: No biases set when biases are enabled");
        }
        aclBiasInfo = BuildArmComputeTensorInfo(biases.value(), descriptor.m_DataLayout);
        aclBiasInfo.set_are_values_constant(biases.value().IsConstant());

        biasSketchInfoPtr = workloadContext.create_tensor_info(aclBiasInfo);
    }

    // Set Conv2d attributes using descriptor
    const arm_compute::Size2D aclDilationInfo = BuildArmComputeSize2D(descriptor.m_DilationX,
                                                                      descriptor.m_DilationY);
    const arm_compute::Padding2D aclPadInfo = BuildArmComputePaddingInfo(descriptor);
    const arm_compute::Size2D aclStrideInfo = BuildArmComputeSize2D(descriptor.m_StrideX, descriptor.m_StrideY);

    Conv2dAttributes conv2DAttributes{};
    conv2DAttributes.dilation(aclDilationInfo);
    conv2DAttributes.pad(aclPadInfo);
    conv2DAttributes.stride(aclStrideInfo);

    // Validate the operator and return the resulting status
    arm_compute::Status aclStatus = GpuConv2d::validate_op(sketch,
                                                           inputInfo,
                                                           weightInfo,
                                                           biasSketchInfoPtr,
                                                           conv2DAttributes);

    return aclStatus;
}

void GpuFsaConvolution2dCreateOp(GpuFsaPreCompiledBlob* blob,
                                 const TensorInfo& input,
                                 const Convolution2dDescriptor& descriptor,
                                 const TensorInfo& weights,
                                 const Optional<TensorInfo>& biases)
{
/*
 * Creating an Op for the GpuFsa backend requires us to create and maintain quite a bit of data, which is then stored
 * in a GpuFsaPreCompiledBlob for execution later. Specifically we need:
 * - A GpuWorkloadContext: this contains the TensorInfos and is unique to the Graph being executed.
 * - A Sketch: this is similar to a subgraph and can contain one or more operations. Multiple ops can be "fused"
 *   together using a single sketch.
 * - The inputTensorInfos / outputTensorInfos: these are pointers to the TensorInfos used when creating the sketch.
 *   They refer to the TensorInfos stored within the GpuWorkloadContext and are needed when executing the sketch,
 *   as the TensorInfos used when creating the Tensors must match those used to create the Sketch; otherwise the
 *   runtime doesn't know which Tensors to use.
 */
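/*
 * For reference, a rough sketch of how a blob populated here might be consumed at execution time. This is an
 * illustration only (it assumes Compute Library's dynamic fusion ClWorkloadRuntime interface and a hypothetical
 * `tensors` vector of CLTensor pointers bound in the same order as the stored TensorInfos); the actual GpuFsa
 * workload implementation may differ:
 *
 *     arm_compute::experimental::dynamic_fusion::ClWorkloadRuntime runtime;
 *     runtime.configure(*blob->sketch);   // Compile the fused sketch into a runnable CL workload
 *     // ... create and allocate CLTensors matching blob->inputTensorInfos and blob->outputTensorInfos ...
 *     runtime.run(tensors);               // Execute, binding the tensors to the stored TensorInfos
 */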
    using namespace arm_compute::experimental::dynamic_fusion;
    GpuWorkloadSketch* sketch = blob->sketch.get();
    GpuWorkloadContext* workloadContext = blob->workloadContext.get();
    std::vector<arm_compute::ITensorInfo*> inputTensorInfos = {};
    std::vector<arm_compute::ITensorInfo*> outputTensorInfos = {};

    // Build and create tensor infos using the sketch
    const arm_compute::TensorInfo aclInputInfo = BuildArmComputeTensorInfo(input, descriptor.m_DataLayout);
    arm_compute::TensorInfo aclWeightsInfo = BuildArmComputeTensorInfo(weights, descriptor.m_DataLayout);
    aclWeightsInfo.set_are_values_constant(weights.IsConstant());

    inputTensorInfos.emplace_back(workloadContext->create_tensor_info(aclInputInfo));
    inputTensorInfos.emplace_back(workloadContext->create_tensor_info(aclWeightsInfo));

    // Only create the bias tensor info if enabled, otherwise pass nullptr to validate_op / create_op
    arm_compute::TensorInfo aclBiasInfo;
    arm_compute::ITensorInfo* biasSketchInfoPtr = nullptr;

    if (descriptor.m_BiasEnabled)
    {
        if (!biases.has_value())
        {
            throw InvalidArgumentException("GpuFsaConvolution2d::CreateOp: No biases set when biases are enabled");
        }
        aclBiasInfo = BuildArmComputeTensorInfo(biases.value(), descriptor.m_DataLayout);
        aclBiasInfo.set_are_values_constant(biases.value().IsConstant());

        inputTensorInfos.emplace_back(workloadContext->create_tensor_info(aclBiasInfo));
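        // The inputs are stored in the order [input, weights, bias], so the bias info (when present) always
        // sits at index 2 of inputTensorInfos.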
        biasSketchInfoPtr = inputTensorInfos[2];
    }

    // Set Conv2d attributes using descriptor
    const arm_compute::Size2D aclDilationInfo = BuildArmComputeSize2D(descriptor.m_DilationX,
                                                                      descriptor.m_DilationY);
    const arm_compute::Padding2D aclPadInfo = BuildArmComputePaddingInfo(descriptor);
    const arm_compute::Size2D aclStrideInfo = BuildArmComputeSize2D(descriptor.m_StrideX, descriptor.m_StrideY);

    Conv2dAttributes conv2DAttributes{};
    conv2DAttributes.dilation(aclDilationInfo);
    conv2DAttributes.pad(aclPadInfo);
    conv2DAttributes.stride(aclStrideInfo);

    // Validate the operator and check the status before creating the op within the sketch
    arm_compute::Status aclStatus = GpuConv2d::validate_op(*sketch,
                                                           inputTensorInfos[0],
                                                           inputTensorInfos[1],
                                                           biasSketchInfoPtr,
                                                           conv2DAttributes);

    const bool supported = (aclStatus.error_code() == arm_compute::ErrorCode::OK);
    if (!supported)
    {
        throw BackendCapabilityException("\"GpuFsa\" backend failed during Convolution2D operation validation");
    }

    // Create the Op within the Sketch using the TensorInfos we have stored
    arm_compute::ITensorInfo* convOutInfo = GpuConv2d::create_op(*sketch,
                                                                 inputTensorInfos[0],
                                                                 inputTensorInfos[1],
                                                                 biasSketchInfoPtr,
                                                                 conv2DAttributes);

    // Create the Output
    outputTensorInfos.emplace_back(workloadContext->create_tensor_info());
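    // The output TensorInfo is created empty here; GpuOutput::create_op below is expected to initialise it
    // (shape, data type, etc.) from convOutInfo when it wires the sketch output to this TensorInfo.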
    GpuOutput::create_op(*sketch, convOutInfo, outputTensorInfos[0]);

    // Store the TensorInfos within the blob as unique_ptrs to be used later
    blob->inputTensorInfos = std::make_unique<std::vector<arm_compute::ITensorInfo*>>(inputTensorInfos);
    blob->outputTensorInfos = std::make_unique<std::vector<arm_compute::ITensorInfo*>>(outputTensorInfos);
}

} // namespace armnn