Blame - src/gpu/cl/operators/ClGemmConv2d.h - ml/ComputeLibrary

* Data type supported: Same as @p src or QASYMM8/QSYMM8_PER_CHANNEL when @p src is QASYMM8 or QASYMM8_SIGNED/QSYMM8_PER_CHANNEL when @p src is QASYMM8_SIGNED.

96

* @param[in] biases Biases tensor info. Shared biases supported. Biases are 1D tensor with dimensions [OFM].

97

* Data type supported: Should match @p src data type, except for input of quantized type where biases should be of S32 type.

98

* @param[out] dst Destination tensor info. 3 lower dimensions represent a single output [width, height, OFM], while the rest represent batch of outputs.

99

* Data types supported: Same as @p src.

100

* @param[in] conv2d_info Contains convolution 2d info described in @ref Conv2dInfo.

101

* @param[in] weights_info Specifies if the weights tensor has been reshaped with ClWeightsReshapeKernel. If this is not part of the fully connected layer the weights

102

* tensor has also been transposed with CLGEMMReshapeRHSMatrixKernel. Data type supported: Same as @p src.

103

*/

Felix Thomasmathibalan

afd38f0

2023-09-27 17:46:17 +0100

[diff] [blame]

104

void configure(const ClCompileContext &compile_context,

105

ITensorInfo *src,

106

ITensorInfo *weights,

107

ITensorInfo *biases,

108

ITensorInfo *dst,

109

const Conv2dInfo &conv2d_info,

110

const WeightsInfo &weights_info = WeightsInfo());

Manuel Bottini

d87aded

2021-07-16 10:23:31 +0100

[diff] [blame]

111

/** Static function to check if given info will lead to a valid configuration

112

*

113

* Similar to ClGemmConv2d::configure()

114

*

115

* @return a status

116

*/

Felix Thomasmathibalan

afd38f0

2023-09-27 17:46:17 +0100

[diff] [blame]

117

static Status validate(const ITensorInfo *input,

118

const ITensorInfo *weights,

119

const ITensorInfo *biases,

120

const ITensorInfo *output,

121

const Conv2dInfo &conv2d_info,

Manuel Bottini

d87aded

2021-07-16 10:23:31 +0100

[diff] [blame]

122

const WeightsInfo &weights_info = WeightsInfo());

123

124

// Inherited methods overridden:

Jakub Sujak

0d27b2e

2023-08-24 14:01:20 +0100

[diff] [blame]

125

void run(ITensorPack &tensors) override;

126

void prepare(ITensorPack &constants) override;

Manuel Bottini

d87aded

2021-07-16 10:23:31 +0100

[diff] [blame]

127

experimental::MemoryRequirements workspace() const override;

128

129

private:

130

/** Configures the appropriate matrix multiply routine

131

*

132

* @param[in] compile_context The compile context to be used.

133

* @param[in] src Input tensor info. Data types supported: QASYMM8/QASYMM8_SIGNED/F16/F32.

134

* @param[in] weights Weights tensor info. Data type supported: Same as @p src or QASYMM8/QSYMM8_PER_CHANNEL when @p src is QASYMM8 or

135

* QASYMM8_SIGNED/QSYMM8_PER_CHANNEL when @p src is QASYMM8_SIGNED.

136

* @param[in] biases Biases tensor info. Shared biases supported. Biases are 1D tensor with dimensions [OFM].

137

* Data type supported: Should match @p src data type, except for input of quantized type where biases should be of S32 type.

138

* @param[in, out] dst Output tensor info. Data types supported: same as @p src.

139

* @param[in] gemmlowp_output_stage GEMMLowp output stage info

140

* @param[in] gemm_3d_depth Depth of GEMM 3D

141

* @param[in] act_info Activation to apply after the matrix multiplication

142

*/

Felix Thomasmathibalan

afd38f0

2023-09-27 17:46:17 +0100

[diff] [blame]

143

void configure_mm(const CLCompileContext &compile_context,

144

const ITensorInfo *src,

145

ITensorInfo *weights,

146

ITensorInfo *biases,

147

ITensorInfo *dst,

Manuel Bottini

d87aded

2021-07-16 10:23:31 +0100

[diff] [blame]

148

const GEMMLowpOutputStageInfo &gemmlowp_output_stage,

Felix Thomasmathibalan

afd38f0

2023-09-27 17:46:17 +0100

[diff] [blame]

149

int gemm_3d_depth,

150

const ActivationLayerInfo &act_info);

Manuel Bottini

d87aded

2021-07-16 10:23:31 +0100

[diff] [blame]

151

/** Static function to check if given info will lead to a valid configuration of @ref ClGemmConv2d matrix multiply routines

152

*

153

* @param[in] src Input tensor info. Data types supported: QASYMM8/QASYMM8_SIGNED/F16/F32.

154

* @param[in] weights Weights tensor info. Data type supported: Same as @p src or QASYMM8/QSYMM8_PER_CHANNEL when @p src is QASYMM8 or

155

* QASYMM8_SIGNED/QSYMM8_PER_CHANNEL when @p src is QASYMM8_SIGNED.

156

* @param[in] biases Biases tensor info. Shared biases supported. Biases are 1D tensor with dimensions [OFM].

157

* Data type supported: Should match @p src data type, except for input of quantized type where biases should be of S32 type.

158

* @param[in] dst Output tensor info. Data types supported: same as @p src.

159

* @param[in] gemmlowp_output_stage GEMMLowp output stage info

160

* @param[in] gemm_3d_depth Depth of GEMM 3D

161

* @param[in] skip_im2col Flag which specifies if im2col has to be skipped. i.e. 1x1 convolution with NHWC data layout.

162

* @param[in] act_info Activation to apply after the matrix multiplication

163

*

164

* @return a status

165

*/

Felix Thomasmathibalan

afd38f0

2023-09-27 17:46:17 +0100

[diff] [blame]

166

static Status validate_mm(const ITensorInfo *src,

167

const ITensorInfo *weights,

168

const ITensorInfo *biases,

169

const ITensorInfo *dst,

170

const GEMMLowpOutputStageInfo &gemmlowp_output_stage,

171

int gemm_3d_depth,

172

bool skip_im2col,

173

const ActivationLayerInfo &act_info);

Manuel Bottini

d87aded

2021-07-16 10:23:31 +0100

[diff] [blame]

/** Index values for the auxiliary tensors declared by this operator.
 *
 * The numbering starts at 8 rather than 0. Per the original note,
 * ClGemmLowpMatrixMultiplyCore has up to 7 internal tensors.
 * NOTE(review): presumably the lower indices are left free for those
 * internal tensors - confirm against ClGemmLowpMatrixMultiplyCore.
 */
enum AuxTensorIdx
{
    Im2ColOutput    = 8,  /**< First auxiliary index used by this operator */
    WeightsReshaped = 9,  /**< Im2ColOutput + 1 */
    GemmOutput      = 10, /**< Im2ColOutput + 2 */
    Count           = 11  /**< One past the last auxiliary index */
};

std::unique_ptr<kernels::ClWeightsReshapeKernel> _weights_reshape_kernel;

185

std::unique_ptr<kernels::ClIm2ColKernel> _im2col_kernel;

186

std::unique_ptr<ClGemm> _mm_gemm;

187

std::unique_ptr<ClGemmLowpMatrixMultiplyCore> _mm_gemmlowp;

188

std::unique_ptr<opencl::kernels::ClCol2ImKernel> _col2im_kernel;

189

std::unique_ptr<kernels::ClActivationKernel> _activation_kernel;

190

191

TensorInfo _im2col_output;

192

TensorInfo _weights_reshaped;

193

TensorInfo _gemm_output;

bool _skip_im2col;

bool _skip_col2im;

bool _is_quantized;

bool _fuse_activation;

bool _append_bias;

bool _is_prepared;

experimental::MemoryRequirements _aux_mem;

203

};

204

} // namespace opencl

205

} // namespace arm_compute

Jakub Sujak

0d27b2e

2023-08-24 14:01:20 +0100

[diff] [blame]

206

#endif // ACL_SRC_GPU_CL_OPERATORS_CLGEMMCONV2D_H