/*
 * Copyright (c) 2017-2021 Arm Limited.
 *
 * SPDX-License-Identifier: MIT
 *
 * Permission is hereby granted, free of charge, to any person obtaining a copy
 * of this software and associated documentation files (the "Software"), to
 * deal in the Software without restriction, including without limitation the
 * rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
 * sell copies of the Software, and to permit persons to whom the Software is
 * furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in all
 * copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
 * SOFTWARE.
 */
#ifndef ARM_COMPUTE_NEDEPTHWISECONVOLUTION_H
#define ARM_COMPUTE_NEDEPTHWISECONVOLUTION_H

#include "arm_compute/runtime/IMemoryManager.h"
#include "arm_compute/runtime/MemoryGroup.h"
#include "arm_compute/runtime/NEON/functions/NEActivationLayer.h"
#include "arm_compute/runtime/NEON/functions/NEPermute.h"
#include <memory>

namespace arm_compute
{
// Forward declarations
class ITensor;
class NEDepthwiseConvolutionLayerNativeKernel;

/** Function to execute a depthwise convolution.
 */
class NEDepthwiseConvolutionLayer : public IFunction
{
public:
    /** Default constructor */
    NEDepthwiseConvolutionLayer(std::shared_ptr<IMemoryManager> memory_manager = nullptr);
    /** Prevent instances of this class from being copied (As this class contains pointers) */
    NEDepthwiseConvolutionLayer(const NEDepthwiseConvolutionLayer &) = delete;
    /** Default move constructor */
    NEDepthwiseConvolutionLayer(NEDepthwiseConvolutionLayer &&) = default;
    /** Prevent instances of this class from being copied (As this class contains pointers) */
    NEDepthwiseConvolutionLayer &operator=(const NEDepthwiseConvolutionLayer &) = delete;
    /** Default move assignment operator */
    NEDepthwiseConvolutionLayer &operator=(NEDepthwiseConvolutionLayer &&) = default;
    /** Default destructor */
    ~NEDepthwiseConvolutionLayer();
    /** Initialize the function's source, destination, weights and convolution information.
     *
     * Valid data layouts:
     * - NHWC
     * - NCHW
     *
     * Valid data type configurations:
     * |src0           |src1               |src2   |dst            |
     * |:--------------|:------------------|:------|:--------------|
     * |F16            |F16                |F16    |F16            |
     * |F32            |F32                |F32    |F32            |
     * |QASYMM8        |QASYMM8            |S32    |QASYMM8        |
     * |QASYMM8        |QSYMM8_PER_CHANNEL |S32    |QASYMM8        |
     * |QASYMM8_SIGNED |QASYMM8_SIGNED     |S32    |QASYMM8_SIGNED |
     * |QASYMM8_SIGNED |QSYMM8_PER_CHANNEL |S32    |QASYMM8_SIGNED |
     *
     * @param[in, out] input            Source tensor. Data type supported: QASYMM8/QASYMM8_SIGNED/F16/F32
     * @param[out]     output           Destination tensor. Data type supported: same as @p input.
     * @param[in]      weights          Weights tensor. These are 3D tensors with shape [kernel_x, kernel_y, IFM].
     *                                  Data type supported: Same as @p input or QASYMM8/QASYMM8_SIGNED/QSYMM8_PER_CHANNEL when @p input is QASYMM8/QASYMM8_SIGNED.
     * @param[in]      biases           Biases tensor. A 1D tensor with shape [IFM]. Must be nullptr if not needed.
     *                                  Data type supported: Same as @p input, S32 when input is QASYMM8/QASYMM8_SIGNED.
     * @param[in]      conv_info        Padding and stride information to use for the convolution.
     * @param[in]      depth_multiplier (Optional) Multiplier to apply to the input's depth in order to retrieve the output's depth. Defaults to 1.
     * @param[in]      act_info         (Optional) Activation layer information in case of a fused activation.
     * @param[in]      dilation         (Optional) Dilation, in elements, across x and y. Defaults to (1, 1).
     */
    void configure(ITensor *input, const ITensor *weights, const ITensor *biases, ITensor *output, const PadStrideInfo &conv_info,
                   unsigned int depth_multiplier = 1, const ActivationLayerInfo &act_info = ActivationLayerInfo(), const Size2D &dilation = Size2D(1U, 1U));
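    // A minimal usage sketch added by the editor (illustrative only, not part of the library
    // documentation); the tensor names, shapes, F32 data type and default NCHW layout below are
    // assumptions chosen for the example:
    //
    //     Tensor src, weights, biases, dst;
    //     src.allocator()->init(TensorInfo(TensorShape(64U, 64U, 16U), 1, DataType::F32));   // [W, H, IFM]
    //     weights.allocator()->init(TensorInfo(TensorShape(3U, 3U, 16U), 1, DataType::F32)); // [kernel_x, kernel_y, IFM]
    //     biases.allocator()->init(TensorInfo(TensorShape(16U), 1, DataType::F32));          // [IFM]
    //     dst.allocator()->init(TensorInfo(TensorShape(62U, 62U, 16U), 1, DataType::F32));   // 3x3 kernel, stride 1, no padding
    //
    //     NEDepthwiseConvolutionLayer depthwise_conv;
    //     depthwise_conv.configure(&src, &weights, &biases, &dst, PadStrideInfo(1, 1, 0, 0));
    //     // ... allocate the tensors and fill src/weights/biases ...
    //     depthwise_conv.run();
    //
    // With depth_multiplier = 1 the output depth equals IFM; a multiplier of M would give an output depth of IFM * M.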

    /** Static function to check if given info will lead to a valid configuration of @ref NEDepthwiseConvolutionLayer
     *
     * @param[in] input            Source tensor. Data type supported: QASYMM8/QASYMM8_SIGNED/F16/F32
     * @param[in] output           Destination tensor. Data type supported: same as @p input.
     * @param[in] weights          Weights tensor. These are 3D tensors with shape [kernel_x, kernel_y, IFM].
     *                             Data type supported: Same as @p input or QASYMM8/QASYMM8_SIGNED/QSYMM8_PER_CHANNEL when @p input is QASYMM8/QASYMM8_SIGNED.
     * @param[in] biases           Biases tensor. A 1D tensor with shape [IFM]. Must be nullptr if not needed.
     *                             Data type supported: Same as @p input, S32 when input is QASYMM8/QASYMM8_SIGNED.
     * @param[in] conv_info        Padding and stride information to use for the convolution.
     * @param[in] depth_multiplier (Optional) Multiplier to apply to the input's depth in order to retrieve the output's depth. Defaults to 1.
     * @param[in] act_info         (Optional) Activation layer information in case of a fused activation.
     * @param[in] dilation         (Optional) Dilation, in elements, across x and y. Defaults to (1, 1).
     *
     * @return a status
     */
    static Status validate(const ITensorInfo *input, const ITensorInfo *weights, const ITensorInfo *biases, const ITensorInfo *output, const PadStrideInfo &conv_info,
                           unsigned int depth_multiplier = 1, const ActivationLayerInfo &act_info = ActivationLayerInfo(), const Size2D &dilation = Size2D(1U, 1U));
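    // A hedged sketch of checking support up front with the static validate() method; the
    // TensorInfo objects mirror the tensors from the configure() sketch above and are equally
    // illustrative assumptions:
    //
    //     const TensorInfo src_info(TensorShape(64U, 64U, 16U), 1, DataType::F32);
    //     const TensorInfo weights_info(TensorShape(3U, 3U, 16U), 1, DataType::F32);
    //     const TensorInfo biases_info(TensorShape(16U), 1, DataType::F32);
    //     const TensorInfo dst_info(TensorShape(62U, 62U, 16U), 1, DataType::F32);
    //
    //     const Status status = NEDepthwiseConvolutionLayer::validate(&src_info, &weights_info, &biases_info, &dst_info,
    //                                                                 PadStrideInfo(1, 1, 0, 0));
    //     if(status.error_code() != ErrorCode::OK)
    //     {
    //         // The configuration is not supported; status.error_description() explains why.
    //     }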

    // Inherited methods overridden:
    void run() override;
    void prepare() override;

private:
    /** Basic function to execute optimized depthwise convolution routines. This function calls the following kernels:
     *
     * @note At the moment only 3x3 and 5x5 convolutions with stride 1 or 2 are supported
     *
     * -# @ref NEFillBorderKernel (if pad_x or pad_y > 0 and no assembly kernel implementation is present)
     * -# @ref NEDepthwiseConvolutionLayer3x3Kernel if 3x3 and no assembly kernel implementation is present
     * -# @ref NEDepthwiseConvolutionAssemblyDispatch if assembly kernel implementation is present
     * -# @ref NEDirectConvolutionLayerOutputStageKernel if re-quantization of output is required
     * -# @ref NEActivationLayer if fused activation is required
     *
     */
    class NEDepthwiseConvolutionLayerOptimizedInternal : public IFunction
    {
    public:
        /** Default constructor */
        NEDepthwiseConvolutionLayerOptimizedInternal(std::shared_ptr<IMemoryManager> memory_manager = nullptr);
        /** Prevent instances of this class from being copied (As this class contains pointers) */
        NEDepthwiseConvolutionLayerOptimizedInternal(const NEDepthwiseConvolutionLayerOptimizedInternal &) = delete;
        /** Default move constructor */
        NEDepthwiseConvolutionLayerOptimizedInternal(NEDepthwiseConvolutionLayerOptimizedInternal &&) = default;
        /** Prevent instances of this class from being copied (As this class contains pointers) */
        NEDepthwiseConvolutionLayerOptimizedInternal &operator=(const NEDepthwiseConvolutionLayerOptimizedInternal &) = delete;
        /** Default move assignment operator */
        NEDepthwiseConvolutionLayerOptimizedInternal &operator=(NEDepthwiseConvolutionLayerOptimizedInternal &&) = default;
        /** Default destructor */
        ~NEDepthwiseConvolutionLayerOptimizedInternal() = default;
        /** Initialize the function's source, destination, kernels and border_size.
         *
         * @param[in, out] input            Source tensor. Data type supported: QASYMM8/QASYMM8_SIGNED/F16/F32. (Written to only for border filling).
         * @param[in]      weights          Weights tensor. These are 3D tensors with shape [kernel_x, kernel_y, IFM]. Data type supported: Same as @p input.
         * @param[in]      biases           Biases tensor. A 1D tensor with shape [IFM]. Must be nullptr if not needed.
         *                                  Data type supported: Same as @p input, S32 when input is QASYMM8/QASYMM8_SIGNED.
         * @param[out]     output           Destination tensor. Data type supported: same as @p input.
         * @param[in]      conv_info        Padding and stride information to use for the convolution.
         * @param[in]      depth_multiplier (Optional) Multiplier to apply to the input's depth in order to retrieve the output's depth. Defaults to 1.
         * @param[in]      act_info         (Optional) Activation layer information in case of a fused activation.
         * @param[in]      dilation         (Optional) Dilation, in elements, across x and y. Defaults to (1, 1).
         */
        void configure(ITensor *input, const ITensor *weights, const ITensor *biases, ITensor *output, const PadStrideInfo &conv_info,
                       unsigned int depth_multiplier = 1, const ActivationLayerInfo &act_info = ActivationLayerInfo(), const Size2D &dilation = Size2D(1U, 1U));

        /** Static function to check if given info will lead to a valid configuration of @ref NEDepthwiseConvolutionLayerOptimizedInternal
         *
         * @param[in] input            Source tensor. Data type supported: QASYMM8/QASYMM8_SIGNED/F16/F32. (Written to only for border filling).
         * @param[in] weights          Weights tensor. These are 3D tensors with shape [kernel_x, kernel_y, IFM]. Data type supported: Same as @p input.
         * @param[in] biases           Biases tensor. A 1D tensor with shape [IFM]. Must be nullptr if not needed.
         *                             Data type supported: Same as @p input, S32 when input is QASYMM8/QASYMM8_SIGNED.
         * @param[in] output           Destination tensor. Data type supported: same as @p input.
         * @param[in] conv_info        Padding and stride information to use for the convolution.
         * @param[in] depth_multiplier (Optional) Multiplier to apply to the input's depth in order to retrieve the output's depth. Defaults to 1.
         * @param[in] act_info         (Optional) Activation layer information in case of a fused activation.
         * @param[in] dilation         (Optional) Dilation, in elements, across x and y. Defaults to (1, 1).
         *
         * @return a status
         */
        static Status validate(const ITensorInfo *input, const ITensorInfo *weights, const ITensorInfo *biases, const ITensorInfo *output, const PadStrideInfo &conv_info,
                               unsigned int depth_multiplier = 1, const ActivationLayerInfo &act_info = ActivationLayerInfo(), const Size2D &dilation = Size2D(1U, 1U));

        // Inherited methods overridden:
        void run() override;
        void prepare() override;

    private:
        MemoryGroup _memory_group;
        struct Impl;
        std::unique_ptr<Impl> _impl;
    };

    /** Basic function to execute a generic depthwise convolution. This function calls the following kernel:
     *
     * -# @ref NEDepthwiseConvolutionLayerNativeKernel
     *
     */
    class NEDepthwiseConvolutionLayerGeneric : public IFunction
    {
    public:
        /** Default constructor */
        NEDepthwiseConvolutionLayerGeneric();
        /** Prevent instances of this class from being copied (As this class contains pointers) */
        NEDepthwiseConvolutionLayerGeneric(const NEDepthwiseConvolutionLayerGeneric &) = delete;
        /** Default move constructor */
        NEDepthwiseConvolutionLayerGeneric(NEDepthwiseConvolutionLayerGeneric &&) = default;
        /** Prevent instances of this class from being copied (As this class contains pointers) */
        NEDepthwiseConvolutionLayerGeneric &operator=(const NEDepthwiseConvolutionLayerGeneric &) = delete;
        /** Default move assignment operator */
        NEDepthwiseConvolutionLayerGeneric &operator=(NEDepthwiseConvolutionLayerGeneric &&) = default;
        /** Default destructor */
        ~NEDepthwiseConvolutionLayerGeneric() = default;
        /** Initialize the function's source, destination, weights and convolution information.
         *
         * @param[in, out] input            Source tensor. Data type supported: QASYMM8/QASYMM8_SIGNED/F16/F32. (Written to only for border filling).
         * @param[out]     output           Destination tensor. Data type supported: same as @p input.
         * @param[in]      weights          Weights tensor. These are 3D tensors with shape [kernel_x, kernel_y, IFM].
         *                                  Data type supported: Same as @p input or QASYMM8/QASYMM8_SIGNED/QSYMM8_PER_CHANNEL when @p input is QASYMM8/QASYMM8_SIGNED.
         * @param[in]      biases           Biases tensor. A 1D tensor with shape [IFM]. Must be nullptr if not needed.
         *                                  Data type supported: Same as @p input, S32 when input is QASYMM8/QASYMM8_SIGNED.
         * @param[in]      conv_info        Padding and stride information to use for the convolution.
         * @param[in]      depth_multiplier (Optional) Multiplier to apply to the input's depth in order to retrieve the output's depth. Defaults to 1.
         * @param[in]      act_info         (Optional) Activation layer information in case of a fused activation.
         * @param[in]      dilation         (Optional) Dilation, in elements, across x and y. Defaults to (1, 1).
         */
        void configure(ITensor *input, const ITensor *weights, const ITensor *biases, ITensor *output, const PadStrideInfo &conv_info,
                       unsigned int depth_multiplier = 1, const ActivationLayerInfo &act_info = ActivationLayerInfo(), const Size2D &dilation = Size2D(1U, 1U));

        /** Static function to check if given info will lead to a valid configuration of @ref NEDepthwiseConvolutionLayerGeneric
         *
         * @param[in] input            Source tensor. Data type supported: QASYMM8/QASYMM8_SIGNED/F16/F32. (Written to only for border filling).
         * @param[in] output           Destination tensor. Data type supported: same as @p input.
         * @param[in] weights          Weights tensor. These are 3D tensors with shape [kernel_x, kernel_y, IFM].
         *                             Data type supported: Same as @p input or QASYMM8/QASYMM8_SIGNED/QSYMM8_PER_CHANNEL when @p input is QASYMM8/QASYMM8_SIGNED.
         * @param[in] biases           Biases tensor. A 1D tensor with shape [IFM]. Must be nullptr if not needed.
         *                             Data type supported: Same as @p input, S32 when input is QASYMM8/QASYMM8_SIGNED.
         * @param[in] conv_info        Padding and stride information to use for the convolution.
         * @param[in] depth_multiplier (Optional) Multiplier to apply to the input's depth in order to retrieve the output's depth. Defaults to 1.
         * @param[in] act_info         (Optional) Activation layer information in case of a fused activation.
         * @param[in] dilation         (Optional) Dilation, in elements, across x and y. Defaults to (1, 1).
         *
         * @return a status
         */
        static Status validate(const ITensorInfo *input, const ITensorInfo *weights, const ITensorInfo *biases, const ITensorInfo *output, const PadStrideInfo &conv_info,
                               unsigned int depth_multiplier = 1, const ActivationLayerInfo &act_info = ActivationLayerInfo(), const Size2D &dilation = Size2D(1U, 1U));

        // Inherited methods overridden:
        void run() override;

    private:
        struct Impl;
        std::unique_ptr<Impl> _impl;
    };
    MemoryGroup _memory_group;
    struct Impl;
    std::unique_ptr<Impl> _impl;
};
} // namespace arm_compute
#endif /* ARM_COMPUTE_NEDEPTHWISECONVOLUTION_H */