Blame - arm_compute/runtime/NEON/functions/NEDepthwiseConvolutionLayer.h - ml/ComputeLibrary

2017-10-18 17:58:22 +0100

[diff] [blame]

1

/*

Georgios Pinitas

f72f936

2018-01-12 16:29:45 +0000

[diff] [blame]

2

Michalis Spyrou

2017-10-18 17:58:22 +0100

[diff] [blame]

3

*

4

* SPDX-License-Identifier: MIT

5

*

6

* Permission is hereby granted, free of charge, to any person obtaining a copy

7

* of this software and associated documentation files (the "Software"), to

8

* deal in the Software without restriction, including without limitation the

9

* rights to use, copy, modify, merge, publish, distribute, sublicense, and/or

10

* sell copies of the Software, and to permit persons to whom the Software is

11

* furnished to do so, subject to the following conditions:

12

*

13

* The above copyright notice and this permission notice shall be included in all

14

* copies or substantial portions of the Software.

15

*

16

* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR

17

* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,

18

* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE

19

* AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER

20

* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,

21

* OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE

22

* SOFTWARE.

23

*/

24

#ifndef __ARM_COMPUTE_NEDEPTHWISECONVOLUTION_H__

25

#define __ARM_COMPUTE_NEDEPTHWISECONVOLUTION_H__

26

Giorgio Arena

2017-11-23 11:45:24 +0000

[diff] [blame]

27

#include "arm_compute/core/NEON/kernels/NEDepthwiseConvolutionLayer3x3Kernel.h"

Michalis Spyrou

2017-11-23 12:10:21 +0000

[diff] [blame]

28

#include "arm_compute/core/NEON/kernels/NEDepthwiseIm2ColKernel.h"

29

#include "arm_compute/core/NEON/kernels/NEDepthwiseVectorToTensorKernel.h"

30

#include "arm_compute/core/NEON/kernels/NEDepthwiseWeightsReshapeKernel.h"

Michalis Spyrou

b91e34c

2017-12-20 15:50:55 +0000

[diff] [blame]

31

#include "arm_compute/core/NEON/kernels/NEDirectConvolutionLayerOutputStageKernel.h"

Michalis Spyrou

2017-10-18 17:58:22 +0100

[diff] [blame]

32

#include "arm_compute/core/NEON/kernels/NEFillBorderKernel.h"

Michalis Spyrou

2017-11-23 12:10:21 +0000

[diff] [blame]

33

#include "arm_compute/core/NEON/kernels/NEGEMMMatrixVectorMultiplyKernel.h"

Michalis Spyrou

2017-10-18 17:58:22 +0100

[diff] [blame]

34

#include "arm_compute/core/Types.h"

35

#include "arm_compute/runtime/IFunction.h"

36

#include "arm_compute/runtime/IMemoryManager.h"

37

#include "arm_compute/runtime/MemoryGroup.h"

Georgios Pinitas

284cfe2

2018-02-13 12:15:13 +0000

[diff] [blame]

38

#include "arm_compute/runtime/NEON/functions/NEPermute.h"

Michalis Spyrou

2017-10-18 17:58:22 +0100

[diff] [blame]

39

#include "arm_compute/runtime/Tensor.h"

40

41

namespace arm_compute

{

class ITensor;

/** Basic function to execute a depthwise convolution for kernel size 3x3xC. This function calls the following NEON kernels:

46

*

Giorgio Arena

2017-11-23 11:45:24 +0000

[diff] [blame]

47

* -# @ref NEDepthwiseConvolutionLayer3x3Kernel

Michalis Spyrou

2017-10-18 17:58:22 +0100

[diff] [blame]

48

* -# @ref NEFillBorderKernel (if pad_x or pad_y > 0)

49

*

50

*/

Giorgio Arena

2017-11-23 11:45:24 +0000

[diff] [blame]

51

class NEDepthwiseConvolutionLayer3x3 : public IFunction

Michalis Spyrou

2017-10-18 17:58:22 +0100

[diff] [blame]

52

{

53

public:

54

/** Default constructor */

Giorgio Arena

2017-11-23 11:45:24 +0000

[diff] [blame]

55

NEDepthwiseConvolutionLayer3x3();

Michalis Spyrou

2017-10-18 17:58:22 +0100

[diff] [blame]

56

/** Initialize the function's source, destination, kernels and border_size.

57

*

Georgios Pinitas

2018-01-22 16:29:17 +0000

[diff] [blame]

58

* @param[in, out] input Source tensor. Data type supported: QASYMM8/F32. (Written to only for border filling).

Michalis Spyrou

2017-10-18 17:58:22 +0100

[diff] [blame]

59

* @param[in] weights Weights tensor. These are 3D tensors with shape [3, 3, IFM]. Data type supported: Same as @p input.

60

* @param[in] biases (Optional) Biases tensor. A 1D tensor with shape [IFM]. Must be nullptr if not needed.

61

* Data type supported: Same as @p input.

Giorgio Arena

82afedf

2017-11-15 13:36:15 +0000

[diff] [blame]

62

* @param[out] output Destination tensor. Data type supported: same as @p input.

Michalis Spyrou

2017-10-18 17:58:22 +0100

[diff] [blame]

63

* @param[in] conv_info Padding and stride information to use for the convolution.

64

*/

Giorgio Arena

82afedf

2017-11-15 13:36:15 +0000

[diff] [blame]

65

void configure(ITensor *input, const ITensor *weights, const ITensor *biases, ITensor *output, const PadStrideInfo &conv_info);

Michalis Spyrou

2017-10-18 17:58:22 +0100

[diff] [blame]

66

67

// Inherited methods overridden:

68

void run() override;

69

70

private:

Georgios Pinitas

4074c99

2018-01-30 18:13:46 +0000

[diff] [blame]

71

NEDepthwiseConvolutionLayer3x3Kernel _dwc_kernel;

Michalis Spyrou

b91e34c

2017-12-20 15:50:55 +0000

[diff] [blame]

72

NEDirectConvolutionLayerOutputStageKernel _output_stage_kernel;

73

NEFillBorderKernel _border_handler;

Georgios Pinitas

284cfe2

2018-02-13 12:15:13 +0000

[diff] [blame]

74

NEPermute _permute_input;

75

NEPermute _permute_weights;

76

NEPermute _permute_output;

Georgios Pinitas

f72f936

2018-01-12 16:29:45 +0000

[diff] [blame]

77

Tensor _accumulator;

Georgios Pinitas

4074c99

2018-01-30 18:13:46 +0000

[diff] [blame]

78

Tensor _input_nhwc;

79

Tensor _weights_hwio;

80

Tensor _output_nhwc;

Michalis Spyrou

b91e34c

2017-12-20 15:50:55 +0000

[diff] [blame]

81

bool _has_bias;

Georgios Pinitas

f72f936

2018-01-12 16:29:45 +0000

[diff] [blame]

82

bool _is_quantized;

Georgios Pinitas

4074c99

2018-01-30 18:13:46 +0000

[diff] [blame]

83

bool _is_optimized;

84

bool _are_weights_reshaped;

Giorgio Arena

1ed1fc6

2018-03-26 16:20:05 +0100

[diff] [blame]

85

bool _is_nchw;

86

bool _is_first_run;

Michalis Spyrou

2017-10-18 17:58:22 +0100

[diff] [blame]

87

};

Michalis Spyrou

2017-11-23 12:10:21 +0000

[diff] [blame]

88

Giorgio Arena

3972528

2017-12-12 15:04:43 +0000

[diff] [blame]

89

/** Basic function to execute a generic depthwise convolution. This function calls the following NEON kernels:

Michalis Spyrou

2017-11-23 12:10:21 +0000

[diff] [blame]

90

*

91

* -# @ref NEDepthwiseIm2ColKernel

92

* -# @ref NEDepthwiseWeightsReshapeKernel

93

* -# @ref NEGEMMMatrixVectorMultiplyKernel

94

* -# @ref NEFillBorderKernel (if pad_x or pad_y > 0)

95

*

96

*/

Giorgio Arena

2017-11-23 11:45:24 +0000

[diff] [blame]

97

class NEDepthwiseConvolutionLayer : public IFunction

Michalis Spyrou

2017-11-23 12:10:21 +0000

[diff] [blame]

98

{

99

public:

100

/** Default constructor */

Giorgio Arena

2017-11-23 11:45:24 +0000

[diff] [blame]

101

NEDepthwiseConvolutionLayer();

Georgios Pinitas

1562be3

2018-03-08 19:09:19 +0000

[diff] [blame]

102

/** Prevent instances of this class from being copied (As this class contains pointers) */

103

NEDepthwiseConvolutionLayer(const NEDepthwiseConvolutionLayer &) = delete;

104

/** Default move constructor */

105

NEDepthwiseConvolutionLayer(NEDepthwiseConvolutionLayer &&) = default;

106

/** Prevent instances of this class from being copied (As this class contains pointers) */

107

NEDepthwiseConvolutionLayer &operator=(const NEDepthwiseConvolutionLayer &) = delete;

108

/** Default move assignment operator */

109

NEDepthwiseConvolutionLayer &operator=(NEDepthwiseConvolutionLayer &&) = default;

Michalis Spyrou

2017-11-23 12:10:21 +0000

[diff] [blame]

110

/** Initialize the function's source, destination, weights and convolution information.

111

*

Georgios Pinitas

2018-01-22 16:29:17 +0000

[diff] [blame]

112

* @param[in, out] input Source tensor. Data type supported: QASYMM8/F32. (Written to only for border filling).

Michalis Spyrou

2017-11-23 12:10:21 +0000

[diff] [blame]

113

* @param[out] output Destination tensor. Data type supported: same as @p input.

114

* @param[in] weights Weights tensor. These are 3D tensors with shape [kernel_x, kernel_y, IFM]. Data type supported: Same as @p input.

115

* @param[in] biases (Optional) Biases tensor. A 1D tensor with shape [IFM]. Must be nullptr if not needed.

Georgios Pinitas

de5a1cc

2018-02-02 12:52:07 +0000

[diff] [blame]

116

* Data type supported: Same as @p input, S32 when input is QASYMM8.

Michalis Spyrou

2017-11-23 12:10:21 +0000

[diff] [blame]

117

* @param[in] conv_info Padding and stride information to use for the convolution.

118

*/

119

void configure(ITensor *input, const ITensor *weights, const ITensor *biases, ITensor *output, const PadStrideInfo &conv_info);

120

121

// Inherited methods overridden:

122

void run() override;

123

124

private:

Georgios Pinitas

2018-01-22 16:29:17 +0000

[diff] [blame]

125

NEDepthwiseIm2ColKernel _im2col_kernel;

126

NEDepthwiseWeightsReshapeKernel _weights_reshape_kernel;

127

NEGEMMMatrixVectorMultiplyKernel _v2mm_kernel;

128

NEDepthwiseVectorToTensorKernel _vector_to_tensor_kernel;

129

NEDirectConvolutionLayerOutputStageKernel _output_stage_kernel;

130

NEFillBorderKernel _v2mm_input_fill_border;

131

NEFillBorderKernel _v2mm_weights_fill_border;

132

Tensor _input_reshaped;

133

Tensor _weights_reshaped;

134

Tensor _v2mm_output;

135

Tensor _output_reshaped;

Georgios Pinitas

1562be3

2018-03-08 19:09:19 +0000

[diff] [blame]

136

bool _is_first_run;

Georgios Pinitas

2018-01-22 16:29:17 +0000

[diff] [blame]

137

bool _is_quantized;

Georgios Pinitas

1562be3

2018-03-08 19:09:19 +0000

[diff] [blame]

138

const ITensor *_original_weights;

Michalis Spyrou

2017-11-23 12:10:21 +0000

[diff] [blame]

139

};

Michalis Spyrou