Blame - src/gpu/cl/operators/ClGemmConv2d.h - ml/ComputeLibrary

*                          Data type supported: Same as @p src or QASYMM8/QSYMM8_PER_CHANNEL when @p src is QASYMM8 or QASYMM8_SIGNED/QSYMM8_PER_CHANNEL when @p src is QASYMM8_SIGNED.
* @param[in]  biases       Biases tensor info. Shared biases supported. Biases are 1D tensor with dimensions [OFM].
*                          Data type supported: Should match @p src data type, except for src of quantized type where biases should be of S32 type.
* @param[out] dst          Destination tensor info. 3 lower dimensions represent a single output [width, height, OFM], while the rest represent batch of outputs.
*                          Data types supported: Same as @p src.
* @param[in]  conv2d_info  Contains convolution 2d info described in @ref Conv2dInfo.
* @param[in]  weights_info Specifies if the weights tensor has been reshaped with CLWeightsReshapeKernel. If this is not part of the fully connected layer the weights
*                          tensor has also been transposed with CLGEMMReshapeRHSMatrixKernel. Data type supported: Same as @p src.
*/

103

void configure(const ClCompileContext &compile_context, ITensorInfo *src, ITensorInfo *weights, ITensorInfo *biases, ITensorInfo *dst, const Conv2dInfo &conv2d_info,

104

const WeightsInfo &weights_info = WeightsInfo());

105

/** Static function to check if given info will lead to a valid configuration
 *
 * Similar to configure(): takes the same arguments minus the compile context.
 * @p input and @p output occupy the positions that configure() names src and dst.
 *
 * @param[in] input        Source tensor info.
 * @param[in] weights      Weights tensor info.
 * @param[in] biases       Biases tensor info.
 * @param[in] output       Destination tensor info.
 * @param[in] conv2d_info  Contains convolution 2d info described in @ref Conv2dInfo.
 * @param[in] weights_info Weights info; defaults to a default-constructed WeightsInfo.
 *
 * @return a status
 */
static Status validate(const ITensorInfo *input, const ITensorInfo *weights, const ITensorInfo *biases, const ITensorInfo *output, const Conv2dInfo &conv2d_info,
                       const WeightsInfo &weights_info = WeightsInfo());

113

114

// Inherited methods overridden:

115

void run(ITensorPack &tensors) override;

116

void prepare(ITensorPack &constants) override;

117

experimental::MemoryRequirements workspace() const override;

118

119

private:

120

/** Configures the appropriate matrix multiply routine

121

*

122

* @param[in] compile_context The compile context to be used.

123

* @param[in] src Input tensor info. Data types supported: QASYMM8/QASYMM8_SIGNED/F16/F32.

124

* @param[in] weights Weights tensor info. Data type supported: Same as @p input or QASYMM8/QSYMM8_PER_CHANNEL when @p input is QASYMM8 or

125

* QASYMM8_SIGNED/QSYMM8_PER_CHANNEL when @p input is QASYMM8_SIGNED.

126

* @param[in] biases Biases tensor info. Shared biases supported. Biases are 1D tensor with dimensions [OFM].

127

* Data type supported: Should match @p input data type, except for input of quantized type where biases should be of S32 type.

128

* @param[in, out] dst Output tensor info. Data types supported: same as @p input.

129

* @param[in] gemmlowp_output_stage GEMMLowp output stage info

130

* @param[in] gemm_3d_depth Depth of GEMM 3D

131

* @param[in] act_info Activation to apply after the matrix multiplication

132

*/

133

void configure_mm(const CLCompileContext &compile_context, const ITensorInfo *src, ITensorInfo *weights, ITensorInfo *biases, ITensorInfo *dst,

134

const GEMMLowpOutputStageInfo &gemmlowp_output_stage,

135

int gemm_3d_depth, const ActivationLayerInfo &act_info);

136

/** Static function to check if given info will lead to a valid configuration of @ref CLGEMMConvolutionLayer matrix multiply routines
 *
 * @param[in] src                   Input tensor info. Data types supported: QASYMM8/QASYMM8_SIGNED/F16/F32.
 * @param[in] weights               Weights tensor info. Data type supported: Same as @p src or QASYMM8/QSYMM8_PER_CHANNEL when @p src is QASYMM8 or
 *                                  QASYMM8_SIGNED/QSYMM8_PER_CHANNEL when @p src is QASYMM8_SIGNED.
 * @param[in] biases                Biases tensor info. Shared biases supported. Biases are 1D tensor with dimensions [OFM].
 *                                  Data type supported: Should match @p src data type, except for src of quantized type where biases should be of S32 type.
 * @param[in] dst                   Output tensor info. Data types supported: same as @p src.
 * @param[in] gemmlowp_output_stage GEMMLowp output stage info
 * @param[in] gemm_3d_depth         Depth of GEMM 3D
 * @param[in] skip_im2col           Flag which specifies if im2col has to be skipped. i.e. 1x1 convolution with NHWC data layout.
 * @param[in] act_info              Activation to apply after the matrix multiplication
 *
 * @return a status
 */
static Status validate_mm(const ITensorInfo *src, const ITensorInfo *weights, const ITensorInfo *biases, const ITensorInfo *dst, const GEMMLowpOutputStageInfo &gemmlowp_output_stage,
                          int gemm_3d_depth, bool skip_im2col, const ActivationLayerInfo &act_info);

enum AuxTensorIdx

{

// ClGemmLowpMatrixMultiplyCore has up to 7 internal tensors

157

Im2ColOutput = 8,

158