Blame - arm_compute/graph/backends/FusedConvolutionBatchNormalizationFunction.h - ml/ComputeLibrary

* @param[out] output Destination tensor. 3 lower dimensions represent a single output [width, height, OFM], while the rest represent batch of outputs.

59

* Data types supported: Same as @p input.

60

* @param[in] mean Mean values tensor. 1 dimension with size equal to the feature maps [FM]. Data types supported: Same as @p input

61

* @param[in] var Variance values tensor. 1 dimension with size equal to the feature maps [FM]. Data types supported: Same as @p input

62

* @param[in] beta Beta values tensor info. 1 dimension with size equal to the feature maps [FM]. If not provided, default value for beta is 0. Data types supported: Same as @p input

63

* @param[in] gamma Gamma values tensor info. 1 dimension with size equal to the feature maps [FM]. If not provided, default value for gamma is 1. Data types supported: Same as @p input

64

* @param[in] epsilon Small value to avoid division by zero. Default value is 0.001f.

65

* @param[in] conv_info Contains padding and stride information described in @ref PadStrideInfo.

66

* @param[in] num_groups Number of groups when performing a grouped convolution. num_groups != 1 is only supported for NCHW data layout

67

* @param[in] fast_math Enable fast math computation. If this flag is set, the function may dispatch the fastest implementation

68

* available which may introduce a drop of accuracy as well. Default is false

69

* @param[in] fused_act Activation layer information in case of a fused activation.

70

*

71

*/

72

void configure(TensorType *input,

TensorType *weights,

TensorType *bias,

TensorType *output,

const TensorType *mean,

77

const TensorType *var,

78

const TensorType *beta,

79

const TensorType *gamma,

80

float epsilon, const PadStrideInfo &conv_info, unsigned int num_groups, bool fast_math, ActivationLayerInfo const &fused_act)

81

{

82

// We don't run any validate, as we assume that the layers have been already validated

83

const bool has_bias = (bias != nullptr);

84

const TensorType *bias_to_use;

85

86

// We check if the layer has a bias. If yes, use it in-place. If not, we need to create one

87

// as batch normalization might end up with a bias != 0

88

if(has_bias)

89

{

90

_fused_batch_norm_layer.configure(weights, mean, var, nullptr, nullptr, bias, beta, gamma, epsilon);

bias_to_use = bias;

}

else

{

_fused_batch_norm_layer.configure(weights, mean, var, nullptr, &_fused_bias, nullptr, beta, gamma, epsilon);

96

bias_to_use = &_fused_bias;

97

}

98

99

_conv_layer.configure(input, weights, bias_to_use, output, conv_info, WeightsInfo(), Size2D(1U, 1U), fused_act, fast_math, num_groups);

if(!has_bias)

{

_fused_bias.allocator()->allocate();

}

}

// Inherited methods overridden:

void run()

{

prepare();

_conv_layer.run();

}

void prepare()
{
    // The fusion only has to run once; later calls are no-ops.
    if(_is_prepared)
    {
        return;
    }

    _fused_batch_norm_layer.run();
    _is_prepared = true;
}

private:

/** Convolution layer function; set up in configure() and executed on every run() */
typename FusedLayerTypes::ConvolutionLayer _conv_layer;

125

/** Batch normalization fusion function; set up in configure() and executed once from prepare() */
typename FusedLayerTypes::FuseBatchNormalization _fused_batch_norm_layer;

126

/** Internal bias tensor; used and allocated by configure() only when no bias is passed in */
TensorConcreteType _fused_bias;

127

/** Set to true once prepare() has run the fusion, so that it is not run again */
bool _is_prepared;

128

};

129

} // namespace backends

130

} // namespace graph

131

} // namespace arm_compute

132

133

#endif /* __ARM_COMPUTE_GRAPH_BACKENDS_FUSED_CONVOLUTION_BATCH_NORMAZLIZATION_FUNCTION_H__ */