Blame - arm_compute/core/CL/kernels/CLGEMMLowpMatrixMultiplyReshapedOnlyRHSKernel.h - ml/ComputeLibrary

* @param[in] output_multipliers (Optional) Output multipliers tensor. In case of per-channel quantization, the number of multipliers must be equal to the number of filters (OFM).

72

* Supported data types: S32.

73

* @param[in] output_shifts (Optional) Output shifts tensor. In case of per-channel quantization, the number of shifts must be equal to the number of filters (OFM).

74

* Supported data types: S32.

Gian Marco Iodice

62251f7

2019-03-11 16:07:12 +0000

[diff] [blame]

75

*/

Michele Di Giorgio

b54ba28

2020-01-14 15:31:55 +0000

[diff] [blame]

76

void configure(const ICLTensor *input0, const ICLTensor *input1, ICLTensor *output, const GEMMKernelInfo &gemm_info, const ICLTensor *vector_sum_col = nullptr,

77

const ICLTensor *vector_sum_row = nullptr, const ICLTensor *bias = nullptr, const ICLTensor *output_multipliers = nullptr, const ICLTensor *output_shifts = nullptr);

Manuel Bottini

4c6bd51

2020-04-08 10:15:51 +0100

[diff] [blame]

78

/** Initialise the kernel's input and output.

79

*

80

* @param[in] compile_context The compile context to be used.

81

* @param[in] input0 Input tensor containing the LHS matrix. Data type supported: QASYMM8/QASYMM8_SIGNED

82

* @param[in] input1 Input tensor containing the RHS reshaped matrix. Data type supported: same as @p input0

83

* @param[out] output Output tensor. Data type supported: QASYMM8/QASYMM8_SIGNED/S32.

84

* @param[in] gemm_info GEMM information used to retrieve the original dimensions of the input matrices, output stage information and RHS/LHS info.

85

* Only the following values are supported for LHS info:

86

* lhs_info.m0: 2,3,4,5,6,7,8

87

* lhs_info.k0: 2,3,4,8,16

88

* Only the following values are supported for RHS info:

89

* rhs_info.n0: 2,3,4,8,16

90

* rhs_info.k0: same as lhs_info.k0

91

* rhs_info.transpose: true

92

* @param[in] vector_sum_col (Optional) Input row-vector of sums of all the entries in each column of matrix B.

93

* Note: vector_sum_col can be a nullptr in case a_offset = 0. Data type supported: S32

94

* @param[in] vector_sum_row (Optional) Input row-vector of sums of all the entries in each row of matrix A.

95

* Note: vector_sum_row can be a nullptr in case b_offset = 0. Data type supported: S32

96

* @param[in] bias (Optional) Biases tensor. Only shared biases are supported; it can be a nullptr if the addition of biases is not required.

97

* Biases are 1D tensor with dimensions [OFM]. Data type supported: S32.

98

* @param[in] output_multipliers (Optional) Output multipliers tensor. In case of per-channel quantization, the number of multipliers must be equal to the number of filters (OFM).

99

* Supported data types: S32.

100

* @param[in] output_shifts (Optional) Output shifts tensor. In case of per-channel quantization, the number of shifts must be equal to the number of filters (OFM).

101

* Supported data types: S32.

102

*/

Manuel Bottini

679fc96

2020-04-21 16:08:53 +0100

[diff] [blame]

103

void configure(const CLCompileContext &compile_context, const ICLTensor *input0, const ICLTensor *input1, ICLTensor *output, const GEMMKernelInfo &gemm_info, const ICLTensor *vector_sum_col = nullptr,

Manuel Bottini

4c6bd51

2020-04-08 10:15:51 +0100

[diff] [blame]

104

const ICLTensor *vector_sum_row = nullptr, const ICLTensor *bias = nullptr, const ICLTensor *output_multipliers = nullptr, const ICLTensor *output_shifts = nullptr);

Gian Marco Iodice

62251f7

2019-03-11 16:07:12 +0000

[diff] [blame]

105

/** Static function to check if given info will lead to a valid configuration of @ref CLGEMMLowpMatrixMultiplyReshapedOnlyRHSKernel

106

*

Michele Di Giorgio

b54ba28

2020-01-14 15:31:55 +0000

[diff] [blame]

107

* @param[in] input0 Input tensor info for the LHS matrix. Data type supported: QASYMM8/QASYMM8_SIGNED

Michele Di Giorgio

1c1b3aa

2020-04-02 17:35:42 +0100

[diff] [blame]

108

* @param[in] input1 Input tensor info for the RHS reshaped matrix. Data type supported: QASYMM8/QASYMM8_SIGNED/QSYMM8/QSYMM8_PER_CHANNEL

Michele Di Giorgio

b54ba28

2020-01-14 15:31:55 +0000

[diff] [blame]

109

* @param[in] output Output tensor info. Data type supported: QASYMM8/QASYMM8_SIGNED/S32.

110

* @param[in] gemm_info GEMM information used to retrieve the original dimensions of the input matrices, output stage information and RHS/LHS info.

111

* Only the following values are supported for LHS info:

112

* lhs_info.m0: 2,3,4,5,6,7,8

113

* lhs_info.k0: 2,3,4,8,16

114

* Only the following values are supported for RHS info:

115

* rhs_info.n0: 2,3,4,8,16

116

* rhs_info.k0: same as lhs_info.k0

117

* rhs_info.transpose: true

118

* @param[in] vector_sum_col (Optional) Input row-vector info of sums of all the entries in each column of matrix B.

119

* Note: vector_sum_col can be a nullptr in case a_offset = 0. Data type supported: S32

120

* @param[in] vector_sum_row (Optional) Input row-vector info of sums of all the entries in each row of matrix A.

121

* Note: vector_sum_row can be a nullptr in case b_offset = 0. Data type supported: S32

122

* @param[in] bias (Optional) Biases tensor info. Only shared biases are supported; it can be a nullptr if the addition of biases is not required.

123

* Biases are 1D tensor with dimensions [OFM]. Data type supported: S32.

124

* @param[in] output_multipliers (Optional) Output multipliers tensor info. In case of per-channel quantization, the number of multipliers must be equal to the number of filters (OFM).

125

* Supported data types: S32.

126

* @param[in] output_shifts (Optional) Output shifts tensor info. In case of per-channel quantization, the number of shifts must be equal to the number of filters (OFM).

127

* Supported data types: S32.

Gian Marco Iodice

62251f7

2019-03-11 16:07:12 +0000

[diff] [blame]

128

*

129

* @return a status

130

*/

Michele Di Giorgio

b54ba28

2020-01-14 15:31:55 +0000

[diff] [blame]

131

static Status validate(const ITensorInfo *input0, const ITensorInfo *input1, const ITensorInfo *output, const GEMMKernelInfo &gemm_info, const ITensorInfo *vector_sum_col = nullptr,

132