Blame - src/cpu/operators/CpuGemm.h - ml/ComputeLibrary

2023-09-27 17:46:17 +0100

[diff] [blame]

97

void configure(const ITensorInfo *a,

98

const ITensorInfo *b,

99

const ITensorInfo *c,

ITensorInfo *d,

float alpha,

float beta,

const GEMMInfo &gemm_info = GEMMInfo());

Michele Di Giorgio

2021-06-30 12:05:34 +0100

[diff] [blame]

104

/** Static function to check if given info will lead to a valid configuration of @ref CpuGemm.

105

*

106

* Similar to @ref CpuGemm::configure()

107

*

108

* @return a status

109

*/

Felix Thomasmathibalan

2023-09-27 17:46:17 +0100

[diff] [blame]

110

static Status validate(const ITensorInfo *a,

111

const ITensorInfo *b,

112

const ITensorInfo *c,

113

const ITensorInfo *d,

114

float alpha,

115

float beta,

116

const GEMMInfo &gemm_info = GEMMInfo());

Michele Di Giorgio

2021-06-30 12:05:34 +0100

[diff] [blame]

117

Francesco Petrogalli

2022-06-30 10:22:01 +0000

[diff] [blame]

118

/** Indicates whether or not there is an optimal assembly implementation that can be used to process the given parameters.

119

*

120

* This method has the same use as @ref

121

* NEGEMMConvolutionLayer::has_opt_impl, with the only caveat that

Ramy Elgammal

9178002

2022-07-20 14:57:37 +0100

[diff] [blame]

122

* the value of arm_compute::WeightFormat needs to be passed via the

Francesco Petrogalli

2022-06-30 10:22:01 +0000

[diff] [blame]

123

* parameter gemm_info.

124

*/

Felix Thomasmathibalan

2023-09-27 17:46:17 +0100

[diff] [blame]

125

static Status has_opt_impl(arm_compute::WeightFormat &weight_format,

126

const ITensorInfo *a,

127

const ITensorInfo *b,

128

const ITensorInfo *c,

129

const ITensorInfo *d,

130

const GEMMInfo &gemm_info = GEMMInfo());

Francesco Petrogalli

2022-06-30 10:22:01 +0000

[diff] [blame]

131

Michele Di Giorgio

2021-06-30 12:05:34 +0100

[diff] [blame]

132

// Inherited methods overridden:

Felix Thomasmathibalan

2023-09-27 17:46:17 +0100

[diff] [blame]

133

void run(ITensorPack &tensors) override;

134

void prepare(ITensorPack &constants) override;

Michele Di Giorgio

2021-06-30 12:05:34 +0100

[diff] [blame]

135

experimental::MemoryRequirements workspace() const override;

136

Francesco Petrogalli

2022-06-30 10:22:01 +0000

[diff] [blame]

137

/** Indicates if the convolution executes in variable weights mode.

138

*

139

* When ACL executes convolution in variable weights mode, it does

140

* not perform any processing of the weights tensor. Instead, it

141

* utilizes the data as it is given by the user.

142

*/

143

bool isVarWeightsKernel() const;

144

Michele Di Giorgio

2021-06-30 12:05:34 +0100

[diff] [blame]

145

private:

146

enum AuxTensorIdx

147

{

SiCong Li

2023-10-17 17:38:57 +0100

[diff] [blame]

148

/* Slots 0 - 2 reserved for CpuGemmAssemblyDispatch */

149

InterleavedLHS = 3,

150

PreTransposedRHS,

151

Transposed1xWRHS,

Michele Di Giorgio

2021-06-30 12:05:34 +0100

[diff] [blame]

TempResult,

Count

};

Felix Thomasmathibalan

2023-09-27 17:46:17 +0100

[diff] [blame]

156

std::unique_ptr<kernels::CpuGemmInterleave4x4Kernel> _interleave_kernel{nullptr};

SiCong Li

2023-10-17 17:38:57 +0100

[diff] [blame]

157

std::unique_ptr<CpuTranspose> _pretranspose_b_func{nullptr};

158

std::unique_ptr<kernels::CpuGemmTranspose1xWKernel> _transpose1xW_b_kernel{nullptr};

Felix Thomasmathibalan

2023-09-27 17:46:17 +0100

[diff] [blame]

159

std::unique_ptr<kernels::CpuGemmMatrixMultiplyKernel> _mm_kernel{nullptr};

160

std::unique_ptr<CpuGemmAssemblyDispatch> _asm_glue{nullptr};

161

std::unique_ptr<kernels::CpuGemmMatrixAdditionKernel> _ma_kernel{nullptr};

162

std::unique_ptr<CpuActivation> _alpha_scale_func{nullptr};

163

std::unique_ptr<CpuAdd> _add_bias{nullptr};

164

std::unique_ptr<CpuActivation> _activation_func{nullptr};

Michele Di Giorgio

2021-06-30 12:05:34 +0100

[diff] [blame]

165

166

TensorInfo _tmp_a{};

SiCong Li

2023-10-17 17:38:57 +0100

[diff] [blame]

167

TensorInfo _pretransposed_b{};

Michele Di Giorgio

2021-06-30 12:05:34 +0100

[diff] [blame]

168

TensorInfo _tmp_b{};

169

TensorInfo _tmp_d{};

170

Felix Thomasmathibalan

2023-09-27 17:46:17 +0100

[diff] [blame]

171

bool _run_vector_matrix_multiplication{false};

SiCong Li

2023-10-17 17:38:57 +0100

[diff] [blame]

172

bool _run_interleave_transpose{

173

true}; /**< If we run CpuGemmInterleave4x4Kernel on lhs and CpuGemmTranspose1xWKernel on rhs */

Felix Thomasmathibalan

2023-09-27 17:46:17 +0100

[diff] [blame]

174

bool _run_alpha_scale{false};

175

bool _run_addition{false};

176

bool _run_bias_addition{false};

177

bool _run_activation{false};

178

bool _reshape_b_only_on_first_run{false};

179

bool _is_prepared{false};

Michele Di Giorgio

2021-06-30 12:05:34 +0100

[diff] [blame]

180

Felix Thomasmathibalan

2023-09-27 17:46:17 +0100

[diff] [blame]

181

experimental::MemoryRequirements _aux_mem{Count};

Michele Di Giorgio

2021-06-30 12:05:34 +0100

[diff] [blame]

182

};

183

} // namespace cpu

184

} // namespace arm_compute

SiCong Li