Blame - src/gpu/cl/operators/ClMatMul.cpp - ml/ComputeLibrary

2023-03-24 11:42:03 +0000

[diff] [blame]

/*

*

* SPDX-License-Identifier: MIT

5

*

6

* Permission is hereby granted, free of charge, to any person obtaining a copy

7

* of this software and associated documentation files (the "Software"), to

8

* deal in the Software without restriction, including without limitation the

9

* rights to use, copy, modify, merge, publish, distribute, sublicense, and/or

10

* sell copies of the Software, and to permit persons to whom the Software is

11

* furnished to do so, subject to the following conditions:

12

*

13

* The above copyright notice and this permission notice shall be included in all

14

* copies or substantial portions of the Software.

15

*

16

* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR

17

* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,

18

* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE

19

* AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER

20

* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,

21

* OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE

22

* SOFTWARE.

23

*/

24

#include "src/gpu/cl/operators/ClMatMul.h"

Jakub Sujak

2023-04-17 12:08:48 +0100

[diff] [blame]

25

Ramy Elgammal

2023-03-24 11:42:03 +0000

[diff] [blame]

26

#include "arm_compute/core/Error.h"

Jakub Sujak

2023-04-17 12:08:48 +0100

[diff] [blame]

27

#include "arm_compute/core/Utils.h"

Ramy Elgammal

2023-03-24 11:42:03 +0000

[diff] [blame]

28

#include "arm_compute/runtime/CL/CLScheduler.h"

Jakub Sujak

2023-04-17 12:08:48 +0100

[diff] [blame]

29

Ramy Elgammal

2023-03-24 11:42:03 +0000

[diff] [blame]

30

#include "src/common/utils/Log.h"

Gunes Bayir

2023-10-10 17:41:56 +0100

[diff] [blame]

31

#include "src/gpu/cl/kernels/ClMatMulLowpNativeKernel.h"

32

#include "src/gpu/cl/kernels/ClMatMulLowpNativeMMULKernel.h"

Jakub Sujak

1ed6a14

2023-04-13 21:14:42 +0100

[diff] [blame]

33

#include "src/gpu/cl/kernels/ClMatMulNativeKernel.h"

Gunes Bayir

2023-10-10 17:41:56 +0100

[diff] [blame]

34

#include "src/gpu/cl/kernels/ClMatMulNativeMMULKernel.h"

Gian Marco Iodice

352c07d

2023-05-03 12:21:38 +0100

[diff] [blame]

35

#include "src/runtime/heuristics/matmul_native/ClMatMulNativeDefaultConfigValhall.h"

36

#include "src/runtime/heuristics/matmul_native/ClMatMulNativeKernelConfig.h"

37

#include "src/runtime/heuristics/matmul_native/IClMatMulNativeKernelConfig.h"

38

39

using namespace arm_compute::cl_matmul;

Ramy Elgammal

2023-03-24 11:42:03 +0000

[diff] [blame]

40

41

namespace arm_compute

42

{

43

namespace opencl

44

{

Gunes Bayir

2023-10-10 17:41:56 +0100

[diff] [blame]

45

namespace

46

{

47

/** Kernel variants that the matmul operator in this file can dispatch to */
enum class MatMulKernelType
{
    /** FP data types, native kernel (no MMUL extension) */
    NATIVE_FP,

    /** Quantized data types, native kernel (no MMUL extension) */
    NATIVE_QUANTIZED,

    /** FP data types, native kernel built on the MMUL extension */
    NATIVE_MMUL_FP,

    /** Quantized data types, native kernel built on the MMUL extension */
    NATIVE_MMUL_QUANTIZED
};

61

62

/** Pick the matmul kernel variant to use for the given operands.
 *
 * The MMUL variants are chosen only when all of the following hold:
 *  - the device reports support for the matrix-multiply extension,
 *  - no activation is enabled in @p act_info,
 *  - K is a multiple of 16 (quantized) or of 4 (floating point).
 * Otherwise the corresponding non-MMUL native variant is returned.
 *
 * @param[in] lhs         Left-hand side tensor info. Must not be nullptr (it is dereferenced here).
 * @param[in] rhs         Right-hand side tensor info. Not consulted by the current selection logic.
 * @param[in] matmul_info Matmul attributes; only adj_lhs() is read, to locate the K dimension.
 * @param[in] act_info    Fused activation info; an enabled activation rules out the MMUL variants.
 *
 * @return The selected kernel type.
 */
MatMulKernelType get_matmul_kernel(const ITensorInfo         *lhs,
                                   const ITensorInfo         *rhs,
                                   const MatMulInfo          &matmul_info,
                                   const ActivationLayerInfo &act_info)
{
    // lhs, matmul_info and act_info are all read below; only rhs is unused.
    ARM_COMPUTE_UNUSED(rhs);

    const bool is_quantized      = is_data_type_quantized_asymmetric(lhs->data_type());
    const bool is_mmul_supported = arm_matrix_multiply_supported(CLKernelLibrary::get().get_device());

    // K is read from lhs: its y dimension when lhs is adjoint, its x dimension otherwise
    const int k = matmul_info.adj_lhs() ? lhs->tensor_shape().y() : lhs->tensor_shape().x();

    // Preconditions shared by both MMUL variants
    const bool mmul_candidate = is_mmul_supported && !act_info.enabled();

    if (is_quantized)
    {
        // MMUL kernel works only when K is a multiple of 16
        if (mmul_candidate && k % 16 == 0)
        {
            return MatMulKernelType::NATIVE_MMUL_QUANTIZED;
        }

        return MatMulKernelType::NATIVE_QUANTIZED;
    }

    // MMUL kernel works only when K is a multiple of 4
    if (mmul_candidate && k % 4 == 0)
    {
        return MatMulKernelType::NATIVE_MMUL_FP;
    }

    return MatMulKernelType::NATIVE_FP;
}

95

} // namespace

Ramy Elgammal

2023-03-24 11:42:03 +0000

[diff] [blame]

96

using namespace arm_compute::opencl::kernels;

Jakub Sujak

2023-04-17 12:08:48 +0100

[diff] [blame]

97

Ramy Elgammal

2023-03-24 11:42:03 +0000

[diff] [blame]

98

/** Default constructor: performs no work of its own; a kernel is only created by configure(). */
ClMatMul::ClMatMul() = default;

Jakub Sujak

2023-04-17 12:08:48 +0100

[diff] [blame]

101

Felix Thomasmathibalan

afd38f0

2023-09-27 17:46:17 +0100

[diff] [blame]

102

/** Check whether the operator can be configured with the given arguments.
 *
 * Rejects null tensor infos and lhs/rhs data types other than
 * QASYMM8, QASYMM8_SIGNED, F16 and F32, then forwards to the validate()
 * of whichever kernel get_matmul_kernel() selects.
 *
 * @param[in] lhs         Left-hand side tensor info.
 * @param[in] rhs         Right-hand side tensor info.
 * @param[in] dst         Destination tensor info.
 * @param[in] matmul_info Matmul attributes.
 * @param[in] act_info    Fused activation info.
 *
 * @return The status reported by the selected kernel's validate().
 */
Status ClMatMul::validate(const ITensorInfo         *lhs,
                          const ITensorInfo         *rhs,
                          const ITensorInfo         *dst,
                          const MatMulInfo          &matmul_info,
                          const ActivationLayerInfo &act_info)
{
    ARM_COMPUTE_RETURN_ERROR_ON_NULLPTR(lhs, rhs, dst);
    ARM_COMPUTE_RETURN_ERROR_ON_DATA_TYPE_CHANNEL_NOT_IN(lhs, 1, DataType::QASYMM8, DataType::QASYMM8_SIGNED,
                                                         DataType::F16, DataType::F32);
    ARM_COMPUTE_RETURN_ERROR_ON_DATA_TYPE_CHANNEL_NOT_IN(rhs, 1, DataType::QASYMM8, DataType::QASYMM8_SIGNED,
                                                         DataType::F16, DataType::F32);

    // Ask the heuristic registered for the current GPU target for the kernel parameters
    const auto kernel_config =
        ClMatMulNativeKernelConfigurationFactory::create(CLScheduler::get().target());
    const MatMulKernelInfo kernel_info = kernel_config->configure(lhs, rhs, matmul_info);

    // Delegate to the validate() of the kernel that would be picked for these arguments
    const MatMulKernelType selected = get_matmul_kernel(lhs, rhs, matmul_info, act_info);
    switch (selected)
    {
        case MatMulKernelType::NATIVE_FP:
        {
            return ClMatMulNativeKernel::validate(lhs, rhs, nullptr /* bias */, dst, kernel_info, act_info);
        }
        case MatMulKernelType::NATIVE_MMUL_FP:
        {
            // This overload takes no activation argument
            return ClMatMulNativeMMULKernel::validate(lhs, rhs, nullptr /* bias */, dst, kernel_info);
        }
        case MatMulKernelType::NATIVE_QUANTIZED:
        {
            return ClMatMulLowpNativeKernel::validate(lhs, rhs, nullptr /* bias */, dst, kernel_info, act_info);
        }
        case MatMulKernelType::NATIVE_MMUL_QUANTIZED:
        {
            return ClMatMulLowpNativeMMULKernel::validate(lhs, rhs, nullptr /* bias */, dst, kernel_info, act_info);
        }
        default:
            ARM_COMPUTE_ERROR("Unsupported MatMul Kernel!");
    }
}

Jakub Sujak

2023-04-17 12:08:48 +0100

[diff] [blame]

134

Felix Thomasmathibalan

afd38f0

2023-09-27 17:46:17 +0100

[diff] [blame]

135

void ClMatMul::configure(const CLCompileContext &compile_context,

ITensorInfo *lhs,

ITensorInfo *rhs,

ITensorInfo *dst,

const MatMulInfo &matmul_info,

140

const ActivationLayerInfo &act_info)

Ramy Elgammal

2023-03-24 11:42:03 +0000

[diff] [blame]

141

{

Jakub Sujak

2023-04-17 12:08:48 +0100

[diff] [blame]

142

ARM_COMPUTE_ERROR_ON_NULLPTR(lhs, rhs, dst);

143

ARM_COMPUTE_LOG_PARAMS(lhs, rhs, dst, matmul_info);

Ramy Elgammal

2023-03-24 11:42:03 +0000

[diff] [blame]

144

145

// Perform validation step

Jakub Sujak

2023-04-17 12:08:48 +0100

[diff] [blame]

146

ARM_COMPUTE_ERROR_THROW_ON(validate(lhs, rhs, dst, matmul_info));

147

Gunes Bayir

2023-10-10 17:41:56 +0100

[diff] [blame]

148

const GPUTarget gpu_target = CLScheduler::get().target();

149

const auto kernel_config = ClMatMulNativeKernelConfigurationFactory::create(gpu_target);

150

const MatMulKernelInfo kernel_info = kernel_config->configure(lhs, rhs, matmul_info);

Jakub Sujak

2023-04-17 12:08:48 +0100

[diff] [blame]

151

Gunes Bayir

2023-10-10 17:41:56 +0100

[diff] [blame]

152

switch (get_matmul_kernel(lhs, rhs, matmul_info, act_info))

Jakub Sujak

2023-04-17 12:08:48 +0100

[diff] [blame]

153

{

Gunes Bayir

2023-10-10 17:41:56 +0100

[diff] [blame]

154

case MatMulKernelType::NATIVE_FP:

155

{

156

auto kernel = std::make_unique<ClMatMulNativeKernel>();

157

kernel->set_target(gpu_target);

Ramy Elgammal

2023-03-24 11:42:03 +0000

[diff] [blame]

158

Gunes Bayir

2023-10-10 17:41:56 +0100

[diff] [blame]

159

kernel->configure(compile_context, lhs, rhs, nullptr /* bias */, dst, kernel_info, act_info);

160

_matmul_kernel = std::move(kernel);

161

}

162

break;

163

case MatMulKernelType::NATIVE_MMUL_FP:

164

{

165

auto kernel = std::make_unique<ClMatMulNativeMMULKernel>();

166

kernel->set_target(gpu_target);

Jakub Sujak

2023-04-17 12:08:48 +0100

[diff] [blame]

167

Gunes Bayir

2023-10-10 17:41:56 +0100

[diff] [blame]

168

kernel->configure(compile_context, lhs, rhs, nullptr /* bias */, dst, kernel_info);

169

_matmul_kernel = std::move(kernel);

170

}

171

break;

172

case MatMulKernelType::NATIVE_QUANTIZED:

173

{

174

auto kernel = std::make_unique<ClMatMulLowpNativeKernel>();

175

kernel->set_target(gpu_target);

176

177

kernel->configure(compile_context, lhs, rhs, nullptr /* bias */, dst, kernel_info, act_info);

178

_matmul_kernel = std::move(kernel);

179

}

180

break;

181

case MatMulKernelType::NATIVE_MMUL_QUANTIZED:

182

{

183

auto kernel = std::make_unique<ClMatMulLowpNativeMMULKernel>();

184

kernel->set_target(gpu_target);

185

186

kernel->configure(compile_context, lhs, rhs, nullptr /* bias */, dst, kernel_info, act_info);

187

_matmul_kernel = std::move(kernel);

}

break;

default:

ARM_COMPUTE_ERROR("Unsupported MatMul Kernel!");

Jakub Sujak

2023-04-17 12:08:48 +0100

[diff] [blame]

192

}

Ramy Elgammal

2023-03-24 11:42:03 +0000

[diff] [blame]

193

}

Jakub Sujak

2023-04-17 12:08:48 +0100

[diff] [blame]

194

Ramy Elgammal

2023-03-24 11:42:03 +0000

[diff] [blame]

195

/** Enqueue the configured matmul kernel on the CL scheduler.
 *
 * @param[in,out] tensors Tensor pack forwarded to the scheduler together with the kernel.
 */
void ClMatMul::run(ITensorPack &tensors)
{
    // Passed as the scheduler's flush argument
    constexpr bool flush = true;

    auto &scheduler = CLScheduler::get();
    scheduler.enqueue_op(*_matmul_kernel, tensors, flush);
}

Jakub Sujak

2023-04-17 12:08:48 +0100

[diff] [blame]

199

Ramy Elgammal