Blame - tests/validation/CL/GEMMMatrixMultiplyInterleavedTransposed.cpp - ml/ComputeLibrary

GEMMMatrixMultiplyInterleavedTransposedValidationFixture<CLTensor, CLAccessor, T, CLGEMMReshapeLHSMatrix, CLGEMMReshapeRHSMatrix, CLGEMMMatrixMultiplyReshaped>;

63

64

// Fixture for GEMMMatrixMultiplyInterleavedTransposed3DValidationFixture

65

template <typename T>

66

using CLGEMMMatrixMultiplyReshaped3DFixture =

67

GEMMMatrixMultiplyInterleavedTransposed3DValidationFixture<CLTensor, CLAccessor, T, CLGEMMReshapeLHSMatrix, CLGEMMReshapeRHSMatrix, CLGEMMMatrixMultiplyReshaped>;

namespace

{

// *INDENT-OFF*

// clang-format off

/** Relative tolerance passed to validate() by the FP32 test cases */
RelativeTolerance<float> rel_tolerance_f32(0.001f);

74

/** Absolute tolerance passed to validate() by the FP32 test cases */
constexpr float abs_tolerance_f32(0.0001f);

75

76

/** Relative tolerance passed to validate() by the FP16 test cases */
RelativeTolerance<half> rel_tolerance_f16(half(0.2));

77

/** Passed to validate() right after rel_tolerance_f16 by the FP16 test cases.
 *  NOTE(review): presumably the tolerated fraction of mismatching elements - confirm against validate().
 */
constexpr float tolerance_num_f16 = 0.02f;

78

Gian Marco Iodice

c630e94

2020-05-11 12:15:54 +0100

[diff] [blame]

79

/** Alpha values to test */

Gian Marco Iodice

f3622be

2019-07-29 14:27:16 +0100

[diff] [blame]

80

const auto alpha_values = framework::dataset::make("alpha", {1.0f, -0.75f} ); // one positive unit value and one negative fractional value

Gian Marco Iodice

d1f5476

2019-07-19 09:54:47 +0100

[diff] [blame]

81

Gian Marco Iodice

c630e94

2020-05-11 12:15:54 +0100

[diff] [blame]

82

/** Beta values to test */

Gian Marco Iodice

d820db6

2019-08-05 14:23:23 +0100

[diff] [blame]

83

const auto beta_values = framework::dataset::make("beta", {-0.35f, 0.0f} ); // one negative value and zero

Gian Marco Iodice

d1f5476

2019-07-19 09:54:47 +0100

[diff] [blame]

84

SiCong Li

7e5b7bf

2020-11-17 09:41:13 +0000

[diff] [blame]

85

/** M, N combinations to test

86

* 1: Special 1x1 case

87

* 2: Special multples of processor size in both dimensions

88

* 3: Non multiples of processor size in both dimensions

89

*/

90

const auto m_n_values = zip(

91

framework::dataset::make("M", {1, 16, 37}),

92

framework::dataset::make("N", {1, 16, 51})

93

);

Gian Marco Iodice

d1f5476

2019-07-19 09:54:47 +0100

[diff] [blame]

94

Gian Marco Iodice

c630e94

2020-05-11 12:15:54 +0100

[diff] [blame]

95

/** N values to test */

96

const auto n_values = framework::dataset::make("N", 51); // used by the RunSmall3D cases only; RunSmall takes N from m_n_values

Gian Marco Iodice

d1f5476

2019-07-19 09:54:47 +0100

[diff] [blame]

97

Gian Marco Iodice

c630e94

2020-05-11 12:15:54 +0100

[diff] [blame]

98

/** K values to test */

99

const auto k_values = framework::dataset::make("K", 23); // single K shared by the RunSmall and RunSmall3D cases

Gian Marco Iodice

d1f5476

2019-07-19 09:54:47 +0100

[diff] [blame]

100

Gian Marco Iodice

c630e94

2020-05-11 12:15:54 +0100

[diff] [blame]

101

/** M_W values to test */

102

const auto m_w_values = framework::dataset::make("M_W", 5); // used by the RunSmall3D cases only

Gian Marco Iodice

d1f5476

2019-07-19 09:54:47 +0100

[diff] [blame]

103

Gian Marco Iodice

c630e94

2020-05-11 12:15:54 +0100

[diff] [blame]

104

/** M_H values to test */

105

const auto m_h_values = framework::dataset::make("M_H", 7); // used by the RunSmall3D cases only

Gian Marco Iodice

d1f5476

2019-07-19 09:54:47 +0100

[diff] [blame]

106

107

/** Batch size values to test */

108

const auto b_values = framework::dataset::make("batch_size", 1, 3); // NOTE(review): two-number form, presumably a range starting at 1 and stopping before 3 - confirm

109

110

/** Activation values to test */

111

const auto act_values = framework::dataset::make("Activation",

112

{

113

ActivationLayerInfo(),

114

ActivationLayerInfo(ActivationLayerInfo::ActivationFunction::LU_BOUNDED_RELU, 8.f, 2.f),

115

});

116

Gian Marco Iodice

c630e94

2020-05-11 12:15:54 +0100

[diff] [blame]

117

/** V0 values to test */

118

const auto v0_values = framework::dataset::make("V0", 2); // single value shared by all FP32 and FP16 cases

Gian Marco Iodice

d1f5476

2019-07-19 09:54:47 +0100

[diff] [blame]

119

Gian Marco Iodice

c630e94

2020-05-11 12:15:54 +0100

[diff] [blame]

120

/** H0 values to test */

121

const auto h0_values = framework::dataset::make("H0", 4); // single value shared by all FP32 and FP16 cases

Gian Marco Iodice

d1f5476

2019-07-19 09:54:47 +0100

[diff] [blame]

122

123

/** Broadcast bias from vector to matrix */

124

const auto broadcast_bias_values = framework::dataset::make("broadcast_bias", {false, true} ); // both settings are run by every FP32 and FP16 case

125

126

/** GPU architectures values to test */

127

const auto gpu_arch_values = framework::dataset::make("GPUArch",

{

GPUTarget::MIDGARD,

GPUTarget::BIFROST

});

/** Data types values to test in the configuration */

134

const auto data_type_values = framework::dataset::make("DataType",

{

DataType::F32,

DataType::F16

});

/** Mixed-precision flag values to test */

141

const auto fp16_mixed_precision_values = framework::dataset::make("fp16_mixed_precision", {true, false}); // used by the FP16 cases only; the FP32 cases pin this flag to false

Gian Marco Iodice

d1f5476

2019-07-19 09:54:47 +0100

[diff] [blame]

} // namespace

TEST_SUITE(CL)

TEST_SUITE(GEMMMatrixMultiplyInterleavedTransposed)

Gian Marco Iodice

c630e94

2020-05-11 12:15:54 +0100

[diff] [blame]

146

/** Checks that CLGEMMMatrixMultiplyKernel::validate() reports a failing status
 *  for five tensor-shape combinations that each break exactly one shape.
 */
TEST_CASE(Negative, framework::DatasetMode::ALL)
{
    // The following checks are not repeated here because the GEMMMatrixMultiply
    // validation already covers them and they are common to both validations:
    // - Unsupported QASYMM8 data type
    // - Unsupported SIZE_T data type
    // - Mixed precision with F32
    // - Max number of dimensions LHS matrix
    // - Max number of dimensions RHS matrix

    // Arguments that are identical for every validate() call below
    constexpr float alpha                     = 1.3f;
    constexpr float beta                      = 0.7f;
    const bool      is_interleaved_transposed = true;
    const GPUTarget gpu_target                = GPUTarget::MIDGARD;
    const bool      fp_mixed_precision        = false;

    // Invalid LHS dimensions
    {
        // The correct shape should be: lhs = TensorInfo(TensorShape(256U, 1U, 1U, 1U), 1, DataType::F32);
        const TensorInfo      lhs(TensorShape(256U, 2U, 1U, 1U), 1, DataType::F32);
        const TensorInfo      rhs(TensorShape(104U, 3U, 1U, 1U), 1, DataType::F32);
        const TensorInfo      bias(TensorShape(24U, 16U, 1U, 1U), 1, DataType::F32);
        const TensorInfo      out(TensorShape(24U, 16U, 1U, 1U), 1, DataType::F32);
        const GEMMReshapeInfo reshape_info(16, 24, 13, 2, 4, 0, false, false);
        const auto status = CLGEMMMatrixMultiplyKernel::validate(&lhs, &rhs, &bias, &out, alpha, beta, is_interleaved_transposed, reshape_info, gpu_target, fp_mixed_precision);
        ARM_COMPUTE_EXPECT(bool(status) == false, framework::LogLevel::ERRORS);
    }

    // Invalid RHS dimensions
    {
        const TensorInfo      lhs(TensorShape(256U, 1U, 1U, 1U), 1, DataType::F32);
        // The correct shape should be rhs = TensorInfo(TensorShape(104U, 3U, 1U, 1U), 1, DataType::F32);
        const TensorInfo      rhs(TensorShape(104U, 4U, 1U, 1U), 1, DataType::F32);
        const TensorInfo      bias(TensorShape(24U, 16U, 1U, 1U), 1, DataType::F32);
        const TensorInfo      out(TensorShape(24U, 16U, 1U, 1U), 1, DataType::F32);
        const GEMMReshapeInfo reshape_info(16, 24, 13, 2, 4, 0, false, false);
        const auto status = CLGEMMMatrixMultiplyKernel::validate(&lhs, &rhs, &bias, &out, alpha, beta, is_interleaved_transposed, reshape_info, gpu_target, fp_mixed_precision);
        ARM_COMPUTE_EXPECT(bool(status) == false, framework::LogLevel::ERRORS);
    }

    // Invalid bias dimensions when the last GEMMReshapeInfo argument (true here, false elsewhere) is set
    {
        const TensorInfo      lhs(TensorShape(256U, 1U, 1U, 1U), 1, DataType::F32);
        const TensorInfo      rhs(TensorShape(104U, 3U, 1U, 1U), 1, DataType::F32);
        // The correct shape should be bias = TensorInfo(TensorShape(24U, 1U, 1U, 1U), 1, DataType::F32);
        const TensorInfo      bias(TensorShape(24U, 16U, 1U, 1U), 1, DataType::F32);
        const TensorInfo      out(TensorShape(24U, 16U, 1U, 1U), 1, DataType::F32);
        const GEMMReshapeInfo reshape_info(16, 24, 13, 2, 4, 0, false, true);
        const auto status = CLGEMMMatrixMultiplyKernel::validate(&lhs, &rhs, &bias, &out, alpha, beta, is_interleaved_transposed, reshape_info, gpu_target, fp_mixed_precision);
        ARM_COMPUTE_EXPECT(bool(status) == false, framework::LogLevel::ERRORS);
    }

    // Invalid dimensions for the bias
    {
        const TensorInfo      lhs(TensorShape(256U, 1U, 1U, 1U), 1, DataType::F32);
        const TensorInfo      rhs(TensorShape(104U, 3U, 1U, 1U), 1, DataType::F32);
        // The correct shape should be bias = TensorInfo(TensorShape(24U, 16U, 1U, 1U), 1, DataType::F32);
        const TensorInfo      bias(TensorShape(25U, 16U, 1U, 1U), 1, DataType::F32);
        const TensorInfo      out(TensorShape(24U, 16U, 1U, 1U), 1, DataType::F32);
        const GEMMReshapeInfo reshape_info(16, 24, 13, 2, 4, 0, false, false);
        const auto status = CLGEMMMatrixMultiplyKernel::validate(&lhs, &rhs, &bias, &out, alpha, beta, is_interleaved_transposed, reshape_info, gpu_target, fp_mixed_precision);
        ARM_COMPUTE_EXPECT(bool(status) == false, framework::LogLevel::ERRORS);
    }

    // Invalid dimensions for the output
    {
        const TensorInfo      lhs(TensorShape(256U, 1U, 1U, 1U), 1, DataType::F32);
        const TensorInfo      rhs(TensorShape(104U, 3U, 1U, 1U), 1, DataType::F32);
        const TensorInfo      bias(TensorShape(24U, 16U, 1U, 1U), 1, DataType::F32);
        // The correct shape should be out = TensorInfo(TensorShape(24U, 16U, 1U, 1U), 1, DataType::F32);
        const TensorInfo      out(TensorShape(24U, 13U, 1U, 1U), 1, DataType::F32);
        const GEMMReshapeInfo reshape_info(16, 24, 13, 2, 4, 0, false, false);
        const auto status = CLGEMMMatrixMultiplyKernel::validate(&lhs, &rhs, &bias, &out, alpha, beta, is_interleaved_transposed, reshape_info, gpu_target, fp_mixed_precision);
        ARM_COMPUTE_EXPECT(bool(status) == false, framework::LogLevel::ERRORS);
    }
}

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

242

TEST_SUITE(Float)

243

TEST_SUITE(FP32)

Gian Marco Iodice

d1f5476

2019-07-19 09:54:47 +0100

[diff] [blame]

244

// FP32 run over the (M, N) pairs combined with the shared datasets; mixed precision is pinned to false
FIXTURE_DATA_TEST_CASE(RunSmall, CLGEMMMatrixMultiplyReshapedFixture<float>, framework::DatasetMode::ALL,
    combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(
        m_n_values,
        k_values),
        b_values),
        alpha_values),
        beta_values),
        v0_values),
        h0_values),
        broadcast_bias_values),
        framework::dataset::make("fp16_mixed_precision", false)),
        act_values),
        framework::dataset::make("DataType", DataType::F32)),
        gpu_arch_values))
{
    // Check the CL output against the reference using the FP32 tolerances
    validate(CLAccessor(_target), _reference, rel_tolerance_f32, 0.f, abs_tolerance_f32);
}

262

263

// FP32 run of the 3D fixture: M is given as M_W and M_H, N comes from n_values; mixed precision is pinned to false
FIXTURE_DATA_TEST_CASE(RunSmall3D, CLGEMMMatrixMultiplyReshaped3DFixture<float>, framework::DatasetMode::ALL,
    combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(
        m_w_values,
        m_h_values),
        n_values),
        k_values),
        b_values),
        alpha_values),
        beta_values),
        v0_values),
        h0_values),
        broadcast_bias_values),
        framework::dataset::make("fp16_mixed_precision", false)),
        act_values),
        framework::dataset::make("DataType", DataType::F32)),
        gpu_arch_values))
{
    // Check the CL output against the reference using the FP32 tolerances
    validate(CLAccessor(_target), _reference, rel_tolerance_f32, 0.f, abs_tolerance_f32);
}

283

284

TEST_SUITE_END() // FP32

285

286

TEST_SUITE(FP16)

287

// FP16 run over the (M, N) pairs combined with the shared datasets; both mixed-precision settings are exercised
FIXTURE_DATA_TEST_CASE(RunSmall, CLGEMMMatrixMultiplyReshapedFixture<half>, framework::DatasetMode::ALL,
    combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(
        m_n_values,
        k_values),
        b_values),
        alpha_values),
        beta_values),
        v0_values),
        h0_values),
        broadcast_bias_values),
        fp16_mixed_precision_values),
        act_values),
        framework::dataset::make("DataType", DataType::F16)),
        gpu_arch_values))
{
    // Check the CL output against the reference using the FP16 tolerances
    validate(CLAccessor(_target), _reference, rel_tolerance_f16, tolerance_num_f16);
}

305

306

// FP16 run of the 3D fixture: M is given as M_W and M_H, N comes from n_values; both mixed-precision settings are exercised
FIXTURE_DATA_TEST_CASE(RunSmall3D, CLGEMMMatrixMultiplyReshaped3DFixture<half>, framework::DatasetMode::ALL,
    combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(
        m_w_values,
        m_h_values),
        n_values),
        k_values),
        b_values),
        alpha_values),
        beta_values),
        v0_values),
        h0_values),
        broadcast_bias_values),
        fp16_mixed_precision_values),
        act_values),
        framework::dataset::make("DataType", DataType::F16)),
        gpu_arch_values))
{
    // Check the CL output against the reference using the FP16 tolerances
    validate(CLAccessor(_target), _reference, rel_tolerance_f16, tolerance_num_f16);
}

326

327

TEST_SUITE_END() // FP16

328

TEST_SUITE_END() // Float

329

TEST_SUITE_END() // GEMMMatrixMultiplyInterleavedTransposed

330

TEST_SUITE_END() // CL

331

} // namespace validation

332

} // namespace test

333

} // namespace arm_compute