Blame - tests/validation/CL/GEMMMatrixMultiplyInterleavedTransposed.cpp - ml/ComputeLibrary

GEMMMatrixMultiplyInterleavedTransposedValidationFixture<CLTensor, CLAccessor, T, CLGEMMReshapeLHSMatrix, CLGEMMReshapeRHSMatrix, CLGEMMMatrixMultiplyReshaped>;

63

64

// OpenCL instantiation of GEMMMatrixMultiplyInterleavedTransposed3DValidationFixture.
// The template is bound to CLTensor, CLAccessor, the element type T, and the three CL
// functions CLGEMMReshapeLHSMatrix, CLGEMMReshapeRHSMatrix and CLGEMMMatrixMultiplyReshaped.
// It is the fixture type of the RunSmall3D / RunLarge3D test cases in this file.

65

template <typename T>

66

using CLGEMMMatrixMultiplyReshaped3DFixture =

67

GEMMMatrixMultiplyInterleavedTransposed3DValidationFixture<CLTensor, CLAccessor, T, CLGEMMReshapeLHSMatrix, CLGEMMReshapeRHSMatrix, CLGEMMMatrixMultiplyReshaped>;

namespace

{

// *INDENT-OFF*

// clang-format off

// Relative tolerance passed to validate() by the FP32 test cases.
RelativeTolerance<float> rel_tolerance_f32(0.001f);

74

// Last argument of the FP32 validate() calls (after a literal 0.f).
// NOTE(review): presumably the absolute tolerance used for values where the relative check is too strict - confirm against validate().
constexpr float abs_tolerance_f32(0.0001f);

75

76

// Relative tolerance passed to validate() by the FP16 test cases.
RelativeTolerance<half> rel_tolerance_f16(half(0.2));

77

// Second tolerance argument of the FP16 validate() calls.
// NOTE(review): presumably the tolerated fraction of mismatching elements - confirm against validate().
constexpr float tolerance_num_f16 = 0.02f;

78

79

/** Alpha values to test - shared by the precommit (DatasetMode::ALL) and nightly test cases */

Gian Marco Iodice

f3622be

2019-07-29 14:27:16 +0100

[diff] [blame]

80

const auto alpha_values = framework::dataset::make("alpha", {1.0f, -0.75f} );

Gian Marco Iodice

d1f5476

2019-07-19 09:54:47 +0100

[diff] [blame]

81

82

/** Beta values to test - shared by the precommit (DatasetMode::ALL) and nightly test cases */

Gian Marco Iodice

d820db6

2019-08-05 14:23:23 +0100

[diff] [blame]

83

const auto beta_values = framework::dataset::make("beta", {-0.35f, 0.0f} );

Gian Marco Iodice

d1f5476

2019-07-19 09:54:47 +0100

[diff] [blame]

84

85

// GEMM problem sizes. validate_configuration() builds the LHS shape as (K, M, batch) and
// the RHS shape as (N, K, batch). The *_precommit datasets feed the DatasetMode::ALL
// cases; the *_nightly datasets feed the DatasetMode::NIGHTLY cases.

/** M values to test - Precommit */

86

const auto m_values_precommit = framework::dataset::make("M", 37);

87

88

/** N values to test - Precommit */

89

const auto n_values_precommit = framework::dataset::make("N", 51);

90

91

/** K values to test - Precommit */

92

const auto k_values_precommit = framework::dataset::make("K", 23);

93

94

/** M values to test - Nightly (two values, including M = 1) */

95

const auto m_values_nightly = framework::dataset::make("M", {421, 1});

96

97

/** N values to test - Nightly */

98

const auto n_values_nightly = framework::dataset::make("N", 323);

99

100

/** K values to test - Nightly */

101

const auto k_values_nightly = framework::dataset::make("K", 207);

102

103

// M_W / M_H are used only by the RunSmall3D / RunLarge3D cases, where they take the place
// of the single M dataset.
// NOTE(review): presumably the 3D fixture uses M = M_W * M_H - confirm against the fixture.

/** M_W values to test - Precommit */

104

const auto m_w_values_precommit = framework::dataset::make("M_W", 5);

105

106

/** M_H values to test - Precommit */

107

const auto m_h_values_precommit = framework::dataset::make("M_H", 7);

108

109

/** M_W values to test - Nightly */

110

const auto m_w_values_nightly = framework::dataset::make("M_W", 13);

111

112

/** M_H values to test - Nightly */

113

const auto m_h_values_nightly = framework::dataset::make("M_H", 27);

114

115

/** Batch size values to test
 *
 * NOTE(review): make(name, 1, 3) looks like a range dataset; whether the end value 3 is
 * included is not visible in this file - confirm against framework::dataset::make.
 */

116

const auto b_values = framework::dataset::make("batch_size", 1, 3);

117

118

/** Activation values to test
 *
 * Two entries: a default-constructed ActivationLayerInfo and LU_BOUNDED_RELU constructed
 * with the arguments 8.f and 2.f.
 */

119

const auto act_values = framework::dataset::make("Activation",

120

{

121

ActivationLayerInfo(),

122

ActivationLayerInfo(ActivationLayerInfo::ActivationFunction::LU_BOUNDED_RELU, 8.f, 2.f),

123

});

124

125

// V0 and H0 are reshape parameters: validate_configuration() stores V0 in
// GEMMLHSMatrixInfo::v0 and H0 in GEMMRHSMatrixInfo::h0.

/** V0 values to test - Precommit */

126

const auto v0_values_precommit = framework::dataset::make("V0", 2);

127

128

/** H0 values to test - Precommit */

129

const auto h0_values_precommit = framework::dataset::make("H0", 4);

130

131

/** V0 values to test - Nightly */

132

const auto v0_values_nightly = framework::dataset::make("V0", {2, 4});

133

134

/** H0 values to test - Nightly */

135

const auto h0_values_nightly = framework::dataset::make("H0", { 2, 4 });

136

137

/** Broadcast bias from vector to matrix
 *
 * In validate_configuration() a true value gives the bias the shape (N, 1, 1); false gives
 * it the shape (N, M, batch).
 */

138

const auto broadcast_bias_values = framework::dataset::make("broadcast_bias", {false, true} );

139

140

/** GPU architectures values to test
 *
 * The selected target is forwarded as the first argument of
 * CLGEMMMatrixMultiplyReshaped::configure() in validate_configuration().
 */

141

const auto gpu_arch_values = framework::dataset::make("GPUArch",

{

GPUTarget::MIDGARD,

GPUTarget::BIFROST

});

/** Data types values to test in the configuration
 *
 * Used only by the Configuration test case; the fixture cases each pin a single data type.
 */

148

const auto data_type_values = framework::dataset::make("DataType",

{

DataType::F32,

DataType::F16

});

/** FP16 mixed precision flag values to test (swept by the FP16 cases only; the FP32 cases pass false) */

155

const auto fp16_mixed_precision_values = framework::dataset::make("fp16_mixed_precision", {true, false});

156

157

/** Configuration test */

158

void validate_configuration(unsigned int m_value, unsigned int n_value, unsigned int k_value, unsigned int b_value, unsigned int v0_value, unsigned int h0_value, bool broadcast_bias, bool fp16_mixed_precision, const ActivationLayerInfo &act_info, DataType data_type, GPUTarget gpu_arch_value)

159

{

160

GEMMLHSMatrixInfo lhs_info;

161

lhs_info.m0 = 4;

162

lhs_info.k0 = 4;

163

lhs_info.v0 = v0_value;

164

lhs_info.interleave = true;

165

lhs_info.transpose = true;

166

167

GEMMRHSMatrixInfo rhs_info;

168

rhs_info.n0 = data_type == DataType::F32? 4 : 8;

169

rhs_info.k0 = 1;

170

rhs_info.h0 = h0_value;

171

rhs_info.interleave = false;

172

rhs_info.transpose = false;

173

174

GEMMReshapeInfo reshape_info(m_value, n_value, k_value, rhs_info.h0, lhs_info.v0, 0, false, broadcast_bias);

175

176

const TensorShape lhs_shape(k_value, m_value, b_value);

177

const TensorShape lhs_shape_reshaped = compute_lhs_reshaped_shape(TensorInfo(lhs_shape, 1, data_type),

lhs_info,

false);

const TensorShape rhs_shape(n_value, k_value, b_value);

182

const TensorShape rhs_shape_reshaped = compute_rhs_reshaped_shape(TensorInfo(rhs_shape, 1, data_type),

183

rhs_info);

184

185

const TensorShape dst_shape = compute_mm_shape(TensorInfo(lhs_shape_reshaped, 1, data_type),

186

TensorInfo(rhs_shape_reshaped, 1, data_type),

187

reshape_info);

188

189

const TensorShape bias_shape(n_value,

190

broadcast_bias? 1 : m_value,

191

broadcast_bias? 1 : b_value);

192

193

// Create tensors

194

CLTensor lhs_reshaped = create_tensor<CLTensor>(lhs_shape_reshaped, data_type);

195

CLTensor rhs_reshaped = create_tensor<CLTensor>(rhs_shape_reshaped, data_type);

196

CLTensor bias = create_tensor<CLTensor>(bias_shape, data_type);

197

CLTensor dst = create_tensor<CLTensor>(dst_shape, data_type);

198

199

ARM_COMPUTE_EXPECT(lhs_reshaped.info()->is_resizable(), framework::LogLevel::ERRORS);

200

ARM_COMPUTE_EXPECT(rhs_reshaped.info()->is_resizable(), framework::LogLevel::ERRORS);

201

ARM_COMPUTE_EXPECT(bias.info()->is_resizable(), framework::LogLevel::ERRORS);

202

ARM_COMPUTE_EXPECT(dst.info()->is_resizable(), framework::LogLevel::ERRORS);

203

204

// Create and configure function

205

CLGEMMMatrixMultiplyReshaped gemm;

206

gemm.configure(gpu_arch_value, &lhs_reshaped, &rhs_reshaped, &bias, &dst, 1.0f, 2.0f, true, reshape_info, fp16_mixed_precision, act_info);

}

} // namespace

TEST_SUITE(CL)

TEST_SUITE(GEMMMatrixMultiplyInterleavedTransposed)

212

TEST_SUITE(Float)

213

TEST_SUITE(FP32)

214

// Configuration-only test. For every combination of the precommit M/N/K/V0/H0 values,
// bias broadcast flag, activation, data type and GPU target (batch size fixed to 1 and
// fp16_mixed_precision fixed to false) it calls validate_configuration(). Nothing is run
// or compared against a reference.
DATA_TEST_CASE(Configuration, framework::DatasetMode::ALL, combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(

m_values_precommit,

n_values_precommit),

k_values_precommit),

framework::dataset::make("batch_size", 1)),

219

v0_values_precommit),

220

h0_values_precommit),

221

broadcast_bias_values),

222

framework::dataset::make("fp16_mixed_precision", false)),

act_values),

data_type_values),

gpu_arch_values),

m_value, n_value, k_value, b_value, v0_value, h0_value, broadcast_bias, fp16_mixed_precision_value, act_value, data_type_value, gpu_arch_value)

227

{

228

validate_configuration(m_value, n_value, k_value, b_value, v0_value, h0_value, broadcast_bias, fp16_mixed_precision_value, act_value, data_type_value, gpu_arch_value);

229

}

230

231

// FP32, DatasetMode::ALL. Sweeps the precommit M/N/K/V0/H0 values against every batch
// size, alpha, beta, bias broadcast flag, activation and GPU target, with
// fp16_mixed_precision fixed to false and the data type fixed to F32.
FIXTURE_DATA_TEST_CASE(RunSmall, CLGEMMMatrixMultiplyReshapedFixture<float>, framework::DatasetMode::ALL,

232

combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(

m_values_precommit,

n_values_precommit),

k_values_precommit),

b_values),

alpha_values),

beta_values),

v0_values_precommit),

240

h0_values_precommit),

241

broadcast_bias_values),

242

framework::dataset::make("fp16_mixed_precision", false)),

243

act_values),

244

framework::dataset::make("DataType", DataType::F32)),

gpu_arch_values))

{

// Validate output: fixture target against fixture reference, using the FP32 tolerances

validate(CLAccessor(_target), _reference, rel_tolerance_f32, 0.f, abs_tolerance_f32);

249

}

250

251

// FP32, DatasetMode::NIGHTLY. Same sweep as RunSmall but with the nightly M/N/K/V0/H0
// datasets; fp16_mixed_precision is fixed to false and the data type to F32.
FIXTURE_DATA_TEST_CASE(RunLarge, CLGEMMMatrixMultiplyReshapedFixture<float>, framework::DatasetMode::NIGHTLY,

252

combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(

m_values_nightly,

n_values_nightly),

k_values_nightly),

b_values),

alpha_values),

beta_values),

v0_values_nightly),

h0_values_nightly),

broadcast_bias_values),

262

framework::dataset::make("fp16_mixed_precision", false)),

263

act_values),

264

framework::dataset::make("DataType", DataType::F32)),

gpu_arch_values))

{

// Validate output: fixture target against fixture reference, using the FP32 tolerances

validate(CLAccessor(_target), _reference, rel_tolerance_f32, 0.f, abs_tolerance_f32);

269

}

270

271

// FP32, DatasetMode::ALL, 3D fixture. Like RunSmall, but the single M dataset is replaced
// by the precommit M_W and M_H datasets; fp16_mixed_precision is fixed to false and the
// data type to F32.
FIXTURE_DATA_TEST_CASE(RunSmall3D, CLGEMMMatrixMultiplyReshaped3DFixture<float>, framework::DatasetMode::ALL,

272

combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(

273

m_w_values_precommit,

274

m_h_values_precommit),

n_values_precommit),

k_values_precommit),

b_values),

alpha_values),

beta_values),

v0_values_precommit),

281

h0_values_precommit),

282

broadcast_bias_values),

283

framework::dataset::make("fp16_mixed_precision", false)),

284

act_values),

285

framework::dataset::make("DataType", DataType::F32)),

gpu_arch_values))

{

// Validate output: fixture target against fixture reference, using the FP32 tolerances

validate(CLAccessor(_target), _reference, rel_tolerance_f32, 0.f, abs_tolerance_f32);

290

}

291

292

// FP32, DatasetMode::NIGHTLY, 3D fixture. Like RunLarge, but the single M dataset is
// replaced by the nightly M_W and M_H datasets; fp16_mixed_precision is fixed to false
// and the data type to F32.
FIXTURE_DATA_TEST_CASE(RunLarge3D, CLGEMMMatrixMultiplyReshaped3DFixture<float>, framework::DatasetMode::NIGHTLY,

293

combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(

m_w_values_nightly,

m_h_values_nightly),

n_values_nightly),

k_values_nightly),

b_values),

alpha_values),

beta_values),

v0_values_nightly),

h0_values_nightly),

broadcast_bias_values),

304

framework::dataset::make("fp16_mixed_precision", false)),

305

act_values),

306

framework::dataset::make("DataType", DataType::F32)),

gpu_arch_values))

{

// Validate output: fixture target against fixture reference, using the FP32 tolerances

validate(CLAccessor(_target), _reference, rel_tolerance_f32, 0.f, abs_tolerance_f32);

311

}

312

313

TEST_SUITE_END() // FP32

314

315

TEST_SUITE(FP16)

316

// FP16, DatasetMode::ALL. Sweeps the precommit M/N/K/V0/H0 values against every batch
// size, alpha, beta, bias broadcast flag, activation and GPU target. Unlike the FP32
// cases it also sweeps fp16_mixed_precision over both true and false.
FIXTURE_DATA_TEST_CASE(RunSmall, CLGEMMMatrixMultiplyReshapedFixture<half>, framework::DatasetMode::ALL,

317

combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(

m_values_precommit,

n_values_precommit),

k_values_precommit),

b_values),

alpha_values),

beta_values),

v0_values_precommit),

325

h0_values_precommit),

326

broadcast_bias_values),

327

fp16_mixed_precision_values),

328

act_values),

329

framework::dataset::make("DataType", DataType::F16)),

gpu_arch_values))

{

// Validate output: fixture target against fixture reference, using the FP16 tolerances

validate(CLAccessor(_target), _reference, rel_tolerance_f16, tolerance_num_f16);

334

}

335

336

// FP16, DatasetMode::NIGHTLY. Same sweep as the FP16 RunSmall case but with the nightly
// M/N/K/V0/H0 datasets; fp16_mixed_precision is swept over both true and false.
FIXTURE_DATA_TEST_CASE(RunLarge, CLGEMMMatrixMultiplyReshapedFixture<half>, framework::DatasetMode::NIGHTLY,

337

combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(

m_values_nightly,

n_values_nightly),

k_values_nightly),

b_values),

alpha_values),

beta_values),

v0_values_nightly),

h0_values_nightly),

broadcast_bias_values),

347

fp16_mixed_precision_values),

348

act_values),

349

framework::dataset::make("DataType", DataType::F16)),

gpu_arch_values))

{

// Validate output: fixture target against fixture reference, using the FP16 tolerances

validate(CLAccessor(_target), _reference, rel_tolerance_f16, tolerance_num_f16);

354

}

355

356

// FP16, DatasetMode::ALL, 3D fixture. Like the FP16 RunSmall case, but the single M
// dataset is replaced by the precommit M_W and M_H datasets; fp16_mixed_precision is
// swept over both true and false.
FIXTURE_DATA_TEST_CASE(RunSmall3D, CLGEMMMatrixMultiplyReshaped3DFixture<half>, framework::DatasetMode::ALL,

357

combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(

358

m_w_values_precommit,

359

m_h_values_precommit),

n_values_precommit),

k_values_precommit),

b_values),

alpha_values),

beta_values),

v0_values_precommit),

366

h0_values_precommit),

367

broadcast_bias_values),

368

fp16_mixed_precision_values),

369

act_values),

370

framework::dataset::make("DataType", DataType::F16)),

gpu_arch_values))

{

// Validate output: fixture target against fixture reference, using the FP16 tolerances

validate(CLAccessor(_target), _reference, rel_tolerance_f16, tolerance_num_f16);

375

}

376

377

// FP16, DatasetMode::NIGHTLY, 3D fixture. Like the FP16 RunLarge case, but the single M
// dataset is replaced by the nightly M_W and M_H datasets; fp16_mixed_precision is swept
// over both true and false.
FIXTURE_DATA_TEST_CASE(RunLarge3D, CLGEMMMatrixMultiplyReshaped3DFixture<half>, framework::DatasetMode::NIGHTLY,

378

combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(

m_w_values_nightly,

m_h_values_nightly),

n_values_nightly),

k_values_nightly),

b_values),

alpha_values),

beta_values),

v0_values_nightly),

h0_values_nightly),

broadcast_bias_values),

389

fp16_mixed_precision_values),

390

act_values),

391

framework::dataset::make("DataType", DataType::F16)),

gpu_arch_values))

{

// Validate output: fixture target against fixture reference, using the FP16 tolerances

validate(CLAccessor(_target), _reference, rel_tolerance_f16, tolerance_num_f16);

396

}

397

398

TEST_SUITE_END() // FP16

399

TEST_SUITE_END() // Float

400

TEST_SUITE_END() // GEMMMatrixMultiplyInterleavedTransposed

401

TEST_SUITE_END() // CL

402

} // namespace validation

403

} // namespace test

404

} // namespace arm_compute