/*
 * Copyright (c) 2017-2020 Arm Limited.
 *
 * SPDX-License-Identifier: MIT
 *
 * Permission is hereby granted, free of charge, to any person obtaining a copy
 * of this software and associated documentation files (the "Software"), to
 * deal in the Software without restriction, including without limitation the
 * rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
 * sell copies of the Software, and to permit persons to whom the Software is
 * furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in all
 * copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
 * SOFTWARE.
 */
#ifndef ARM_COMPUTE_TEST_GEMM_FIXTURE
#define ARM_COMPUTE_TEST_GEMM_FIXTURE

#include "arm_compute/core/KernelDescriptors.h"
#include "arm_compute/core/TensorShape.h"
#include "arm_compute/core/Types.h"
#include "tests/AssetsLibrary.h"
#include "tests/Globals.h"
#include "tests/IAccessor.h"
#include "tests/framework/Asserts.h"
#include "tests/framework/Fixture.h"
#include "tests/validation/Helpers.h"
#include "tests/validation/reference/ActivationLayer.h"
#include "tests/validation/reference/GEMM.h"

#include <cstring> // memcpy is used when broadcasting the bias in the reference computation
#include <limits>  // std::numeric_limits is used to fill tensor borders with infinity
#include <random>

namespace arm_compute
{
namespace test
{
namespace validation
{
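/** Generic GEMM validation fixture: computes dst = alpha * A * B + beta * C with both the
 *  function under test and the reference implementation, optionally disabling the C matrix
 *  and/or reinterpreting the input/output as 3D tensors.
 */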
template <typename TensorType, typename AccessorType, typename FunctionType, typename T, bool disable_c = false, bool reinterpret_input_as_3d = false, bool reinterpret_output_as_3d = false>
class GEMMValidationFixture : public framework::Fixture
{
public:
    template <typename...>
    void setup(TensorShape shape_a, TensorShape shape_b, TensorShape shape_c, TensorShape output_shape, float alpha, float beta, bool pretranspose, DataType data_type)
    {
        ARM_COMPUTE_UNUSED(pretranspose);
        _target    = compute_target(shape_a, shape_b, shape_c, output_shape, alpha, beta, data_type);
        _reference = compute_reference(shape_a, shape_b, output_shape, alpha, beta, data_type);
    }

protected:
    template <typename U>
    void fill(U &&tensor, int i, float lo = -1.f, float hi = 1.f)
    {
        switch(tensor.data_type())
        {
            case DataType::F16:
            case DataType::F32:
            {
                std::uniform_real_distribution<> distribution(lo, hi);
                library->fill(tensor, distribution, i);
                break;
            }
            default:
                library->fill_tensor_uniform(tensor, i);
        }
    }

    TensorType compute_target(const TensorShape &shape_a, const TensorShape &shape_b, const TensorShape &shape_c, const TensorShape &output_shape, float alpha, float beta,
                              DataType data_type)
    {
        // Create tensors
        TensorType a   = create_tensor<TensorType>(shape_a, data_type, 1);
        TensorType b   = create_tensor<TensorType>(shape_b, data_type, 1);
        TensorType c   = create_tensor<TensorType>(shape_c, data_type, 1);
        TensorType dst = create_tensor<TensorType>(output_shape, data_type, 1);

        // Create and configure function
        FunctionType gemm;
        // The GEMMInfo includes the depth of the output in case it is reinterpreted as 3D.
        // If the output shape has the same number of dimensions as the input, a plain 2D matrix multiplication is performed (depth_output_reinterpreted_as_3D = 0);
        // otherwise the reinterpreted version of GEMM is used (depth_output_reinterpreted_as_3D = depth of the 3D output).
        gemm.configure(&a,
                       &b,
                       (disable_c) ? nullptr : &c,
                       &dst,
                       alpha, beta,
                       GEMMInfo(false, false, false, (reinterpret_output_as_3d ? output_shape[2] : 0), reinterpret_input_as_3d, false, GEMMLowpOutputStageInfo(), false, (reinterpret_input_as_3d
                                                                                                                                                                          || reinterpret_output_as_3d)));
        ARM_COMPUTE_EXPECT(a.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(b.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(c.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(dst.info()->is_resizable(), framework::LogLevel::ERRORS);

        // Allocate tensors
        a.allocator()->allocate();
        b.allocator()->allocate();
        c.allocator()->allocate();
        dst.allocator()->allocate();

        ARM_COMPUTE_EXPECT(!a.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!b.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!c.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!dst.info()->is_resizable(), framework::LogLevel::ERRORS);

        // Fill tensors
        fill(AccessorType(a), 0);
        fill(AccessorType(b), 1);
        if(!disable_c)
        {
            fill(AccessorType(c), 2);
        }

        // Compute GEMM function
        gemm.run();

        return dst;
    }

    SimpleTensor<T> compute_reference(const TensorShape &shape_a, const TensorShape &shape_b, const TensorShape &output_shape, float alpha, float beta,
                                      DataType data_type)
    {
        TensorShape shape_a_to_use = shape_a;

        if(reinterpret_input_as_3d)
        {
            // Collapse the second and third dimension if the input is 3D
            shape_a_to_use.collapse(2U, 1U);
        }

        // Create reference
        SimpleTensor<T> a{ shape_a_to_use, data_type, 1 };
        SimpleTensor<T> b{ shape_b, data_type, 1 };
        SimpleTensor<T> c{ output_shape, data_type, 1 };

        // Fill reference
        fill(a, 0);
        fill(b, 1);
        fill(c, 2);

        if(reinterpret_input_as_3d || reinterpret_output_as_3d)
        {
            const int n          = shape_b[0];
            const int m          = reinterpret_output_as_3d ? output_shape[1] * output_shape[2] : output_shape[1];
            const int batch_size = reinterpret_output_as_3d ? output_shape[3] : output_shape[2];

            // In case of broadcast, we simply need to copy the first row into the following "M" ones
            for(int i = 1; i < m * batch_size; i++)
            {
                memcpy(c.data() + i * n, c.data(), n * sizeof(T));
            }
        }

        // Setting beta to 0 will effectively disable C for the
        // computation of the reference: alpha * A * B + 0 * C
        return reference::gemm<T>(a, b, c, alpha, disable_c ? 0.f : beta);
    }

    TensorType      _target{};
    SimpleTensor<T> _reference{};
};

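// How these fixtures are typically consumed by a validation suite (a minimal sketch; the
// CLGEMMFixture alias and the dataset/tolerance names below are assumptions for
// illustration, not part of this header):
//
//   template <typename T>
//   using CLGEMMFixture = GEMMValidationFixture<CLTensor, CLAccessor, CLGEMM, T>;
//
//   FIXTURE_DATA_TEST_CASE(RunSmall, CLGEMMFixture<float>, framework::DatasetMode::PRECOMMIT, small_gemm_dataset)
//   {
//       // _target and _reference were populated by setup()
//       validate(CLAccessor(_target), _reference, tolerance_f32);
//   }

/** Fixture for the (non-reshaped) GEMM matrix multiply functions: validates
 *  dst = act(alpha * LHS * RHS + beta * bias) for a given GPU architecture, with optional
 *  bias broadcast and FP16 mixed-precision accumulation.
 */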
template <typename TensorType, typename AccessorType, typename T, typename GEMMFunctionType>
class GEMMMatrixMultiplyValidationFixture : public framework::Fixture
{
public:
    template <typename...>
    void setup(unsigned int m, unsigned int n, unsigned int k, unsigned int batch_size, float alpha, float beta, bool broadcast_bias, bool fp16_mixed_precision, const ActivationLayerInfo &act_info,
               DataType data_type, GPUTarget gpu_arch)
    {
        // Set the tensor shapes for LHS and RHS matrices
        const TensorShape lhs_shape(k, m, batch_size);
        const TensorShape rhs_shape(n, k, batch_size);
        const TensorShape bias_shape(n,
                                     broadcast_bias ? 1 : m,
                                     broadcast_bias ? 1 : batch_size);

        _target    = compute_target(lhs_shape, rhs_shape, bias_shape, data_type, alpha, beta, broadcast_bias, fp16_mixed_precision, act_info, gpu_arch);
        _reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, broadcast_bias, act_info);
    }

protected:
    template <typename U>
    void fill(U &&tensor, int i)
    {
        std::uniform_real_distribution<> distribution(-1.0f, 1.0f);
        library->fill(tensor, distribution, i);

        // Fill the border with infinity in order to check for the presence of NaN values (i.e. inf * 0)
        std::uniform_real_distribution<> distribution_inf(std::numeric_limits<float>::infinity(), std::numeric_limits<float>::infinity());
        library->fill_borders_with_garbage(tensor, distribution_inf, i);
    }

    TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, DataType data_type, float alpha, float beta, bool broadcast_bias,
                              bool fp16_mixed_precision, const ActivationLayerInfo &act_info, GPUTarget gpu_arch)
    {
        // Create tensors
        TensorType lhs  = create_tensor<TensorType>(lhs_shape, data_type, 1);
        TensorType rhs  = create_tensor<TensorType>(rhs_shape, data_type, 1);
        TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);
        TensorType dst;

        const unsigned int m = lhs_shape[1];
        const unsigned int n = rhs_shape[0];
        const unsigned int k = lhs_shape[0];
        GEMMReshapeInfo reshape_info(m, n, k, 1, 1, 0, false, broadcast_bias);

        // The output tensor will be auto-initialized within the function

        // Create and configure function
        GEMMFunctionType gemm;
        gemm.configure(gpu_arch, &lhs, &rhs, &bias, &dst, alpha, beta, false, reshape_info, fp16_mixed_precision, act_info);

        ARM_COMPUTE_EXPECT(lhs.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(rhs.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(bias.info()->is_resizable(), framework::LogLevel::ERRORS);

        // Allocate tensors
        lhs.allocator()->allocate();
        rhs.allocator()->allocate();
        bias.allocator()->allocate();
        dst.allocator()->allocate();

        ARM_COMPUTE_EXPECT(!lhs.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!rhs.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!bias.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!dst.info()->is_resizable(), framework::LogLevel::ERRORS);

        // Fill tensors
        fill(AccessorType(lhs), 0);
        fill(AccessorType(rhs), 1);
        fill(AccessorType(bias), 2);

        // Compute GEMM
        gemm.run();

        return dst;
    }

    SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, bool broadcast_bias,
                                      const ActivationLayerInfo &act_info)
    {
        TensorShape dst_shape = lhs_shape;
        dst_shape[0]          = rhs_shape[0];
        dst_shape[1]          = lhs_shape[1];

        // Create reference
        SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };
        SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };
        SimpleTensor<T> bias{ dst_shape, data_type, 1 };

        const int n          = rhs_shape[0];
        const int m          = lhs_shape[1];
        const int batch_size = lhs_shape[2];

        // Fill reference
        fill(lhs, 0);
        fill(rhs, 1);
        fill(bias, 2);

        if(broadcast_bias)
        {
            // In case of broadcast, we simply need to copy the first row into the following "M" ones
            for(int i = 1; i < m * batch_size; i++)
            {
                memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));
            }
        }

        return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);
    }

    TensorType      _target{};
    SimpleTensor<T> _reference{};
};

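/** GEMM3D variant of the matrix multiply fixture: the output is reinterpreted as a 3D
 *  tensor of height m_h and the bias (a single row) is broadcast across the M dimension.
 */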
template <typename TensorType, typename AccessorType, typename T, typename GEMMFunctionType>
class GEMMMatrixMultiply3DValidationFixture : public framework::Fixture
{
public:
    template <typename...>
    void setup(unsigned int m_w, unsigned int m_h, unsigned int n, unsigned int k, unsigned int batch_size, float alpha, float beta, bool broadcast_bias, bool fp16_mixed_precision,
               const ActivationLayerInfo &act_info, DataType data_type, GPUTarget gpu_arch)
    {
        ARM_COMPUTE_UNUSED(broadcast_bias);

        // In case of GEMM3D, m is the product of m_w and m_h
        const unsigned int m = m_w * m_h;

        // Set the tensor shapes for LHS and RHS matrices
        const TensorShape lhs_shape(k, m, batch_size);
        const TensorShape rhs_shape(n, k, batch_size);
        const TensorShape bias_shape(n, 1, 1);

        _target    = compute_target(lhs_shape, rhs_shape, bias_shape, data_type, alpha, beta, m_h, fp16_mixed_precision, act_info, gpu_arch);
        _reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, m_h, act_info);
    }

protected:
    template <typename U>
    void fill(U &&tensor, int i)
    {
        std::uniform_real_distribution<> distribution(-1.0f, 1.0f);
        library->fill(tensor, distribution, i);
    }

    TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, DataType data_type, float alpha, float beta, unsigned int m_h,
                              bool fp16_mixed_precision, const ActivationLayerInfo &act_info, GPUTarget gpu_arch)
    {
        // Create tensors
        TensorType lhs  = create_tensor<TensorType>(lhs_shape, data_type, 1);
        TensorType rhs  = create_tensor<TensorType>(rhs_shape, data_type, 1);
        TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);
        TensorType dst;

        const unsigned int m = lhs_shape[1];
        const unsigned int n = rhs_shape[0];
        const unsigned int k = lhs_shape[0];
        GEMMReshapeInfo reshape_info(m, n, k, 1, 1, m_h, false, true);

        // The output tensor will be auto-initialized within the function

        // Create and configure function
        GEMMFunctionType gemm;
        gemm.configure(gpu_arch, &lhs, &rhs, &bias, &dst, alpha, beta, false, reshape_info, fp16_mixed_precision, act_info);

        ARM_COMPUTE_EXPECT(lhs.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(rhs.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(bias.info()->is_resizable(), framework::LogLevel::ERRORS);

        // Allocate tensors
        lhs.allocator()->allocate();
        rhs.allocator()->allocate();
        bias.allocator()->allocate();
        dst.allocator()->allocate();

        ARM_COMPUTE_EXPECT(!lhs.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!rhs.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!bias.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!dst.info()->is_resizable(), framework::LogLevel::ERRORS);

        // Fill tensors
        fill(AccessorType(lhs), 0);
        fill(AccessorType(rhs), 1);
        fill(AccessorType(bias), 2);

        // Compute GEMM
        gemm.run();

        return dst;
    }

    SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, unsigned int m_h,
                                      const ActivationLayerInfo &act_info)
    {
        TensorShape dst_shape = lhs_shape;
        dst_shape.set(0, rhs_shape[0]);
        dst_shape.set(1, lhs_shape[1] / m_h);
        dst_shape.set(2, m_h);
        dst_shape.set(3, lhs_shape[2]);

        // Create reference
        SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };
        SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };
        SimpleTensor<T> bias{ dst_shape, data_type, 1 };

        const int n          = rhs_shape[0];
        const int m          = lhs_shape[1];
        const int batch_size = lhs_shape[2];

        // Fill reference
        fill(lhs, 0);
        fill(rhs, 1);
        fill(bias, 2);

        // In case of broadcast, we simply need to copy the first row into the following "M" ones
        for(int i = 1; i < m * batch_size; i++)
        {
            memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));
        }

        return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);
    }

    TensorType      _target{};
    SimpleTensor<T> _reference{};
};

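/** Fixture for the interleaved-transposed GEMM path: the LHS matrix is interleaved and
 *  transposed and the RHS matrix is reshaped before the matrix multiplication runs.
 */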
template <typename TensorType, typename AccessorType, typename T, typename ReshapeLHSFunctionType, typename ReshapeRHSFunctionType, typename GEMMFunctionType>
class GEMMMatrixMultiplyInterleavedTransposedValidationFixture : public framework::Fixture
{
public:
    template <typename...>
    void setup(unsigned int m, unsigned int n, unsigned int k, unsigned int batch_size, float alpha, float beta, unsigned int v0, unsigned int h0, bool broadcast_bias, bool fp16_mixed_precision,
               const ActivationLayerInfo &act_info, DataType data_type, GPUTarget gpu_arch)
    {
        GEMMLHSMatrixInfo lhs_info;
        lhs_info.m0         = 4;
        lhs_info.k0         = 4;
        lhs_info.v0         = v0;
        lhs_info.interleave = true;
        lhs_info.transpose  = true;

        GEMMRHSMatrixInfo rhs_info;
        rhs_info.n0         = 16 / sizeof(T);
        rhs_info.k0         = 1;
        rhs_info.h0         = h0;
        rhs_info.interleave = false;
        rhs_info.transpose  = false;

        // Set the tensor shapes for LHS and RHS matrices
        const TensorShape lhs_shape(k, m, batch_size);
        const TensorShape rhs_shape(n, k, batch_size);
        const TensorShape bias_shape(n,
                                     broadcast_bias ? 1 : m,
                                     broadcast_bias ? 1 : batch_size);

        _target    = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, broadcast_bias, fp16_mixed_precision, act_info, gpu_arch);
        _reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, broadcast_bias, act_info);
    }

protected:
    template <typename U>
    void fill(U &&tensor, int i)
    {
        std::uniform_real_distribution<> distribution(-1.0f, 1.0f);
        library->fill(tensor, distribution, i);

        // Fill the border with infinity in order to check for the presence of NaN values (i.e. inf * 0)
        std::uniform_real_distribution<> distribution_inf(std::numeric_limits<float>::infinity(), std::numeric_limits<float>::infinity());
        library->fill_borders_with_garbage(tensor, distribution_inf, i);
    }

    TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,
                              DataType data_type, float alpha, float beta, bool broadcast_bias, bool fp16_mixed_precision, const ActivationLayerInfo &act_info, GPUTarget gpu_arch)
    {
        // Create tensors
        TensorType lhs  = create_tensor<TensorType>(lhs_shape, data_type, 1);
        TensorType rhs  = create_tensor<TensorType>(rhs_shape, data_type, 1);
        TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);
        TensorType lhs_reshaped;
        TensorType rhs_reshaped;
        TensorType dst;

        const unsigned int m = lhs_shape[1];
        const unsigned int n = rhs_shape[0];
        const unsigned int k = lhs_shape[0];
        GEMMReshapeInfo reshape_info(m, n, k, rhs_info.h0, lhs_info.v0, 0, false, broadcast_bias);

        // The output tensor will be auto-initialized within the function

        // Create and configure function
        ReshapeLHSFunctionType reshape_lhs;
        ReshapeRHSFunctionType reshape_rhs;
        GEMMFunctionType       gemm;
        reshape_lhs.configure(&lhs, &lhs_reshaped, lhs_info);
        reshape_rhs.configure(&rhs, &rhs_reshaped, rhs_info);
        gemm.configure(gpu_arch, &lhs_reshaped, &rhs_reshaped, &bias, &dst, alpha, beta, true, reshape_info, fp16_mixed_precision, act_info);

        ARM_COMPUTE_EXPECT(lhs.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(rhs.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(bias.info()->is_resizable(), framework::LogLevel::ERRORS);

        // Allocate tensors
        lhs.allocator()->allocate();
        rhs.allocator()->allocate();
        lhs_reshaped.allocator()->allocate();
        rhs_reshaped.allocator()->allocate();
        bias.allocator()->allocate();
        dst.allocator()->allocate();

        ARM_COMPUTE_EXPECT(!lhs.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!rhs.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!bias.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!lhs_reshaped.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!rhs_reshaped.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!dst.info()->is_resizable(), framework::LogLevel::ERRORS);

        // Fill tensors
        fill(AccessorType(lhs), 0);
        fill(AccessorType(rhs), 1);
        fill(AccessorType(bias), 2);

        // Compute GEMM
        reshape_lhs.run();
        reshape_rhs.run();
        gemm.run();

        return dst;
    }

    SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, bool broadcast_bias,
                                      const ActivationLayerInfo &act_info)
    {
        TensorShape dst_shape = lhs_shape;
        dst_shape[0]          = rhs_shape[0];
        dst_shape[1]          = lhs_shape[1];

        // Create reference
        SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };
        SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };
        SimpleTensor<T> bias{ dst_shape, data_type, 1 };

        const int n          = rhs_shape[0];
        const int m          = lhs_shape[1];
        const int batch_size = lhs_shape[2];

        // Fill reference
        fill(lhs, 0);
        fill(rhs, 1);
        fill(bias, 2);

        if(broadcast_bias)
        {
            // In case of broadcast, we simply need to copy the first row into the following "M" ones
            for(int i = 1; i < m * batch_size; i++)
            {
                memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));
            }
        }

        return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);
    }

    TensorType      _target{};
    SimpleTensor<T> _reference{};
};

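/** GEMM3D variant of the interleaved-transposed fixture: the output is reinterpreted as a
 *  3D tensor of height m_h and the bias is always broadcast.
 */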
template <typename TensorType, typename AccessorType, typename T, typename ReshapeLHSFunctionType, typename ReshapeRHSFunctionType, typename GEMMFunctionType>
class GEMMMatrixMultiplyInterleavedTransposed3DValidationFixture : public framework::Fixture
{
public:
    template <typename...>
    void setup(unsigned int m_w, unsigned int m_h, unsigned int n, unsigned int k, unsigned int batch_size, float alpha, float beta, unsigned int v0, unsigned int h0, bool broadcast_bias,
               bool fp16_mixed_precision, const ActivationLayerInfo &act_info, DataType data_type, GPUTarget gpu_arch)
    {
        ARM_COMPUTE_UNUSED(broadcast_bias);

        GEMMLHSMatrixInfo lhs_info;
        lhs_info.m0         = 4;
        lhs_info.k0         = 4;
        lhs_info.v0         = v0;
        lhs_info.interleave = true;
        lhs_info.transpose  = true;

        GEMMRHSMatrixInfo rhs_info;
        rhs_info.n0         = 16 / sizeof(T);
        rhs_info.k0         = 1;
        rhs_info.h0         = h0;
        rhs_info.interleave = false;
        rhs_info.transpose  = false;

        // In case of GEMM3D, m is the product of m_w and m_h
        const unsigned int m = m_w * m_h;

        // Set the tensor shapes for LHS and RHS matrices
        const TensorShape lhs_shape(k, m, batch_size);
        const TensorShape rhs_shape(n, k, batch_size);
        const TensorShape bias_shape(n, 1, 1);

        _target    = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, m_h, fp16_mixed_precision, act_info, gpu_arch);
        _reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, m_h, act_info);
    }

protected:
    template <typename U>
    void fill(U &&tensor, int i)
    {
        std::uniform_real_distribution<> distribution(-1.0f, 1.0f);
        library->fill(tensor, distribution, i);
    }

    TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,
                              DataType data_type, float alpha, float beta, unsigned int m_h, bool fp16_mixed_precision, const ActivationLayerInfo &act_info, GPUTarget gpu_arch)
    {
        // Create tensors
        TensorType lhs  = create_tensor<TensorType>(lhs_shape, data_type, 1);
        TensorType rhs  = create_tensor<TensorType>(rhs_shape, data_type, 1);
        TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);
        TensorType lhs_reshaped;
        TensorType rhs_reshaped;
        TensorType dst;

        const unsigned int m = lhs_shape[1];
        const unsigned int n = rhs_shape[0];
        const unsigned int k = lhs_shape[0];
        GEMMReshapeInfo reshape_info(m, n, k, rhs_info.h0, lhs_info.v0, m_h, false, true);

        // The output tensor will be auto-initialized within the function

        // Create and configure function
        ReshapeLHSFunctionType reshape_lhs;
        ReshapeRHSFunctionType reshape_rhs;
        GEMMFunctionType       gemm;
        reshape_lhs.configure(&lhs, &lhs_reshaped, lhs_info);
        reshape_rhs.configure(&rhs, &rhs_reshaped, rhs_info);
        gemm.configure(gpu_arch, &lhs_reshaped, &rhs_reshaped, &bias, &dst, alpha, beta, true, reshape_info, fp16_mixed_precision, act_info);

        ARM_COMPUTE_EXPECT(lhs.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(rhs.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(bias.info()->is_resizable(), framework::LogLevel::ERRORS);

        // Allocate tensors
        lhs.allocator()->allocate();
        rhs.allocator()->allocate();
        lhs_reshaped.allocator()->allocate();
        rhs_reshaped.allocator()->allocate();
        bias.allocator()->allocate();
        dst.allocator()->allocate();

        ARM_COMPUTE_EXPECT(!lhs.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!rhs.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!lhs_reshaped.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!rhs_reshaped.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!bias.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!dst.info()->is_resizable(), framework::LogLevel::ERRORS);

        // Fill tensors
        fill(AccessorType(lhs), 0);
        fill(AccessorType(rhs), 1);
        fill(AccessorType(bias), 2);

        // Compute GEMM
        reshape_lhs.run();
        reshape_rhs.run();
        gemm.run();

        return dst;
    }

    SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, unsigned int m_h,
                                      const ActivationLayerInfo &act_info)
    {
        TensorShape dst_shape = lhs_shape;
        dst_shape.set(0, rhs_shape[0]);
        dst_shape.set(1, lhs_shape[1] / m_h);
        dst_shape.set(2, m_h);
        dst_shape.set(3, lhs_shape[2]);

        // Create reference
        SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };
        SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };
        SimpleTensor<T> bias{ dst_shape, data_type, 1 };

        const int n          = rhs_shape[0];
        const int m          = lhs_shape[1];
        const int batch_size = lhs_shape[2];

        // Fill reference
        fill(lhs, 0);
        fill(rhs, 1);
        fill(bias, 2);

        // In case of broadcast, we simply need to copy the first row into the following "M" ones
        for(int i = 1; i < m * batch_size; i++)
        {
            memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));
        }

        return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);
    }

    TensorType      _target{};
    SimpleTensor<T> _reference{};
};

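/** Fixture for the reshaped GEMM kernels: both LHS and RHS are reshaped with configurable
 *  block sizes (m0/n0/k0), interleaving and, for the RHS, optional export to an OpenCL
 *  image. The reference is only computed when the RHS reshape configuration is supported.
 */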
template <typename TensorType, typename AccessorType, typename T, typename ReshapeLHSFunctionType, typename ReshapeRHSFunctionType, typename GEMMFunctionType, bool fp_mixed_precision = false>
class GEMMMatrixMultiplyReshapedValidationFixture : public framework::Fixture
{
public:
    template <typename...>
    void setup(unsigned int m, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0, unsigned int v0, unsigned int h0, bool interleave_lhs,
               bool interleave_rhs, bool export_to_cl_image, DataType data_type, float alpha, float beta, bool broadcast_bias, bool lhs_transpose, const ActivationLayerInfo &act_info)
    {
        GEMMLHSMatrixInfo lhs_info;
        lhs_info.m0         = m0;
        lhs_info.k0         = k0;
        lhs_info.v0         = v0;
        lhs_info.interleave = interleave_lhs;
        lhs_info.transpose  = lhs_transpose;

        GEMMRHSMatrixInfo rhs_info;
        rhs_info.n0                 = n0;
        rhs_info.k0                 = k0;
        rhs_info.h0                 = h0;
        rhs_info.interleave         = interleave_rhs;
        rhs_info.transpose          = !lhs_transpose;
        rhs_info.export_to_cl_image = export_to_cl_image;

        // Set the tensor shapes for LHS and RHS matrices
        const TensorShape lhs_shape(k, m, batch_size);
        const TensorShape rhs_shape(n, k, batch_size);
        const TensorShape bias_shape(n,
                                     broadcast_bias ? 1 : m,
                                     broadcast_bias ? 1 : batch_size);

        _target = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, broadcast_bias, act_info);
        if(validate_result)
        {
            _reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, broadcast_bias, act_info);
        }
    }

protected:
    template <typename U>
    void fill(U &&tensor, int i)
    {
        std::uniform_real_distribution<> distribution(-1.0f, 1.0f);
        library->fill(tensor, distribution, i);

        // Fill the border with infinity in order to check for the presence of NaN values (i.e. inf * 0)
        std::uniform_real_distribution<> distribution_inf(std::numeric_limits<float>::infinity(), std::numeric_limits<float>::infinity());
        library->fill_borders_with_garbage(tensor, distribution_inf, i);
    }

    TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,
                              DataType data_type, float alpha, float beta, bool broadcast_bias, const ActivationLayerInfo &act_info)
    {
        // Create tensors
        TensorType lhs  = create_tensor<TensorType>(lhs_shape, data_type, 1);
        TensorType rhs  = create_tensor<TensorType>(rhs_shape, data_type, 1);
        TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);
        TensorType lhs_reshaped;
        TensorType rhs_reshaped;
        TensorType dst;

        const unsigned int M = lhs_shape[1];
        const unsigned int N = rhs_shape[0];
        const unsigned int K = lhs_shape[0];
        GEMMKernelInfo kernel_info;
        kernel_info.m                       = M;
        kernel_info.n                       = N;
        kernel_info.k                       = K;
        kernel_info.depth_output_gemm3d     = 0;
        kernel_info.reinterpret_input_as_3d = false;
        kernel_info.broadcast_bias          = broadcast_bias;
        kernel_info.activation_info         = act_info;
        kernel_info.fp_mixed_precision      = fp_mixed_precision;

        // The output tensor will be auto-initialized within the function

        // Create and configure function
        ReshapeLHSFunctionType reshape_lhs;
        ReshapeRHSFunctionType reshape_rhs;
        GEMMFunctionType       gemm;

        validate_result = bool(reshape_rhs.validate(rhs.info(), rhs_reshaped.info(), rhs_info));
        validate_result = validate_result || !rhs_info.export_to_cl_image;
        if(!validate_result)
        {
            return nullptr;
        }

        reshape_lhs.configure(&lhs, &lhs_reshaped, lhs_info);
        reshape_rhs.configure(&rhs, &rhs_reshaped, rhs_info);
        gemm.configure(&lhs_reshaped, &rhs_reshaped, &bias, &dst, alpha, beta, lhs_info, rhs_info, kernel_info);

        ARM_COMPUTE_EXPECT(lhs.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(rhs.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(bias.info()->is_resizable(), framework::LogLevel::ERRORS);

        // Allocate tensors
        lhs.allocator()->allocate();
        rhs.allocator()->allocate();
        lhs_reshaped.allocator()->allocate();
        rhs_reshaped.allocator()->allocate();
        bias.allocator()->allocate();
        dst.allocator()->allocate();

        ARM_COMPUTE_EXPECT(!lhs.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!rhs.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!bias.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!lhs_reshaped.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!rhs_reshaped.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!dst.info()->is_resizable(), framework::LogLevel::ERRORS);

        // Fill tensors
        fill(AccessorType(lhs), 0);
        fill(AccessorType(rhs), 1);
        fill(AccessorType(bias), 2);

        // Compute GEMM
        reshape_lhs.run();
        reshape_rhs.run();
        gemm.run();

        return dst;
    }

    SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, bool broadcast_bias,
                                      const ActivationLayerInfo &act_info)
    {
        TensorShape dst_shape = lhs_shape;
        dst_shape[0]          = rhs_shape[0];
        dst_shape[1]          = lhs_shape[1];

        // Create reference
        SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };
        SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };
        SimpleTensor<T> bias{ dst_shape, data_type, 1 };

        const int n          = rhs_shape[0];
        const int m          = lhs_shape[1];
        const int batch_size = lhs_shape[2];

        // Fill reference
        fill(lhs, 0);
        fill(rhs, 1);
        fill(bias, 2);

        if(broadcast_bias)
        {
            // In case of broadcast, we simply need to copy the first row into the following "M" ones
            for(int i = 1; i < m * batch_size; i++)
            {
                memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));
            }
        }

        if(fp_mixed_precision)
        {
            return reference::activation_layer(reference::gemm_mixed_precision<T>(lhs, rhs, bias, alpha, beta), act_info);
        }
        else
        {
            return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);
        }
    }

    bool            validate_result = true;
    TensorType      _target{};
    SimpleTensor<T> _reference{};
};

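/** GEMM3D variant of the reshaped GEMM fixture: the output is reinterpreted as a 3D tensor
 *  of height m_h and the bias is always broadcast.
 */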
template <typename TensorType, typename AccessorType, typename T, typename ReshapeLHSFunctionType, typename ReshapeRHSFunctionType, typename GEMMFunctionType, bool fp_mixed_precision = false>
class GEMMMatrixMultiplyReshaped3DValidationFixture : public framework::Fixture
{
public:
    template <typename...>
    void setup(unsigned int m_w, unsigned int m_h, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0, unsigned int v0, unsigned int h0,
               bool interleave_lhs, bool interleave_rhs, bool export_to_cl_image, DataType data_type, float alpha, float beta, bool lhs_transpose, const ActivationLayerInfo &act_info)
    {
        GEMMLHSMatrixInfo lhs_info;
        lhs_info.m0         = m0;
        lhs_info.k0         = k0;
        lhs_info.v0         = v0;
        lhs_info.interleave = interleave_lhs;
        lhs_info.transpose  = lhs_transpose;

        GEMMRHSMatrixInfo rhs_info;
        rhs_info.n0                 = n0;
        rhs_info.k0                 = k0;
        rhs_info.h0                 = h0;
        rhs_info.interleave         = interleave_rhs;
        rhs_info.transpose          = !lhs_transpose;
        rhs_info.export_to_cl_image = export_to_cl_image;

        // In case of GEMM3D, m is the product of m_w and m_h
        const unsigned int m = m_w * m_h;

        // Set the tensor shapes for LHS and RHS matrices
        const TensorShape lhs_shape(k, m, batch_size);
        const TensorShape rhs_shape(n, k, batch_size);
        const TensorShape bias_shape(n, 1, 1);

        _target = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, m_h, act_info);
        if(validate_result)
        {
            _reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, m_h, act_info);
        }
    }

protected:
    template <typename U>
    void fill(U &&tensor, int i)
    {
        std::uniform_real_distribution<> distribution(-1.0f, 1.0f);
        library->fill(tensor, distribution, i);
    }

    TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,
                              DataType data_type, float alpha, float beta, unsigned int m_h, const ActivationLayerInfo &act_info)
    {
        // Create tensors
        TensorType lhs  = create_tensor<TensorType>(lhs_shape, data_type, 1);
        TensorType rhs  = create_tensor<TensorType>(rhs_shape, data_type, 1);
        TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);
        TensorType lhs_reshaped;
        TensorType rhs_reshaped;
        TensorType dst;

        const unsigned int M = lhs_shape[1];
        const unsigned int N = rhs_shape[0];
        const unsigned int K = lhs_shape[0];
        GEMMKernelInfo kernel_info;
        kernel_info.m                       = M;
        kernel_info.n                       = N;
        kernel_info.k                       = K;
        kernel_info.depth_output_gemm3d     = m_h;
        kernel_info.reinterpret_input_as_3d = false;
        kernel_info.broadcast_bias          = true;
        kernel_info.activation_info         = act_info;
        kernel_info.fp_mixed_precision      = fp_mixed_precision;

        // The output tensor will be auto-initialized within the function

        // Create and configure function
        ReshapeLHSFunctionType reshape_lhs;
        ReshapeRHSFunctionType reshape_rhs;
        GEMMFunctionType       gemm;

        validate_result = bool(reshape_rhs.validate(rhs.info(), rhs_reshaped.info(), rhs_info));
        validate_result = validate_result || !rhs_info.export_to_cl_image;
        if(!validate_result)
        {
            return nullptr;
        }

        reshape_lhs.configure(&lhs, &lhs_reshaped, lhs_info);
        reshape_rhs.configure(&rhs, &rhs_reshaped, rhs_info);
        gemm.configure(&lhs_reshaped, &rhs_reshaped, &bias, &dst, alpha, beta, lhs_info, rhs_info, kernel_info);

        ARM_COMPUTE_EXPECT(lhs.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(rhs.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(bias.info()->is_resizable(), framework::LogLevel::ERRORS);

        // Allocate tensors
        lhs.allocator()->allocate();
        rhs.allocator()->allocate();
        lhs_reshaped.allocator()->allocate();
        rhs_reshaped.allocator()->allocate();
        bias.allocator()->allocate();
        dst.allocator()->allocate();

        ARM_COMPUTE_EXPECT(!lhs.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!rhs.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!lhs_reshaped.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!rhs_reshaped.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!bias.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!dst.info()->is_resizable(), framework::LogLevel::ERRORS);

        // Fill tensors
        fill(AccessorType(lhs), 0);
        fill(AccessorType(rhs), 1);
        fill(AccessorType(bias), 2);

        // Compute GEMM
        reshape_lhs.run();
        reshape_rhs.run();
        gemm.run();

        return dst;
    }

    SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, unsigned int m_h,
                                      const ActivationLayerInfo &act_info)
    {
        TensorShape dst_shape = lhs_shape;
        dst_shape.set(0, rhs_shape[0]);
        dst_shape.set(1, lhs_shape[1] / m_h);
        dst_shape.set(2, m_h);
        dst_shape.set(3, lhs_shape[2]);

        // Create reference
        SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };
        SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };
        SimpleTensor<T> bias{ dst_shape, data_type, 1 };

        const int n          = rhs_shape[0];
        const int m          = lhs_shape[1];
        const int batch_size = lhs_shape[2];

        // Fill reference
        fill(lhs, 0);
        fill(rhs, 1);
        fill(bias, 2);

        // In case of broadcast, we simply need to copy the first row into the following "M" ones
        for(int i = 1; i < m * batch_size; i++)
        {
            memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));
        }

        if(fp_mixed_precision)
        {
            return reference::activation_layer(reference::gemm_mixed_precision<T>(lhs, rhs, bias, alpha, beta), act_info);
        }
        else
        {
            return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);
        }
    }

    bool            validate_result = true;
    TensorType      _target{};
    SimpleTensor<T> _reference{};
};

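/** Fixture for the reshaped-only-RHS GEMM kernels: only the RHS matrix is reshaped before
 *  the multiplication, while the LHS is consumed as-is.
 */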
template <typename TensorType, typename AccessorType, typename T, typename ReshapeRHSFunctionType, typename GEMMFunctionType>
class GEMMMatrixMultiplyReshapedOnlyRHSValidationFixture : public framework::Fixture
{
public:
    template <typename...>
    void setup(unsigned int m, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0, unsigned int h0,
               bool interleave_rhs, bool transpose_rhs, bool export_to_cl_image, DataType data_type, float alpha, float beta, bool broadcast_bias, const ActivationLayerInfo &act_info)
    {
        GEMMLHSMatrixInfo lhs_info;
        lhs_info.m0 = m0;
        lhs_info.k0 = k0;

        GEMMRHSMatrixInfo rhs_info;
        rhs_info.n0                 = n0;
        rhs_info.k0                 = k0;
        rhs_info.h0                 = h0;
        rhs_info.interleave         = interleave_rhs;
        rhs_info.transpose          = transpose_rhs;
        rhs_info.export_to_cl_image = export_to_cl_image;

        // Set the tensor shapes for LHS and RHS matrices
        const TensorShape lhs_shape(k, m, batch_size);
        const TensorShape rhs_shape(n, k, batch_size);
        const TensorShape bias_shape(n,
                                     broadcast_bias ? 1 : m,
                                     broadcast_bias ? 1 : batch_size);

        _target = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, broadcast_bias, act_info);
        if(validate_result)
        {
            _reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, broadcast_bias, act_info);
        }
    }

protected:
    template <typename U>
    void fill(U &&tensor, int i)
    {
        std::uniform_real_distribution<> distribution(-1.0f, 1.0f);
        library->fill(tensor, distribution, i);

        // Fill the border with infinity in order to check for the presence of NaN values (i.e. inf * 0)
        std::uniform_real_distribution<> distribution_inf(std::numeric_limits<float>::infinity(), std::numeric_limits<float>::infinity());
        library->fill_borders_with_garbage(tensor, distribution_inf, i);
    }

    TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,
                              DataType data_type, float alpha, float beta, bool broadcast_bias, const ActivationLayerInfo &act_info)
    {
        // Create tensors
        TensorType lhs  = create_tensor<TensorType>(lhs_shape, data_type, 1);
        TensorType rhs  = create_tensor<TensorType>(rhs_shape, data_type, 1);
        TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);
        TensorType rhs_reshaped;
        TensorType dst;

        const unsigned int M = lhs_shape[1];
        const unsigned int N = rhs_shape[0];
        const unsigned int K = lhs_shape[0];
        GEMMKernelInfo kernel_info;
        kernel_info.m                       = M;
        kernel_info.n                       = N;
        kernel_info.k                       = K;
        kernel_info.depth_output_gemm3d     = 0;
        kernel_info.reinterpret_input_as_3d = false;
        kernel_info.broadcast_bias          = broadcast_bias;
        kernel_info.activation_info         = act_info;

        // The output tensor will be auto-initialized within the function

        // Create and configure function
        ReshapeRHSFunctionType reshape_rhs;
        GEMMFunctionType       gemm;

        validate_result = bool(reshape_rhs.validate(rhs.info(), rhs_reshaped.info(), rhs_info));
        validate_result = validate_result || !rhs_info.export_to_cl_image;
        if(!validate_result)
        {
            return nullptr;
        }

        reshape_rhs.configure(&rhs, &rhs_reshaped, rhs_info);
        gemm.configure(&lhs, &rhs_reshaped, &bias, &dst, alpha, beta, lhs_info, rhs_info, kernel_info);

        ARM_COMPUTE_EXPECT(lhs.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(rhs.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(bias.info()->is_resizable(), framework::LogLevel::ERRORS);

        // Allocate tensors
        lhs.allocator()->allocate();
        rhs.allocator()->allocate();
        rhs_reshaped.allocator()->allocate();
        bias.allocator()->allocate();
        dst.allocator()->allocate();

        ARM_COMPUTE_EXPECT(!lhs.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!rhs.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!rhs_reshaped.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!bias.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!dst.info()->is_resizable(), framework::LogLevel::ERRORS);

        // Fill tensors
        fill(AccessorType(lhs), 0);
        fill(AccessorType(rhs), 1);
        fill(AccessorType(bias), 2);

        // Compute GEMM
        reshape_rhs.run();
        gemm.run();

        return dst;
    }

    SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, bool broadcast_bias,
                                      const ActivationLayerInfo &act_info)
    {
        TensorShape dst_shape = lhs_shape;
        dst_shape[0]          = rhs_shape[0];
        dst_shape[1]          = lhs_shape[1];

        // Create reference
        SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };
        SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };
        SimpleTensor<T> bias{ dst_shape, data_type, 1 };

        const int n          = rhs_shape[0];
        const int m          = lhs_shape[1];
        const int batch_size = lhs_shape[2];

        // Fill reference
        fill(lhs, 0);
        fill(rhs, 1);
        fill(bias, 2);

        if(broadcast_bias)
        {
            // In case of broadcast, we simply need to copy the first row into the following "M" ones
            for(int i = 1; i < m * batch_size; i++)
            {
                memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));
            }
        }

        return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);
    }

    bool            validate_result = true;
    TensorType      _target{};
    SimpleTensor<T> _reference{};
};

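/** GEMM3D variant of the reshaped-only-RHS fixture: the output is reinterpreted as a 3D
 *  tensor of height m_h, optionally adding dummy Y padding to exercise the has_pad_y path.
 */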
template <typename TensorType, typename AccessorType, typename T, typename ReshapeRHSFunctionType, typename GEMMFunctionType>
class GEMMMatrixMultiplyReshapedOnlyRHS3DValidationFixture : public framework::Fixture
{
public:
    template <typename...>
    void setup(unsigned int m_w, unsigned int m_h, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0, unsigned int h0,
               bool interleave_rhs, bool transpose_rhs, bool export_to_cl_image, bool has_pad_y, DataType data_type, float alpha, float beta, const ActivationLayerInfo &act_info)
    {
        GEMMLHSMatrixInfo lhs_info;
        lhs_info.m0 = m0;
        lhs_info.k0 = k0;

        GEMMRHSMatrixInfo rhs_info;
        rhs_info.n0                 = n0;
        rhs_info.k0                 = k0;
        rhs_info.h0                 = h0;
        rhs_info.interleave         = interleave_rhs;
        rhs_info.transpose          = transpose_rhs;
        rhs_info.export_to_cl_image = export_to_cl_image;

        // In case of GEMM3D, m is the product of m_w and m_h
        const unsigned int m = m_w * m_h;
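        // For example, with m_w = 7, m_h = 4, n = 16, k = 32 and batch_size = 2, the
        // LHS is created as a flat (k, m) = (32, 28) matrix per batch and the GEMM
        // output is later reinterpreted as (n, m_w, m_h, batch) = (16, 7, 4, 2),
        // matching the dst_shape computed in compute_reference() below.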

        // Set the tensor shapes for LHS and RHS matrices
        const TensorShape lhs_shape(k, m, batch_size);
        const TensorShape rhs_shape(n, k, batch_size);
        const TensorShape bias_shape(n, 1, 1);

        _target = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, m_h, act_info, has_pad_y);
        if(validate_result)
        {
            _reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, m_h, act_info);
        }
    }

protected:
    template <typename U>
    void fill(U &&tensor, int i)
    {
        std::uniform_real_distribution<> distribution(-1.0f, 1.0f);
        library->fill(tensor, distribution, i);
    }

    TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,
                              DataType data_type, float alpha, float beta,
                              unsigned int m_h, const ActivationLayerInfo &act_info, bool has_pad_y)
    {
        // Create tensors
        TensorType lhs  = create_tensor<TensorType>(lhs_shape, data_type, 1);
        TensorType rhs  = create_tensor<TensorType>(rhs_shape, data_type, 1);
        TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);
        TensorType rhs_reshaped;
        TensorType dst;

        const unsigned int M = lhs_shape[1];
        const unsigned int N = rhs_shape[0];
        const unsigned int K = lhs_shape[0];
        GEMMKernelInfo     kernel_info;
        kernel_info.m                       = M;
        kernel_info.n                       = N;
        kernel_info.k                       = K;
        kernel_info.depth_output_gemm3d     = m_h;
        kernel_info.reinterpret_input_as_3d = false;
        kernel_info.broadcast_bias          = true;
        kernel_info.activation_info         = act_info;
        kernel_info.has_pad_y               = has_pad_y;

        // The output tensor will be auto-initialized within the function

        // Create and configure function
        ReshapeRHSFunctionType reshape_rhs;
        GEMMFunctionType       gemm;

        validate_result = bool(reshape_rhs.validate(rhs.info(), rhs_reshaped.info(), rhs_info));
        validate_result = validate_result || !rhs_info.export_to_cl_image;
        if(!validate_result)
        {
            return nullptr;
        }
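        // A validation failure is tolerated only when export_to_cl_image was requested,
        // e.g. when the device or driver cannot import the buffer as an OpenCL image:
        // validate_result stays false and setup() skips the reference computation
        // instead of failing the test.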

        reshape_rhs.configure(&rhs, &rhs_reshaped, rhs_info);
        gemm.configure(&lhs, &rhs_reshaped, &bias, &dst, alpha, beta, lhs_info, rhs_info, kernel_info);

        if(has_pad_y)
        {
            // Add dummy padding into lhs to validate has_pad_y path
            lhs.info()->extend_padding(PaddingSize(2, 0, 2, 0));
            dst.info()->extend_padding(PaddingSize(2, 0, 1, 0));
        }
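        // extend_padding() only grows the tensors' padded regions before allocation;
        // the logical shapes are unchanged, so the padded run must still produce the
        // same result as the unpadded reference.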

        ARM_COMPUTE_EXPECT(lhs.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(rhs.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(bias.info()->is_resizable(), framework::LogLevel::ERRORS);

        // Allocate tensors
        lhs.allocator()->allocate();
        rhs.allocator()->allocate();
        rhs_reshaped.allocator()->allocate();
        bias.allocator()->allocate();
        dst.allocator()->allocate();

        ARM_COMPUTE_EXPECT(!lhs.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!rhs.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!rhs_reshaped.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!bias.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!dst.info()->is_resizable(), framework::LogLevel::ERRORS);

        // Fill tensors
        fill(AccessorType(lhs), 0);
        fill(AccessorType(rhs), 1);
        fill(AccessorType(bias), 2);

        // Compute GEMM
        reshape_rhs.run();
        gemm.run();

        return dst;
    }

    SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, unsigned int m_h,
                                      const ActivationLayerInfo &act_info)
    {
        TensorShape dst_shape = lhs_shape;
        dst_shape.set(0, rhs_shape[0]);
        dst_shape.set(1, lhs_shape[1] / m_h);
        dst_shape.set(2, m_h);
        dst_shape.set(3, lhs_shape[2]);

        // Create reference
        SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };
        SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };
        SimpleTensor<T> bias{ dst_shape, data_type, 1 };

        const int n          = rhs_shape[0];
        const int m          = lhs_shape[1];
        const int batch_size = lhs_shape[2];

        // Fill reference
        fill(lhs, 0);
        fill(rhs, 1);
        fill(bias, 2);

1299 // In case of broadcast, we need simply copy the first into the following "M" ones
1300 for(int i = 1; i < m * batch_size; i++)
1301 {
1302 memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));
1303 }

        return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);
    }

    bool            validate_result = true;
    TensorType      _target{};
    SimpleTensor<T> _reference{};
};

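// Fixture for the native (non-reshaped) GEMM kernels: neither LHS nor RHS is
// rearranged before the multiplication, and the bias is either a full
// (n, m, batch_size) tensor or a single row broadcast across every output row.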
template <typename TensorType, typename AccessorType, typename T, typename GEMMFunctionType>
class GEMMMatrixMultiplyNativeValidationFixture : public framework::Fixture
{
public:
    template <typename...>
    void setup(unsigned int m, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0, DataType data_type, float alpha, float beta, bool broadcast_bias,
               const ActivationLayerInfo &act_info)
    {
        GEMMLHSMatrixInfo lhs_info;
        lhs_info.m0 = m0;
        lhs_info.k0 = k0;

        GEMMRHSMatrixInfo rhs_info;
        rhs_info.n0 = n0;
        rhs_info.k0 = k0;

        // Set the tensor shapes for LHS and RHS matrices
        const TensorShape lhs_shape(k, m, batch_size);
        const TensorShape rhs_shape(n, k, batch_size);
        const TensorShape bias_shape(n,
                                     broadcast_bias ? 1 : m,
                                     broadcast_bias ? 1 : batch_size);
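        // With broadcast_bias the bias collapses to a single row of n values that is
        // added to every row of every batch; otherwise each output row gets its own
        // bias entry.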

        _target    = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, broadcast_bias, act_info);
        _reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, broadcast_bias, act_info);
    }

protected:
    template <typename U>
    void fill(U &&tensor, int i)
    {
        std::uniform_real_distribution<> distribution(-1.0f, 1.0f);
        library->fill(tensor, distribution, i);

        // Fill border with infinity in order to check the presence of NaN values (i.e. inf * 0)
        std::uniform_real_distribution<> distribution_inf(std::numeric_limits<float>::infinity(), std::numeric_limits<float>::infinity());
        library->fill_borders_with_garbage(tensor, distribution_inf, i);
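        // If the kernel wrongly reads any of those border elements, inf * 0 = NaN
        // (IEEE 754) propagates into the output and the comparison against the
        // reference fails.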
    }

    TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,
                              DataType data_type, float alpha, float beta, bool broadcast_bias, const ActivationLayerInfo &act_info)
    {
        // Create tensors
        TensorType lhs  = create_tensor<TensorType>(lhs_shape, data_type, 1);
        TensorType rhs  = create_tensor<TensorType>(rhs_shape, data_type, 1);
        TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);
        TensorType dst;

        const unsigned int M = lhs_shape[1];
        const unsigned int N = rhs_shape[0];
        const unsigned int K = lhs_shape[0];
        GEMMKernelInfo     kernel_info;
        kernel_info.m                       = M;
        kernel_info.n                       = N;
        kernel_info.k                       = K;
        kernel_info.depth_output_gemm3d     = 0;
        kernel_info.reinterpret_input_as_3d = false;
        kernel_info.broadcast_bias          = broadcast_bias;
        kernel_info.activation_info         = act_info;
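        // depth_output_gemm3d = 0 keeps the output 2D here; the 3D fixtures instead
        // set it to m_h so the kernel re-splits the output height.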

        // Create and configure function
        GEMMFunctionType gemm;
        gemm.configure(&lhs, &rhs, &bias, &dst, alpha, beta, lhs_info, rhs_info, kernel_info);

        ARM_COMPUTE_EXPECT(lhs.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(rhs.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(bias.info()->is_resizable(), framework::LogLevel::ERRORS);

        // Allocate tensors
        lhs.allocator()->allocate();
        rhs.allocator()->allocate();
        bias.allocator()->allocate();
        dst.allocator()->allocate();

        ARM_COMPUTE_EXPECT(!lhs.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!rhs.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!bias.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!dst.info()->is_resizable(), framework::LogLevel::ERRORS);

        // Fill tensors
        fill(AccessorType(lhs), 0);
        fill(AccessorType(rhs), 1);
        fill(AccessorType(bias), 2);

        // Compute GEMM
        gemm.run();

        return dst;
    }

    SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, bool broadcast_bias,
                                      const ActivationLayerInfo &act_info)
    {
        TensorShape dst_shape = lhs_shape;
        dst_shape[0]          = rhs_shape[0];
        dst_shape[1]          = lhs_shape[1];

        // Create reference
        SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };
        SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };
        SimpleTensor<T> bias{ dst_shape, data_type, 1 };

        const int n          = rhs_shape[0];
        const int m          = lhs_shape[1];
        const int batch_size = lhs_shape[2];

        // Fill reference
        fill(lhs, 0);
        fill(rhs, 1);
        fill(bias, 2);

        if(broadcast_bias)
        {
            // In case of broadcast, we simply need to copy the first row into the following m * batch_size - 1 rows
            for(int i = 1; i < m * batch_size; i++)
            {
                memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));
            }
        }

        return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);
    }

    TensorType      _target{};
    SimpleTensor<T> _reference{};
};

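// 3D variant of the native GEMM fixture: the LHS height is flattened to
// m = m_w * m_h on input and the output is reinterpreted as
// (n, m_w, m_h, batch_size), always with a broadcast bias row.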
template <typename TensorType, typename AccessorType, typename T, typename GEMMFunctionType>
class GEMMMatrixMultiplyNative3DValidationFixture : public framework::Fixture
{
public:
    template <typename...>
    void setup(unsigned int m_w, unsigned int m_h, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0, DataType data_type, float alpha, float beta,
               const ActivationLayerInfo &act_info)
    {
        GEMMLHSMatrixInfo lhs_info;
        lhs_info.m0 = m0;
        lhs_info.k0 = k0;

        GEMMRHSMatrixInfo rhs_info;
        rhs_info.n0 = n0;
        rhs_info.k0 = k0;

        // In case of GEMM3D, m is the product of m_w and m_h
        const unsigned int m = m_w * m_h;

        // Set the tensor shapes for LHS and RHS matrices
        const TensorShape lhs_shape(k, m, batch_size);
        const TensorShape rhs_shape(n, k, batch_size);
        const TensorShape bias_shape(n, 1, 1);

        _target    = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, m_h, act_info);
        _reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, m_h, act_info);
    }

protected:
    template <typename U>
    void fill(U &&tensor, int i)
    {
        std::uniform_real_distribution<> distribution(-1.0f, 1.0f);
        library->fill(tensor, distribution, i);
    }

    TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,
                              DataType data_type, float alpha, float beta, unsigned int m_h, const ActivationLayerInfo &act_info)
    {
        // Create tensors
        TensorType lhs  = create_tensor<TensorType>(lhs_shape, data_type, 1);
        TensorType rhs  = create_tensor<TensorType>(rhs_shape, data_type, 1);
        TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);
        TensorType dst;

        const unsigned int M = lhs_shape[1];
        const unsigned int N = rhs_shape[0];
        const unsigned int K = lhs_shape[0];
        GEMMKernelInfo     kernel_info;
        kernel_info.m                       = M;
        kernel_info.n                       = N;
        kernel_info.k                       = K;
        kernel_info.depth_output_gemm3d     = m_h;
        kernel_info.reinterpret_input_as_3d = false;
        kernel_info.broadcast_bias          = true;
        kernel_info.activation_info         = act_info;

        // The output tensor will be auto-initialized within the function

        // Create and configure function
        GEMMFunctionType gemm;
        gemm.configure(&lhs, &rhs, &bias, &dst, alpha, beta, lhs_info, rhs_info, kernel_info);

        ARM_COMPUTE_EXPECT(lhs.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(rhs.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(bias.info()->is_resizable(), framework::LogLevel::ERRORS);

        // Allocate tensors
        lhs.allocator()->allocate();
        rhs.allocator()->allocate();
        bias.allocator()->allocate();
        dst.allocator()->allocate();

        ARM_COMPUTE_EXPECT(!lhs.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!rhs.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!bias.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!dst.info()->is_resizable(), framework::LogLevel::ERRORS);

        // Fill tensors
        fill(AccessorType(lhs), 0);
        fill(AccessorType(rhs), 1);
        fill(AccessorType(bias), 2);

        // Compute GEMM
        gemm.run();

        return dst;
    }

    SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, unsigned int m_h,
                                      const ActivationLayerInfo &act_info)
    {
        TensorShape dst_shape = lhs_shape;
        dst_shape.set(0, rhs_shape[0]);
        dst_shape.set(1, lhs_shape[1] / m_h);
        dst_shape.set(2, m_h);
        dst_shape.set(3, lhs_shape[2]);

        // Create reference
        SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };
        SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };
        SimpleTensor<T> bias{ dst_shape, data_type, 1 };

        const int n          = rhs_shape[0];
        const int m          = lhs_shape[1];
        const int batch_size = lhs_shape[2];

        // Fill reference
        fill(lhs, 0);
        fill(rhs, 1);
        fill(bias, 2);

        // The 3D output always uses broadcast bias, so we simply copy the first row into the following m * batch_size - 1 rows
        for(int i = 1; i < m * batch_size; i++)
        {
            memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));
        }

        return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);
    }

    TensorType      _target{};
    SimpleTensor<T> _reference{};
};

} // namespace validation
} // namespace test
} // namespace arm_compute
#endif /* ARM_COMPUTE_TEST_GEMM_FIXTURE */