/*
 * Copyright (c) 2017-2019 ARM Limited.
 *
 * SPDX-License-Identifier: MIT
 *
 * Permission is hereby granted, free of charge, to any person obtaining a copy
 * of this software and associated documentation files (the "Software"), to
 * deal in the Software without restriction, including without limitation the
 * rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
 * sell copies of the Software, and to permit persons to whom the Software is
 * furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in all
 * copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
 * SOFTWARE.
 */
#ifndef ARM_COMPUTE_TEST_GEMM_FIXTURE
#define ARM_COMPUTE_TEST_GEMM_FIXTURE

#include "arm_compute/core/KernelDescriptors.h"
#include "arm_compute/core/TensorShape.h"
#include "arm_compute/core/Types.h"
#include "tests/AssetsLibrary.h"
#include "tests/Globals.h"
#include "tests/IAccessor.h"
#include "tests/framework/Asserts.h"
#include "tests/framework/Fixture.h"
#include "tests/validation/Helpers.h"
#include "tests/validation/reference/ActivationLayer.h"
#include "tests/validation/reference/GEMM.h"

#include <random>

namespace arm_compute
{
namespace test
{
namespace validation
{
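// The fixtures in this header run a device-side GEMM function and validate it against the scalar
// reference implementation, i.e. dst = act(alpha * LHS * RHS + beta * bias).
// A minimal usage sketch (illustrative only; the concrete TensorType/AccessorType/FunctionType
// combinations are supplied by the CL/NEON test suites):
//
//   using CLGEMMFloatFixture = GEMMValidationFixture<CLTensor, CLAccessor, CLGEMM, float>;
//   FIXTURE_DATA_TEST_CASE(RunSmall, CLGEMMFloatFixture, framework::DatasetMode::ALL, ...)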
template <typename TensorType, typename AccessorType, typename FunctionType, typename T, bool disable_c = false, bool reinterpret_input_as_3d = false, bool reinterpret_output_as_3d = false>
class GEMMValidationFixture : public framework::Fixture
{
public:
    template <typename...>
    void setup(TensorShape shape_a, TensorShape shape_b, TensorShape shape_c, TensorShape output_shape, float alpha, float beta, bool pretranspose, DataType data_type)
    {
        _target    = compute_target(shape_a, shape_b, shape_c, output_shape, alpha, beta, pretranspose, data_type);
        _reference = compute_reference(shape_a, shape_b, shape_c, output_shape, alpha, beta, data_type);
    }

protected:
    template <typename U>
    void fill(U &&tensor, int i, float lo = -1.f, float hi = 1.f)
    {
        switch(tensor.data_type())
        {
            case DataType::F16:
            case DataType::F32:
            {
                std::uniform_real_distribution<> distribution(lo, hi);
                library->fill(tensor, distribution, i);
                break;
            }
            default:
                library->fill_tensor_uniform(tensor, i);
        }
    }

    TensorType compute_target(const TensorShape &shape_a, const TensorShape &shape_b, const TensorShape &shape_c, const TensorShape &output_shape, float alpha, float beta,
                              bool pretranspose, DataType data_type)
    {
        // Create tensors
        TensorType a   = create_tensor<TensorType>(shape_a, data_type, 1);
        TensorType b   = create_tensor<TensorType>(shape_b, data_type, 1);
        TensorType c   = create_tensor<TensorType>(shape_c, data_type, 1);
        TensorType dst = create_tensor<TensorType>(output_shape, data_type, 1);

        // Create and configure function
        FunctionType gemm;
        // The GEMMInfo includes the depth of the output in case it has to be reinterpreted as 3D.
        // If the output shape has the same number of dimensions as the input, the method called is a 2D matrix multiplication (depth_output_reinterpreted_as_3D = 0);
        // otherwise we have to use the reinterpreted version of GEMM (depth_output_reinterpreted_as_3D = depth of the 3D output).
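        // The positional GEMMInfo arguments below are assumed to map to: (is_a_reshaped, is_b_reshaped,
        // reshape_b_only_on_first_run, depth_output_gemm3d, reinterpret_input_as_3d, retain_internal_weights,
        // gemmlowp_output_stage, fp_mixed_precision, broadcast_bias) - see GEMMInfo in arm_compute/core/Types.h.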
        gemm.configure(&a,
                       &b,
                       (disable_c) ? nullptr : &c,
                       &dst,
                       alpha, beta,
                       GEMMInfo(false, false, false, (reinterpret_output_as_3d ? output_shape[2] : 0), reinterpret_input_as_3d, false, GEMMLowpOutputStageInfo(), false, (reinterpret_input_as_3d
                                                     || reinterpret_output_as_3d)));
        ARM_COMPUTE_EXPECT(a.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(b.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(c.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(dst.info()->is_resizable(), framework::LogLevel::ERRORS);

        // Allocate tensors
        a.allocator()->allocate();
        b.allocator()->allocate();
        c.allocator()->allocate();
        dst.allocator()->allocate();

        ARM_COMPUTE_EXPECT(!a.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!b.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!c.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!dst.info()->is_resizable(), framework::LogLevel::ERRORS);

        // Fill tensors
        fill(AccessorType(a), 0);
        fill(AccessorType(b), 1);
        if(!disable_c)
        {
            fill(AccessorType(c), 2);
        }

        // Compute GEMM function
        gemm.run();

        return dst;
    }

    SimpleTensor<T> compute_reference(const TensorShape &shape_a, const TensorShape &shape_b, const TensorShape &shape_c, const TensorShape &output_shape, float alpha, float beta,
                                      DataType data_type)
    {
        TensorShape shape_a_to_use = shape_a;

        if(reinterpret_input_as_3d)
        {
            // Collapse the second and third dimension if the input is 3D
            shape_a_to_use.collapse(2U, 1U);
        }

        // Create reference
        SimpleTensor<T> a{ shape_a_to_use, data_type, 1 };
        SimpleTensor<T> b{ shape_b, data_type, 1 };
        SimpleTensor<T> c{ output_shape, data_type, 1 };

        // Fill reference
        fill(a, 0);
        fill(b, 1);
        fill(c, 2);

        if(reinterpret_input_as_3d || reinterpret_output_as_3d)
        {
            const int n          = shape_b[0];
            const int m          = reinterpret_output_as_3d ? output_shape[1] * output_shape[2] : output_shape[1];
            const int batch_size = reinterpret_output_as_3d ? output_shape[3] : output_shape[2];

            // In case of broadcast, we simply need to copy the first row into the following "M" ones
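            // (row 0 of C is replicated across all m * batch_size rows, emulating the bias broadcast
            //  performed by the target function, since the reference implementation takes a full C tensor)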
            for(int i = 1; i < m * batch_size; i++)
            {
                memcpy(c.data() + i * n, c.data(), n * sizeof(T));
            }
        }

        // Setting beta to 0 will effectively disable C for the
        // computation of the reference: alpha * A * B + 0 * C
        return reference::gemm<T>(a, b, c, alpha, disable_c ? 0.f : beta);
    }

    TensorType      _target{};
    SimpleTensor<T> _reference{};
};

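// Fixture for the matrix-multiply functions that consume the LHS/RHS matrices as-is (no reshape):
// LHS is (K x M x batches), RHS is (N x K x batches) and the bias is optionally a single broadcast row.
// The target result is validated against reference::gemm followed by reference::activation_layer.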
template <typename TensorType, typename AccessorType, typename T, typename GEMMFunctionType>
class GEMMMatrixMultiplyValidationFixture : public framework::Fixture
{
public:
    template <typename...>
    void setup(unsigned int m, unsigned int n, unsigned int k, unsigned int batch_size, float alpha, float beta, bool broadcast_bias, bool fp16_mixed_precision, const ActivationLayerInfo &act_info,
               DataType data_type, GPUTarget gpu_arch)
    {
        // Set the tensor shapes for LHS and RHS matrices
        const TensorShape lhs_shape(k, m, batch_size);
        const TensorShape rhs_shape(n, k, batch_size);
        const TensorShape bias_shape(n,
                                     broadcast_bias ? 1 : m,
                                     broadcast_bias ? 1 : batch_size);

        _target    = compute_target(lhs_shape, rhs_shape, bias_shape, data_type, alpha, beta, broadcast_bias, fp16_mixed_precision, act_info, gpu_arch);
        _reference = compute_reference(lhs_shape, rhs_shape, bias_shape, data_type, alpha, beta, broadcast_bias, act_info);
    }

protected:
    template <typename U>
    void fill(U &&tensor, int i)
    {
        std::uniform_real_distribution<> distribution(-1.0f, 1.0f);
        library->fill(tensor, distribution, i);

        // Fill the tensor border with infinity in order to check for the presence of NaN values (i.e. inf * 0)
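        // (if a kernel erroneously reads the border, the infinities propagate as inf/NaN into the
        //  destination and the validation step flags them)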
        std::uniform_real_distribution<> distribution_inf(std::numeric_limits<float>::infinity(), std::numeric_limits<float>::infinity());
        library->fill_borders_with_garbage(tensor, distribution_inf, i);
    }

    TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, DataType data_type, float alpha, float beta, bool broadcast_bias,
                              bool fp16_mixed_precision, const ActivationLayerInfo &act_info, GPUTarget gpu_arch)
    {
        // Create tensors
        TensorType lhs  = create_tensor<TensorType>(lhs_shape, data_type, 1);
        TensorType rhs  = create_tensor<TensorType>(rhs_shape, data_type, 1);
        TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);
        TensorType dst;

        const unsigned int m = lhs_shape[1];
        const unsigned int n = rhs_shape[0];
        const unsigned int k = lhs_shape[0];
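        // GEMMReshapeInfo positional arguments, as assumed here: (m, n, k, mult_transpose1xW_width,
        // mult_interleave4x4_height, depth_output_gemm3d, reinterpret_input_as_3d, broadcast_bias)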
        GEMMReshapeInfo reshape_info(m, n, k, 1, 1, 0, false, broadcast_bias);

        // The output tensor will be auto-initialized within the function

        // Create and configure function
        GEMMFunctionType gemm;
        gemm.configure(gpu_arch, &lhs, &rhs, &bias, &dst, alpha, beta, false, reshape_info, fp16_mixed_precision, act_info);

        ARM_COMPUTE_EXPECT(lhs.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(rhs.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(bias.info()->is_resizable(), framework::LogLevel::ERRORS);

        // Allocate tensors
        lhs.allocator()->allocate();
        rhs.allocator()->allocate();
        bias.allocator()->allocate();
        dst.allocator()->allocate();

        ARM_COMPUTE_EXPECT(!lhs.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!rhs.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!bias.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!dst.info()->is_resizable(), framework::LogLevel::ERRORS);

        // Fill tensors
        fill(AccessorType(lhs), 0);
        fill(AccessorType(rhs), 1);
        fill(AccessorType(bias), 2);

        // Compute GEMM
        gemm.run();

        return dst;
    }

    SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, DataType data_type, float alpha, float beta, bool broadcast_bias,
                                      const ActivationLayerInfo &act_info)
    {
        TensorShape dst_shape = lhs_shape;
        dst_shape[0]          = rhs_shape[0];
        dst_shape[1]          = lhs_shape[1];

        // Create reference
        SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };
        SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };
        SimpleTensor<T> bias{ dst_shape, data_type, 1 };

        const int n          = rhs_shape[0];
        const int m          = lhs_shape[1];
        const int batch_size = lhs_shape[2];

        // Fill reference
        fill(lhs, 0);
        fill(rhs, 1);
        fill(bias, 2);

        if(broadcast_bias)
        {
            // In case of broadcast, we simply need to copy the first row into the following "M" ones
            for(int i = 1; i < m * batch_size; i++)
            {
                memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));
            }
        }

        return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);
    }

    TensorType      _target{};
    SimpleTensor<T> _reference{};
};

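// 3D-output variant of the fixture above: m is split into m_w x m_h (GEMM3D) and the
// (n, 1, 1) bias row is always broadcast across the output.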
template <typename TensorType, typename AccessorType, typename T, typename GEMMFunctionType>
class GEMMMatrixMultiply3DValidationFixture : public framework::Fixture
{
public:
    template <typename...>
    void setup(unsigned int m_w, unsigned int m_h, unsigned int n, unsigned int k, unsigned int batch_size, float alpha, float beta, bool broadcast_bias, bool fp16_mixed_precision,
               const ActivationLayerInfo &act_info, DataType data_type, GPUTarget gpu_arch)
    {
        // In case of GEMM3D, m is the product between m_w and m_h
        const unsigned int m = m_w * m_h;

        // Set the tensor shapes for LHS and RHS matrices
        const TensorShape lhs_shape(k, m, batch_size);
        const TensorShape rhs_shape(n, k, batch_size);
        const TensorShape bias_shape(n, 1, 1);

        _target    = compute_target(lhs_shape, rhs_shape, bias_shape, data_type, alpha, beta, m_h, fp16_mixed_precision, act_info, gpu_arch);
        _reference = compute_reference(lhs_shape, rhs_shape, bias_shape, data_type, alpha, beta, m_h, act_info);
    }

protected:
    template <typename U>
    void fill(U &&tensor, int i)
    {
        std::uniform_real_distribution<> distribution(-1.0f, 1.0f);
        library->fill(tensor, distribution, i);
    }

    TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, DataType data_type, float alpha, float beta, unsigned int m_h,
                              bool fp16_mixed_precision, const ActivationLayerInfo &act_info, GPUTarget gpu_arch)
    {
        // Create tensors
        TensorType lhs  = create_tensor<TensorType>(lhs_shape, data_type, 1);
        TensorType rhs  = create_tensor<TensorType>(rhs_shape, data_type, 1);
        TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);
        TensorType dst;

        const unsigned int m = lhs_shape[1];
        const unsigned int n = rhs_shape[0];
        const unsigned int k = lhs_shape[0];
        GEMMReshapeInfo reshape_info(m, n, k, 1, 1, m_h, false, true);

        // The output tensor will be auto-initialized within the function

        // Create and configure function
        GEMMFunctionType gemm;
        gemm.configure(gpu_arch, &lhs, &rhs, &bias, &dst, alpha, beta, false, reshape_info, fp16_mixed_precision, act_info);

        ARM_COMPUTE_EXPECT(lhs.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(rhs.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(bias.info()->is_resizable(), framework::LogLevel::ERRORS);

        // Allocate tensors
        lhs.allocator()->allocate();
        rhs.allocator()->allocate();
        bias.allocator()->allocate();
        dst.allocator()->allocate();

        ARM_COMPUTE_EXPECT(!lhs.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!rhs.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!bias.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!dst.info()->is_resizable(), framework::LogLevel::ERRORS);

        // Fill tensors
        fill(AccessorType(lhs), 0);
        fill(AccessorType(rhs), 1);
        fill(AccessorType(bias), 2);

        // Compute GEMM
        gemm.run();

        return dst;
    }

    SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, DataType data_type, float alpha, float beta, unsigned int m_h,
                                      const ActivationLayerInfo &act_info)
    {
        TensorShape dst_shape = lhs_shape;
        dst_shape.set(0, rhs_shape[0]);
        dst_shape.set(1, lhs_shape[1] / m_h);
        dst_shape.set(2, m_h);
        dst_shape.set(3, lhs_shape[2]);

        // Create reference
        SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };
        SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };
        SimpleTensor<T> bias{ dst_shape, data_type, 1 };

        const int n          = rhs_shape[0];
        const int m          = lhs_shape[1];
        const int batch_size = lhs_shape[2];

        // Fill reference
        fill(lhs, 0);
        fill(rhs, 1);
        fill(bias, 2);

        // In case of broadcast, we simply need to copy the first row into the following "M" ones
        for(int i = 1; i < m * batch_size; i++)
        {
            memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));
        }

        return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);
    }

    TensorType      _target{};
    SimpleTensor<T> _reference{};
};

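// Fixture for the interleaved/transposed path: the LHS is interleaved and the RHS transposed by
// the Reshape*FunctionType kernels before the matrix multiplication runs on the reshaped inputs.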
template <typename TensorType, typename AccessorType, typename T, typename ReshapeLHSFunctionType, typename ReshapeRHSFunctionType, typename GEMMFunctionType>
class GEMMMatrixMultiplyInterleavedTransposedValidationFixture : public framework::Fixture
{
public:
    template <typename...>
    void setup(unsigned int m, unsigned int n, unsigned int k, unsigned int batch_size, float alpha, float beta, unsigned int v0, unsigned int h0, bool broadcast_bias, bool fp16_mixed_precision,
               const ActivationLayerInfo &act_info, DataType data_type, GPUTarget gpu_arch)
    {
        GEMMLHSMatrixInfo lhs_info;
        lhs_info.m0         = 4;
        lhs_info.k0         = 4;
        lhs_info.v0         = v0;
        lhs_info.interleave = true;
        lhs_info.transpose  = true;

        GEMMRHSMatrixInfo rhs_info;
        rhs_info.n0         = 16 / sizeof(T);
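        // 16 / sizeof(T) keeps each transposed RHS block 16 bytes wide, e.g. n0 = 4 for FP32 and n0 = 8 for FP16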
        rhs_info.k0         = 1;
        rhs_info.h0         = h0;
        rhs_info.interleave = false;
        rhs_info.transpose  = false;

        // Set the tensor shapes for LHS and RHS matrices
        const TensorShape lhs_shape(k, m, batch_size);
        const TensorShape rhs_shape(n, k, batch_size);
        const TensorShape bias_shape(n,
                                     broadcast_bias ? 1 : m,
                                     broadcast_bias ? 1 : batch_size);

        _target    = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, broadcast_bias, fp16_mixed_precision, act_info, gpu_arch);
        _reference = compute_reference(lhs_shape, rhs_shape, bias_shape, data_type, alpha, beta, broadcast_bias, act_info);
    }

protected:
    template <typename U>
    void fill(U &&tensor, int i)
    {
        std::uniform_real_distribution<> distribution(-1.0f, 1.0f);
        library->fill(tensor, distribution, i);

        // Fill the tensor border with infinity in order to check for the presence of NaN values (i.e. inf * 0)
        std::uniform_real_distribution<> distribution_inf(std::numeric_limits<float>::infinity(), std::numeric_limits<float>::infinity());
        library->fill_borders_with_garbage(tensor, distribution_inf, i);
    }

    TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,
                              DataType data_type, float alpha, float beta, bool broadcast_bias, bool fp16_mixed_precision, const ActivationLayerInfo &act_info, GPUTarget gpu_arch)
    {
        // Create tensors
        TensorType lhs  = create_tensor<TensorType>(lhs_shape, data_type, 1);
        TensorType rhs  = create_tensor<TensorType>(rhs_shape, data_type, 1);
        TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);
        TensorType lhs_reshaped;
        TensorType rhs_reshaped;
        TensorType dst;

        const unsigned int m = lhs_shape[1];
        const unsigned int n = rhs_shape[0];
        const unsigned int k = lhs_shape[0];
        GEMMReshapeInfo reshape_info(m, n, k, rhs_info.h0, lhs_info.v0, 0, false, broadcast_bias);

        // The output tensor will be auto-initialized within the function

        // Create and configure function
        ReshapeLHSFunctionType reshape_lhs;
        ReshapeRHSFunctionType reshape_rhs;
        GEMMFunctionType       gemm;
        reshape_lhs.configure(&lhs, &lhs_reshaped, lhs_info);
        reshape_rhs.configure(&rhs, &rhs_reshaped, rhs_info);
        gemm.configure(gpu_arch, &lhs_reshaped, &rhs_reshaped, &bias, &dst, alpha, beta, true, reshape_info, fp16_mixed_precision, act_info);

        ARM_COMPUTE_EXPECT(lhs.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(rhs.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(bias.info()->is_resizable(), framework::LogLevel::ERRORS);

        // Allocate tensors
        lhs.allocator()->allocate();
        rhs.allocator()->allocate();
        lhs_reshaped.allocator()->allocate();
        rhs_reshaped.allocator()->allocate();
        bias.allocator()->allocate();
        dst.allocator()->allocate();

        ARM_COMPUTE_EXPECT(!lhs.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!rhs.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!bias.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!lhs_reshaped.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!rhs_reshaped.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!dst.info()->is_resizable(), framework::LogLevel::ERRORS);

        // Fill tensors
        fill(AccessorType(lhs), 0);
        fill(AccessorType(rhs), 1);
        fill(AccessorType(bias), 2);

        // Compute GEMM
        reshape_lhs.run();
        reshape_rhs.run();
        gemm.run();

        return dst;
    }

    SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, DataType data_type, float alpha, float beta, bool broadcast_bias,
                                      const ActivationLayerInfo &act_info)
    {
        TensorShape dst_shape = lhs_shape;
        dst_shape[0]          = rhs_shape[0];
        dst_shape[1]          = lhs_shape[1];

        // Create reference
        SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };
        SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };
        SimpleTensor<T> bias{ dst_shape, data_type, 1 };

        const int n          = rhs_shape[0];
        const int m          = lhs_shape[1];
        const int batch_size = lhs_shape[2];

        // Fill reference
        fill(lhs, 0);
        fill(rhs, 1);
        fill(bias, 2);

        if(broadcast_bias)
        {
            // In case of broadcast, we simply need to copy the first row into the following "M" ones
            for(int i = 1; i < m * batch_size; i++)
            {
                memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));
            }
        }

        return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);
    }

    TensorType      _target{};
    SimpleTensor<T> _reference{};
};

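// 3D-output (GEMM3D) variant of the interleaved/transposed fixture above, with broadcast bias.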
template <typename TensorType, typename AccessorType, typename T, typename ReshapeLHSFunctionType, typename ReshapeRHSFunctionType, typename GEMMFunctionType>
class GEMMMatrixMultiplyInterleavedTransposed3DValidationFixture : public framework::Fixture
{
public:
    template <typename...>
    void setup(unsigned int m_w, unsigned int m_h, unsigned int n, unsigned int k, unsigned int batch_size, float alpha, float beta, unsigned int v0, unsigned int h0, bool broadcast_bias,
               bool fp16_mixed_precision, const ActivationLayerInfo &act_info, DataType data_type, GPUTarget gpu_arch)
    {
        GEMMLHSMatrixInfo lhs_info;
        lhs_info.m0         = 4;
        lhs_info.k0         = 4;
        lhs_info.v0         = v0;
        lhs_info.interleave = true;
        lhs_info.transpose  = true;

        GEMMRHSMatrixInfo rhs_info;
        rhs_info.n0         = 16 / sizeof(T);
        rhs_info.k0         = 1;
        rhs_info.h0         = h0;
        rhs_info.interleave = false;
        rhs_info.transpose  = false;

        // In case of GEMM3D, m is the product between m_w and m_h
        const unsigned int m = m_w * m_h;

        // Set the tensor shapes for LHS and RHS matrices
        const TensorShape lhs_shape(k, m, batch_size);
        const TensorShape rhs_shape(n, k, batch_size);
        const TensorShape bias_shape(n, 1, 1);

        _target    = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, m_h, fp16_mixed_precision, act_info, gpu_arch);
        _reference = compute_reference(lhs_shape, rhs_shape, bias_shape, data_type, alpha, beta, m_h, act_info);
    }

protected:
    template <typename U>
    void fill(U &&tensor, int i)
    {
        std::uniform_real_distribution<> distribution(-1.0f, 1.0f);
        library->fill(tensor, distribution, i);
    }

    TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,
                              DataType data_type, float alpha, float beta, unsigned int m_h, bool fp16_mixed_precision, const ActivationLayerInfo &act_info, GPUTarget gpu_arch)
    {
        // Create tensors
        TensorType lhs  = create_tensor<TensorType>(lhs_shape, data_type, 1);
        TensorType rhs  = create_tensor<TensorType>(rhs_shape, data_type, 1);
        TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);
        TensorType lhs_reshaped;
        TensorType rhs_reshaped;
        TensorType dst;

        const unsigned int m = lhs_shape[1];
        const unsigned int n = rhs_shape[0];
        const unsigned int k = lhs_shape[0];
        GEMMReshapeInfo reshape_info(m, n, k, rhs_info.h0, lhs_info.v0, m_h, false, true);

        // The output tensor will be auto-initialized within the function

        // Create and configure function
        ReshapeLHSFunctionType reshape_lhs;
        ReshapeRHSFunctionType reshape_rhs;
        GEMMFunctionType       gemm;
        reshape_lhs.configure(&lhs, &lhs_reshaped, lhs_info);
        reshape_rhs.configure(&rhs, &rhs_reshaped, rhs_info);
        gemm.configure(gpu_arch, &lhs_reshaped, &rhs_reshaped, &bias, &dst, alpha, beta, true, reshape_info, fp16_mixed_precision, act_info);

        ARM_COMPUTE_EXPECT(lhs.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(rhs.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(bias.info()->is_resizable(), framework::LogLevel::ERRORS);

        // Allocate tensors
        lhs.allocator()->allocate();
        rhs.allocator()->allocate();
        lhs_reshaped.allocator()->allocate();
        rhs_reshaped.allocator()->allocate();
        bias.allocator()->allocate();
        dst.allocator()->allocate();

        ARM_COMPUTE_EXPECT(!lhs.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!rhs.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!lhs_reshaped.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!rhs_reshaped.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!bias.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!dst.info()->is_resizable(), framework::LogLevel::ERRORS);

        // Fill tensors
        fill(AccessorType(lhs), 0);
        fill(AccessorType(rhs), 1);
        fill(AccessorType(bias), 2);

        // Compute GEMM
        reshape_lhs.run();
        reshape_rhs.run();
        gemm.run();

        return dst;
    }

    SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, DataType data_type, float alpha, float beta, unsigned int m_h,
                                      const ActivationLayerInfo &act_info)
    {
        TensorShape dst_shape = lhs_shape;
        dst_shape.set(0, rhs_shape[0]);
        dst_shape.set(1, lhs_shape[1] / m_h);
        dst_shape.set(2, m_h);
        dst_shape.set(3, lhs_shape[2]);

        // Create reference
        SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };
        SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };
        SimpleTensor<T> bias{ dst_shape, data_type, 1 };

        const int n          = rhs_shape[0];
        const int m          = lhs_shape[1];
        const int batch_size = lhs_shape[2];

        // Fill reference
        fill(lhs, 0);
        fill(rhs, 1);
        fill(bias, 2);

        // In case of broadcast, we simply need to copy the first row into the following "M" ones
        for(int i = 1; i < m * batch_size; i++)
        {
            memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));
        }

        return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);
    }

    TensorType      _target{};
    SimpleTensor<T> _reference{};
};

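// Fixture for the "reshaped" GEMM kernels configured through GEMMLHSMatrixInfo/GEMMRHSMatrixInfo
// and GEMMKernelInfo, with configurable block sizes (m0, n0, k0, v0, h0), interleaving and
// transposition. With fp_mixed_precision the reference uses reference::gemm_mixed_precision.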
template <typename TensorType, typename AccessorType, typename T, typename ReshapeLHSFunctionType, typename ReshapeRHSFunctionType, typename GEMMFunctionType, bool fp_mixed_precision = false>
class GEMMMatrixMultiplyReshapedValidationFixture : public framework::Fixture
{
public:
    template <typename...>
    void setup(unsigned int m, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0, unsigned int v0, unsigned int h0, bool interleave_lhs,
               bool interleave_rhs, DataType data_type, float alpha, float beta, bool broadcast_bias, bool lhs_transpose, const ActivationLayerInfo &act_info)
    {
        GEMMLHSMatrixInfo lhs_info;
        lhs_info.m0         = m0;
        lhs_info.k0         = k0;
        lhs_info.v0         = v0;
        lhs_info.interleave = interleave_lhs;
        lhs_info.transpose  = lhs_transpose;

        GEMMRHSMatrixInfo rhs_info;
        rhs_info.n0         = n0;
        rhs_info.k0         = k0;
        rhs_info.h0         = h0;
        rhs_info.interleave = interleave_rhs;
        rhs_info.transpose  = !lhs_transpose;

        // Set the tensor shapes for LHS and RHS matrices
        const TensorShape lhs_shape(k, m, batch_size);
        const TensorShape rhs_shape(n, k, batch_size);
        const TensorShape bias_shape(n,
                                     broadcast_bias ? 1 : m,
                                     broadcast_bias ? 1 : batch_size);

        _target    = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, broadcast_bias, act_info);
        _reference = compute_reference(lhs_shape, rhs_shape, bias_shape, data_type, alpha, beta, broadcast_bias, act_info);
    }

protected:
    template <typename U>
    void fill(U &&tensor, int i)
    {
        std::uniform_real_distribution<> distribution(-1.0f, 1.0f);
        library->fill(tensor, distribution, i);

        // Fill the tensor border with infinity in order to check for the presence of NaN values (i.e. inf * 0)
        std::uniform_real_distribution<> distribution_inf(std::numeric_limits<float>::infinity(), std::numeric_limits<float>::infinity());
        library->fill_borders_with_garbage(tensor, distribution_inf, i);
    }

    TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,
                              DataType data_type, float alpha, float beta, bool broadcast_bias, const ActivationLayerInfo &act_info)
    {
        // Create tensors
        TensorType lhs  = create_tensor<TensorType>(lhs_shape, data_type, 1);
        TensorType rhs  = create_tensor<TensorType>(rhs_shape, data_type, 1);
        TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);
        TensorType lhs_reshaped;
        TensorType rhs_reshaped;
        TensorType dst;

        const unsigned int M = lhs_shape[1];
        const unsigned int N = rhs_shape[0];
        const unsigned int K = lhs_shape[0];
        GEMMKernelInfo     kernel_info;
        kernel_info.m                       = M;
        kernel_info.n                       = N;
        kernel_info.k                       = K;
        kernel_info.depth_output_gemm3d     = 0;
        kernel_info.reinterpret_input_as_3d = false;
        kernel_info.broadcast_bias          = broadcast_bias;
        kernel_info.activation_info         = act_info;
        kernel_info.fp_mixed_precision      = fp_mixed_precision;

        // The output tensor will be auto-initialized within the function

        // Create and configure function
        ReshapeLHSFunctionType reshape_lhs;
        ReshapeRHSFunctionType reshape_rhs;
        GEMMFunctionType       gemm;
        reshape_lhs.configure(&lhs, &lhs_reshaped, lhs_info);
        reshape_rhs.configure(&rhs, &rhs_reshaped, rhs_info);
        gemm.configure(&lhs_reshaped, &rhs_reshaped, &bias, &dst, alpha, beta, lhs_info, rhs_info, kernel_info);

        ARM_COMPUTE_EXPECT(lhs.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(rhs.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(bias.info()->is_resizable(), framework::LogLevel::ERRORS);

        // Allocate tensors
        lhs.allocator()->allocate();
        rhs.allocator()->allocate();
        lhs_reshaped.allocator()->allocate();
        rhs_reshaped.allocator()->allocate();
        bias.allocator()->allocate();
        dst.allocator()->allocate();

        ARM_COMPUTE_EXPECT(!lhs.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!rhs.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!bias.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!lhs_reshaped.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!rhs_reshaped.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!dst.info()->is_resizable(), framework::LogLevel::ERRORS);

        // Fill tensors
        fill(AccessorType(lhs), 0);
        fill(AccessorType(rhs), 1);
        fill(AccessorType(bias), 2);

        // Compute GEMM
        reshape_lhs.run();
        reshape_rhs.run();
        gemm.run();

        return dst;
    }

    SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, DataType data_type, float alpha, float beta, bool broadcast_bias,
                                      const ActivationLayerInfo &act_info)
    {
        TensorShape dst_shape = lhs_shape;
        dst_shape[0]          = rhs_shape[0];
        dst_shape[1]          = lhs_shape[1];

        // Create reference
        SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };
        SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };
        SimpleTensor<T> bias{ dst_shape, data_type, 1 };

        const int n          = rhs_shape[0];
        const int m          = lhs_shape[1];
        const int batch_size = lhs_shape[2];

        // Fill reference
        fill(lhs, 0);
        fill(rhs, 1);
        fill(bias, 2);

        if(broadcast_bias)
        {
            // In case of broadcast, we simply need to copy the first row into the following "M" ones
            for(int i = 1; i < m * batch_size; i++)
            {
                memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));
            }
        }

        if(fp_mixed_precision)
        {
            return reference::activation_layer(reference::gemm_mixed_precision<T>(lhs, rhs, bias, alpha, beta), act_info);
        }
        else
        {
            return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);
        }
    }

    TensorType      _target{};
    SimpleTensor<T> _reference{};
};

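// 3D-output (GEMM3D) variant of the reshaped fixture above (depth_output_gemm3d = m_h, broadcast bias).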
template <typename TensorType, typename AccessorType, typename T, typename ReshapeLHSFunctionType, typename ReshapeRHSFunctionType, typename GEMMFunctionType, bool fp_mixed_precision = false>
class GEMMMatrixMultiplyReshaped3DValidationFixture : public framework::Fixture
{
public:
    template <typename...>
    void setup(unsigned int m_w, unsigned int m_h, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0, unsigned int v0, unsigned int h0,
               bool interleave_lhs,
               bool interleave_rhs, DataType data_type, float alpha, float beta, bool lhs_transpose, const ActivationLayerInfo &act_info)
    {
        GEMMLHSMatrixInfo lhs_info;
        lhs_info.m0         = m0;
        lhs_info.k0         = k0;
        lhs_info.v0         = v0;
        lhs_info.interleave = interleave_lhs;
        lhs_info.transpose  = lhs_transpose;

        GEMMRHSMatrixInfo rhs_info;
        rhs_info.n0         = n0;
        rhs_info.k0         = k0;
        rhs_info.h0         = h0;
        rhs_info.interleave = interleave_rhs;
        rhs_info.transpose  = !lhs_transpose;

        // In case of GEMM3D, m is the product between m_w and m_h
        const unsigned int m = m_w * m_h;

        // Set the tensor shapes for LHS and RHS matrices
        const TensorShape lhs_shape(k, m, batch_size);
        const TensorShape rhs_shape(n, k, batch_size);
        const TensorShape bias_shape(n, 1, 1);

        _target    = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, m_h, act_info);
        _reference = compute_reference(lhs_shape, rhs_shape, bias_shape, data_type, alpha, beta, m_h, act_info);
    }

protected:
    template <typename U>
    void fill(U &&tensor, int i)
    {
        std::uniform_real_distribution<> distribution(-1.0f, 1.0f);
        library->fill(tensor, distribution, i);
    }

    TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,
                              DataType data_type, float alpha, float beta, unsigned int m_h, const ActivationLayerInfo &act_info)
    {
        // Create tensors
        TensorType lhs  = create_tensor<TensorType>(lhs_shape, data_type, 1);
        TensorType rhs  = create_tensor<TensorType>(rhs_shape, data_type, 1);
        TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);
        TensorType lhs_reshaped;
        TensorType rhs_reshaped;
        TensorType dst;

        const unsigned int M = lhs_shape[1];
        const unsigned int N = rhs_shape[0];
        const unsigned int K = lhs_shape[0];
        GEMMKernelInfo     kernel_info;
        kernel_info.m                       = M;
        kernel_info.n                       = N;
        kernel_info.k                       = K;
        kernel_info.depth_output_gemm3d     = m_h;
        kernel_info.reinterpret_input_as_3d = false;
        kernel_info.broadcast_bias          = true;
        kernel_info.activation_info         = act_info;
        kernel_info.fp_mixed_precision      = fp_mixed_precision;

        // The output tensor will be auto-initialized within the function

        // Create and configure function
        ReshapeLHSFunctionType reshape_lhs;
        ReshapeRHSFunctionType reshape_rhs;
        GEMMFunctionType       gemm;
        reshape_lhs.configure(&lhs, &lhs_reshaped, lhs_info);
        reshape_rhs.configure(&rhs, &rhs_reshaped, rhs_info);
        gemm.configure(&lhs_reshaped, &rhs_reshaped, &bias, &dst, alpha, beta, lhs_info, rhs_info, kernel_info);

        ARM_COMPUTE_EXPECT(lhs.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(rhs.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(bias.info()->is_resizable(), framework::LogLevel::ERRORS);

        // Allocate tensors
        lhs.allocator()->allocate();
        rhs.allocator()->allocate();
        lhs_reshaped.allocator()->allocate();
        rhs_reshaped.allocator()->allocate();
        bias.allocator()->allocate();
        dst.allocator()->allocate();

        ARM_COMPUTE_EXPECT(!lhs.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!rhs.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!lhs_reshaped.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!rhs_reshaped.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!bias.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!dst.info()->is_resizable(), framework::LogLevel::ERRORS);

        // Fill tensors
        fill(AccessorType(lhs), 0);
        fill(AccessorType(rhs), 1);
        fill(AccessorType(bias), 2);

        // Compute GEMM
        reshape_lhs.run();
        reshape_rhs.run();
        gemm.run();

        return dst;
    }

    SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, DataType data_type, float alpha, float beta, unsigned int m_h,
                                      const ActivationLayerInfo &act_info)
    {
        TensorShape dst_shape = lhs_shape;
        dst_shape.set(0, rhs_shape[0]);
        dst_shape.set(1, lhs_shape[1] / m_h);
        dst_shape.set(2, m_h);
        dst_shape.set(3, lhs_shape[2]);

        // Create reference
        SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };
        SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };
        SimpleTensor<T> bias{ dst_shape, data_type, 1 };

        const int n          = rhs_shape[0];
        const int m          = lhs_shape[1];
        const int batch_size = lhs_shape[2];

        // Fill reference
        fill(lhs, 0);
        fill(rhs, 1);
        fill(bias, 2);

        // In case of broadcast, we simply need to copy the first row into the following "M" ones
        for(int i = 1; i < m * batch_size; i++)
        {
            memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));
        }

        if(fp_mixed_precision)
        {
            return reference::activation_layer(reference::gemm_mixed_precision<T>(lhs, rhs, bias, alpha, beta), act_info);
        }
        else
        {
            return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);
        }
    }

    TensorType      _target{};
    SimpleTensor<T> _reference{};
};

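// Fixture for the "reshaped only RHS" GEMM kernels: only the RHS matrix is reshaped
// (optionally interleaved and/or transposed), while the LHS is consumed as-is.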
template <typename TensorType, typename AccessorType, typename T, typename ReshapeRHSFunctionType, typename GEMMFunctionType>
class GEMMMatrixMultiplyReshapedOnlyRHSValidationFixture : public framework::Fixture
{
public:
    template <typename...>
    void setup(unsigned int m, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0, unsigned int h0,
               bool interleave_rhs, bool transpose_rhs, DataType data_type, float alpha, float beta, bool broadcast_bias, const ActivationLayerInfo &act_info)
    {
        GEMMLHSMatrixInfo lhs_info;
        lhs_info.m0 = m0;
        lhs_info.k0 = k0;

        GEMMRHSMatrixInfo rhs_info;
        rhs_info.n0         = n0;
        rhs_info.k0         = k0;
        rhs_info.h0         = h0;
        rhs_info.interleave = interleave_rhs;
        rhs_info.transpose  = transpose_rhs;

        // Set the tensor shapes for LHS and RHS matrices
        const TensorShape lhs_shape(k, m, batch_size);
        const TensorShape rhs_shape(n, k, batch_size);
        const TensorShape bias_shape(n,
                                     broadcast_bias ? 1 : m,
                                     broadcast_bias ? 1 : batch_size);

        _target    = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, broadcast_bias, act_info);
        _reference = compute_reference(lhs_shape, rhs_shape, bias_shape, data_type, alpha, beta, broadcast_bias, act_info);
    }

protected:
    template <typename U>
    void fill(U &&tensor, int i)
    {
        std::uniform_real_distribution<> distribution(-1.0f, 1.0f);
        library->fill(tensor, distribution, i);

        // Fill the tensor border with infinity in order to check for the presence of NaN values (i.e. inf * 0)
        std::uniform_real_distribution<> distribution_inf(std::numeric_limits<float>::infinity(), std::numeric_limits<float>::infinity());
        library->fill_borders_with_garbage(tensor, distribution_inf, i);
    }

    TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,
                              DataType data_type, float alpha, float beta, bool broadcast_bias, const ActivationLayerInfo &act_info)
    {
        // Create tensors
        TensorType lhs  = create_tensor<TensorType>(lhs_shape, data_type, 1);
        TensorType rhs  = create_tensor<TensorType>(rhs_shape, data_type, 1);
        TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);
        TensorType rhs_reshaped;
        TensorType dst;

        const unsigned int M = lhs_shape[1];
        const unsigned int N = rhs_shape[0];
        const unsigned int K = lhs_shape[0];
        GEMMKernelInfo     kernel_info;
        kernel_info.m                       = M;
        kernel_info.n                       = N;
        kernel_info.k                       = K;
        kernel_info.depth_output_gemm3d     = 0;
        kernel_info.reinterpret_input_as_3d = false;
        kernel_info.broadcast_bias          = broadcast_bias;
        kernel_info.activation_info         = act_info;

        // The output tensor will be auto-initialized within the function

        // Create and configure function
        ReshapeRHSFunctionType reshape_rhs;
        GEMMFunctionType       gemm;
        reshape_rhs.configure(&rhs, &rhs_reshaped, rhs_info);
        gemm.configure(&lhs, &rhs_reshaped, &bias, &dst, alpha, beta, lhs_info, rhs_info, kernel_info);

        ARM_COMPUTE_EXPECT(lhs.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(rhs.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(bias.info()->is_resizable(), framework::LogLevel::ERRORS);

        // Allocate tensors
        lhs.allocator()->allocate();
        rhs.allocator()->allocate();
        rhs_reshaped.allocator()->allocate();
        bias.allocator()->allocate();
        dst.allocator()->allocate();

        ARM_COMPUTE_EXPECT(!lhs.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!rhs.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!rhs_reshaped.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!bias.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!dst.info()->is_resizable(), framework::LogLevel::ERRORS);

        // Fill tensors
        fill(AccessorType(lhs), 0);
        fill(AccessorType(rhs), 1);
        fill(AccessorType(bias), 2);

        // Compute GEMM
        reshape_rhs.run();
        gemm.run();

        return dst;
    }

    SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, DataType data_type, float alpha, float beta, bool broadcast_bias,
                                      const ActivationLayerInfo &act_info)
    {
        TensorShape dst_shape = lhs_shape;
        dst_shape[0]          = rhs_shape[0];
        dst_shape[1]          = lhs_shape[1];

        // Create reference
        SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };
        SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };
        SimpleTensor<T> bias{ dst_shape, data_type, 1 };

        const int n          = rhs_shape[0];
        const int m          = lhs_shape[1];
        const int batch_size = lhs_shape[2];

        // Fill reference
        fill(lhs, 0);
        fill(rhs, 1);
        fill(bias, 2);

        if(broadcast_bias)
        {
            // In case of broadcast, we simply need to copy the first row into the following "M" ones
            for(int i = 1; i < m * batch_size; i++)
            {
                memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));
            }
        }

        return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);
    }

    TensorType      _target{};
    SimpleTensor<T> _reference{};
};

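// 3D-output (GEMM3D) variant of the "reshaped only RHS" fixture above.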
Gian Marco Iodicee16c8902019-06-14 16:11:10 +01001115template <typename TensorType, typename AccessorType, typename T, typename ReshapeRHSFunctionType, typename GEMMFunctionType>
1116class GEMMMatrixMultiplyReshapedOnlyRHS3DValidationFixture : public framework::Fixture
1117{
1118public:
1119 template <typename...>
1120 void setup(unsigned int m_w, unsigned int m_h, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0, unsigned int h0,
Gian Marco Iodiceca1f4602019-07-16 15:46:48 +01001121 bool interleave_rhs, bool transpose_rhs, DataType data_type, float alpha, float beta, const ActivationLayerInfo &act_info)
Gian Marco Iodicee16c8902019-06-14 16:11:10 +01001122 {
1123 GEMMLHSMatrixInfo lhs_info;
1124 lhs_info.m0 = m0;
1125 lhs_info.k0 = k0;
1126
1127 GEMMRHSMatrixInfo rhs_info;
1128 rhs_info.n0 = n0;
1129 rhs_info.k0 = k0;
1130 rhs_info.h0 = h0;
1131 rhs_info.interleave = interleave_rhs;
1132 rhs_info.transpose = transpose_rhs;
1133
1134 // In case of GEMM3D, m is the product between m_w and m_h
1135 const unsigned int m = m_w * m_h;
1136
1137 // Set the tensor shapes for LHS and RHS matrices
1138 const TensorShape lhs_shape(k, m, batch_size);
1139 const TensorShape rhs_shape(n, k, batch_size);
1140 const TensorShape bias_shape(n, 1, 1);
1141
Gian Marco Iodiceca1f4602019-07-16 15:46:48 +01001142 _target = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, m_h, act_info);
1143 _reference = compute_reference(lhs_shape, rhs_shape, bias_shape, data_type, alpha, beta, m_h, act_info);
Gian Marco Iodicee16c8902019-06-14 16:11:10 +01001144 }
1145
1146protected:
1147 template <typename U>
1148 void fill(U &&tensor, int i)
1149 {
1150 std::uniform_real_distribution<> distribution(-1.0f, 1.0f);
1151 library->fill(tensor, distribution, i);
1152 }
1153
1154 TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,
1155 DataType data_type, float alpha, float beta,
Gian Marco Iodiceca1f4602019-07-16 15:46:48 +01001156 unsigned int m_h, const ActivationLayerInfo &act_info)
Gian Marco Iodicee16c8902019-06-14 16:11:10 +01001157 {
1158 // Create tensors
1159 TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);
1160 TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);
1161 TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);
1162 TensorType rhs_reshaped;
1163 TensorType dst;
1164
1165 const unsigned int M = lhs_shape[1];
1166 const unsigned int N = rhs_shape[0];
1167 const unsigned int K = lhs_shape[0];
Gian Marco Iodice7026b302019-06-26 17:18:11 +01001168 GEMMKernelInfo kernel_info;
1169 kernel_info.m = M;
1170 kernel_info.n = N;
1171 kernel_info.k = K;
1172 kernel_info.depth_output_gemm3d = m_h;
1173 kernel_info.reinterpret_input_as_3d = false;
1174 kernel_info.broadcast_bias = true;
Gian Marco Iodiceca1f4602019-07-16 15:46:48 +01001175 kernel_info.activation_info = act_info;
Gian Marco Iodicee16c8902019-06-14 16:11:10 +01001176
        // The output tensor will be auto-initialized within the function

        // Create and configure function
        ReshapeRHSFunctionType reshape_rhs;
        GEMMFunctionType       gemm;
        reshape_rhs.configure(&rhs, &rhs_reshaped, rhs_info);
        gemm.configure(&lhs, &rhs_reshaped, &bias, &dst, alpha, beta, lhs_info, rhs_info, kernel_info);

        ARM_COMPUTE_EXPECT(lhs.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(rhs.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(bias.info()->is_resizable(), framework::LogLevel::ERRORS);

        // Allocate tensors
        lhs.allocator()->allocate();
        rhs.allocator()->allocate();
        rhs_reshaped.allocator()->allocate();
        bias.allocator()->allocate();
        dst.allocator()->allocate();

        ARM_COMPUTE_EXPECT(!lhs.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!rhs.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!rhs_reshaped.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!bias.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!dst.info()->is_resizable(), framework::LogLevel::ERRORS);

        // Fill tensors
        fill(AccessorType(lhs), 0);
        fill(AccessorType(rhs), 1);
        fill(AccessorType(bias), 2);

        // Compute GEMM
        reshape_rhs.run();
        gemm.run();

        return dst;
    }

    SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, DataType data_type, float alpha, float beta, unsigned int m_h,
                                      const ActivationLayerInfo &act_info)
    {
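        // Build the GEMM3D output shape: the 2D result of shape (N, M) is
        // reinterpreted as (N, M / m_h, m_h) for each batch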
        TensorShape dst_shape = lhs_shape;
        dst_shape.set(0, rhs_shape[0]);
        dst_shape.set(1, lhs_shape[1] / m_h);
        dst_shape.set(2, m_h);
        dst_shape.set(3, lhs_shape[2]);

        // Create reference
        SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };
        SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };
        SimpleTensor<T> bias{ dst_shape, data_type, 1 };

        const int n          = rhs_shape[0];
        const int m          = lhs_shape[1];
        const int batch_size = lhs_shape[2];

        // Fill reference
        fill(lhs, 0);
        fill(rhs, 1);
        fill(bias, 2);

        // The reference implementation expects a full-size bias, so replicate the
        // first (broadcast) row across the remaining M * batch_size - 1 rows
        for(int i = 1; i < m * batch_size; i++)
        {
            memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));
        }

        return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);
    }

    TensorType      _target{};
    SimpleTensor<T> _reference{};
};

template <typename TensorType, typename AccessorType, typename T, typename GEMMFunctionType>
class GEMMMatrixMultiplyNativeValidationFixture : public framework::Fixture
{
public:
    template <typename...>
    void setup(unsigned int m, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0, DataType data_type, float alpha, float beta, bool broadcast_bias,
               const ActivationLayerInfo &act_info)
    {
        GEMMLHSMatrixInfo lhs_info;
        lhs_info.m0 = m0;
        lhs_info.k0 = k0;

        GEMMRHSMatrixInfo rhs_info;
        rhs_info.n0 = n0;
        rhs_info.k0 = k0;

        // Set the tensor shapes for LHS and RHS matrices
        const TensorShape lhs_shape(k, m, batch_size);
        const TensorShape rhs_shape(n, k, batch_size);
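        // With broadcast_bias the bias is a single row of N values; otherwise it is
        // a full (N, M) matrix per batch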
        const TensorShape bias_shape(n,
                                     broadcast_bias ? 1 : m,
                                     broadcast_bias ? 1 : batch_size);

        _target    = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, broadcast_bias, act_info);
        _reference = compute_reference(lhs_shape, rhs_shape, bias_shape, data_type, alpha, beta, broadcast_bias, act_info);
    }

protected:
    template <typename U>
    void fill(U &&tensor, int i)
    {
        std::uniform_real_distribution<> distribution(-1.0f, 1.0f);
        library->fill(tensor, distribution, i);

        // Fill the tensor padding with infinity so that an out-of-bounds access
        // shows up as a NaN in the output (e.g. inf * 0)
        std::uniform_real_distribution<> distribution_inf(std::numeric_limits<float>::infinity(), std::numeric_limits<float>::infinity());
        library->fill_borders_with_garbage(tensor, distribution_inf, i);
    }

    TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,
                              DataType data_type, float alpha, float beta, bool broadcast_bias, const ActivationLayerInfo &act_info)
    {
        // Create tensors
        TensorType lhs  = create_tensor<TensorType>(lhs_shape, data_type, 1);
        TensorType rhs  = create_tensor<TensorType>(rhs_shape, data_type, 1);
        TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);
        TensorType dst;

        const unsigned int M = lhs_shape[1];
        const unsigned int N = rhs_shape[0];
        const unsigned int K = lhs_shape[0];
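        // Plain 2D GEMM: depth_output_gemm3d = 0 disables the GEMM3D output
        // reinterpretation used by the 3D fixtures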
        GEMMKernelInfo kernel_info;
        kernel_info.m                       = M;
        kernel_info.n                       = N;
        kernel_info.k                       = K;
        kernel_info.depth_output_gemm3d     = 0;
        kernel_info.reinterpret_input_as_3d = false;
        kernel_info.broadcast_bias          = broadcast_bias;
        kernel_info.activation_info         = act_info;

        // Create and configure function
        GEMMFunctionType gemm;
        gemm.configure(&lhs, &rhs, &bias, &dst, alpha, beta, lhs_info, rhs_info, kernel_info);

        ARM_COMPUTE_EXPECT(lhs.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(rhs.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(bias.info()->is_resizable(), framework::LogLevel::ERRORS);

        // Allocate tensors
        lhs.allocator()->allocate();
        rhs.allocator()->allocate();
        bias.allocator()->allocate();
        dst.allocator()->allocate();

        ARM_COMPUTE_EXPECT(!lhs.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!rhs.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!bias.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!dst.info()->is_resizable(), framework::LogLevel::ERRORS);

        // Fill tensors
        fill(AccessorType(lhs), 0);
        fill(AccessorType(rhs), 1);
        fill(AccessorType(bias), 2);

        // Compute GEMM
        gemm.run();

        return dst;
    }

    SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, DataType data_type, float alpha, float beta, bool broadcast_bias,
                                      const ActivationLayerInfo &act_info)
    {
        TensorShape dst_shape = lhs_shape;
        dst_shape[0]          = rhs_shape[0];
        dst_shape[1]          = lhs_shape[1];

        // Create reference
        SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };
        SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };
        SimpleTensor<T> bias{ dst_shape, data_type, 1 };

        const int n          = rhs_shape[0];
        const int m          = lhs_shape[1];
        const int batch_size = lhs_shape[2];

        // Fill reference
        fill(lhs, 0);
        fill(rhs, 1);
        fill(bias, 2);

        if(broadcast_bias)
        {
            // The reference implementation expects a full-size bias, so replicate
            // the broadcast row across the remaining M * batch_size - 1 rows
            for(int i = 1; i < m * batch_size; i++)
            {
                memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));
            }
        }

        return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);
    }

    TensorType      _target{};
    SimpleTensor<T> _reference{};
};

template <typename TensorType, typename AccessorType, typename T, typename GEMMFunctionType>
class GEMMMatrixMultiplyNative3DValidationFixture : public framework::Fixture
{
public:
    template <typename...>
    void setup(unsigned int m_w, unsigned int m_h, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0, DataType data_type, float alpha, float beta,
               const ActivationLayerInfo &act_info)
    {
        GEMMLHSMatrixInfo lhs_info;
        lhs_info.m0 = m0;
        lhs_info.k0 = k0;

        GEMMRHSMatrixInfo rhs_info;
        rhs_info.n0 = n0;
        rhs_info.k0 = k0;

        // In case of GEMM3D, m is the product of m_w and m_h
        const unsigned int m = m_w * m_h;

        // Set the tensor shapes for LHS and RHS matrices
        const TensorShape lhs_shape(k, m, batch_size);
        const TensorShape rhs_shape(n, k, batch_size);
        const TensorShape bias_shape(n, 1, 1);

        _target    = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, m_h, act_info);
        _reference = compute_reference(lhs_shape, rhs_shape, bias_shape, data_type, alpha, beta, m_h, act_info);
    }

protected:
    template <typename U>
    void fill(U &&tensor, int i)
    {
        std::uniform_real_distribution<> distribution(-1.0f, 1.0f);
        library->fill(tensor, distribution, i);
    }

    TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,
                              DataType data_type, float alpha, float beta, unsigned int m_h, const ActivationLayerInfo &act_info)
    {
        // Create tensors
        TensorType lhs  = create_tensor<TensorType>(lhs_shape, data_type, 1);
        TensorType rhs  = create_tensor<TensorType>(rhs_shape, data_type, 1);
        TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);
        TensorType dst;

        const unsigned int M = lhs_shape[1];
        const unsigned int N = rhs_shape[0];
        const unsigned int K = lhs_shape[0];
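        // As in the 3D fixture above: the output is reinterpreted as 3D with m_h
        // rows per slice and the bias row is broadcast across all M rows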
        GEMMKernelInfo kernel_info;
        kernel_info.m                       = M;
        kernel_info.n                       = N;
        kernel_info.k                       = K;
        kernel_info.depth_output_gemm3d     = m_h;
        kernel_info.reinterpret_input_as_3d = false;
        kernel_info.broadcast_bias          = true;
        kernel_info.activation_info         = act_info;

        // The output tensor will be auto-initialized within the function

        // Create and configure function
        GEMMFunctionType gemm;
        gemm.configure(&lhs, &rhs, &bias, &dst, alpha, beta, lhs_info, rhs_info, kernel_info);

        ARM_COMPUTE_EXPECT(lhs.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(rhs.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(bias.info()->is_resizable(), framework::LogLevel::ERRORS);

        // Allocate tensors
        lhs.allocator()->allocate();
        rhs.allocator()->allocate();
        bias.allocator()->allocate();
        dst.allocator()->allocate();

        ARM_COMPUTE_EXPECT(!lhs.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!rhs.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!bias.info()->is_resizable(), framework::LogLevel::ERRORS);
        ARM_COMPUTE_EXPECT(!dst.info()->is_resizable(), framework::LogLevel::ERRORS);

        // Fill tensors
        fill(AccessorType(lhs), 0);
        fill(AccessorType(rhs), 1);
        fill(AccessorType(bias), 2);

        // Compute GEMM
        gemm.run();

        return dst;
    }

    SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, DataType data_type, float alpha, float beta, unsigned int m_h,
                                      const ActivationLayerInfo &act_info)
    {
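        // Reinterpret the (N, M) result as (N, M / m_h, m_h) per batch to match
        // the GEMM3D output of the target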
        TensorShape dst_shape = lhs_shape;
        dst_shape.set(0, rhs_shape[0]);
        dst_shape.set(1, lhs_shape[1] / m_h);
        dst_shape.set(2, m_h);
        dst_shape.set(3, lhs_shape[2]);

        // Create reference
        SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };
        SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };
        SimpleTensor<T> bias{ dst_shape, data_type, 1 };

        const int n          = rhs_shape[0];
        const int m          = lhs_shape[1];
        const int batch_size = lhs_shape[2];

        // Fill reference
        fill(lhs, 0);
        fill(rhs, 1);
        fill(bias, 2);

        // The reference implementation expects a full-size bias, so replicate the
        // broadcast row across the remaining M * batch_size - 1 rows
        for(int i = 1; i < m * batch_size; i++)
        {
            memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));
        }

        return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);
    }

    TensorType      _target{};
    SimpleTensor<T> _reference{};
};
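
// Illustrative usage sketch (not part of this header): fixtures like the ones
// above are typically instantiated through the test framework's
// FIXTURE_DATA_TEST_CASE macro. The alias, kernel, dataset and tolerance names
// below are hypothetical placeholders.
//
// using CLGEMMMatrixMultiplyNativeFixture =
//     GEMMMatrixMultiplyNativeValidationFixture<CLTensor, CLAccessor, float, CLGEMMMatrixMultiplyNative>;
//
// FIXTURE_DATA_TEST_CASE(RunSmall, CLGEMMMatrixMultiplyNativeFixture, framework::DatasetMode::ALL,
//                        small_gemm_native_dataset) // m, n, k, batch_size, m0, n0, k0,
//                                                   // data type, alpha, beta, broadcast_bias, act_info
// {
//     // setup() has already produced _target and _reference; the test body only
//     // needs to compare them within a tolerance
//     validate(CLAccessor(_target), _reference, tolerance_f32);
// }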

} // namespace validation
} // namespace test
} // namespace arm_compute
#endif /* ARM_COMPUTE_TEST_GEMM_FIXTURE */