Blame - tests/validation/fixtures/GEMMFixture.h - ml/ComputeLibrary

2018-07-26 11:44:03 +0100

[diff] [blame]

48

class GEMMValidationFixture : public framework::Fixture

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

49

{

50

public:

51

template <typename...>

Pablo Tello

2018-10-30 11:18:37 +0000

[diff] [blame]

52

void setup(TensorShape shape_a, TensorShape shape_b, TensorShape shape_c, TensorShape output_shape, float alpha, float beta, bool pretranspose, DataType data_type)

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

53

{

Pablo Tello

2018-10-30 11:18:37 +0000

[diff] [blame]

54

_target = compute_target(shape_a, shape_b, shape_c, output_shape, alpha, beta, pretranspose, data_type);

Vidhya Sudhan Loganathan

2018-07-02 09:13:49 +0100

[diff] [blame]

55

_reference = compute_reference(shape_a, shape_b, shape_c, output_shape, alpha, beta, data_type);

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

}

protected:

template <typename U>

Pablo Tello

2018-10-30 11:18:37 +0000

[diff] [blame]

60

void fill(U &&tensor, int i, float lo = -1.f, float hi = 1.f)

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

61

{

62

switch(tensor.data_type())

{

case DataType::F16:

case DataType::F32:

{

Pablo Tello

2018-10-30 11:18:37 +0000

[diff] [blame]

67

std::uniform_real_distribution<> distribution(lo, hi);

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

68

library->fill(tensor, distribution, i);

break;

}

default:

library->fill_tensor_uniform(tensor, i);

}

}

TensorType compute_target(const TensorShape &shape_a, const TensorShape &shape_b, const TensorShape &shape_c, const TensorShape &output_shape, float alpha, float beta,

Pablo Tello

2018-10-30 11:18:37 +0000

[diff] [blame]

77

bool pretranspose, DataType data_type)

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

78

{

79

// Create tensors

Vidhya Sudhan Loganathan

2018-07-02 09:13:49 +0100

[diff] [blame]

80

TensorType a = create_tensor<TensorType>(shape_a, data_type, 1);

81

TensorType b = create_tensor<TensorType>(shape_b, data_type, 1);

82

TensorType c = create_tensor<TensorType>(shape_c, data_type, 1);

83

TensorType dst = create_tensor<TensorType>(output_shape, data_type, 1);

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

84

85

// Create and configure function

86

FunctionType gemm;

Isabella Gottardi

8e74f44

2018-03-01 16:42:00 +0000

[diff] [blame]

87

// The GEMMinfo includes the values of the depth in case of reinterpreted 3d output.

Gian Marco Iodice

3139f03

2018-11-05 14:26:32 +0000

[diff] [blame]

88

// If the output shape has the same number of dimensions of the input the method called is a 2D matrix multiplication (depth_output_reinterpreted_as_3D = 0),

Isabella Gottardi

8e74f44

2018-03-01 16:42:00 +0000

[diff] [blame]

89

// in the other case we have to use the reinterpreted version of GEMM (depth_output_reinterpreted_as_3D = depth of the 3D output).

Gian Marco Iodice

2019-07-29 14:27:16 +0100

[diff] [blame^]

90

gemm.configure(&a,

91

&b,

92

(disable_c) ? nullptr : &c,

93

&dst,

94

alpha, beta,

95

GEMMInfo(false, false, false, (reinterpret_output_as_3d ? output_shape[2] : 0), reinterpret_input_as_3d, false, GEMMLowpOutputStageInfo(), false, (reinterpret_input_as_3d

96

|| reinterpret_output_as_3d)));

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

97

ARM_COMPUTE_EXPECT(a.info()->is_resizable(), framework::LogLevel::ERRORS);

98

ARM_COMPUTE_EXPECT(b.info()->is_resizable(), framework::LogLevel::ERRORS);

99

ARM_COMPUTE_EXPECT(c.info()->is_resizable(), framework::LogLevel::ERRORS);

100

ARM_COMPUTE_EXPECT(dst.info()->is_resizable(), framework::LogLevel::ERRORS);

101

102

// Allocate tensors

103

a.allocator()->allocate();

104

b.allocator()->allocate();

105

c.allocator()->allocate();

106

dst.allocator()->allocate();

107

108

ARM_COMPUTE_EXPECT(!a.info()->is_resizable(), framework::LogLevel::ERRORS);

109

ARM_COMPUTE_EXPECT(!b.info()->is_resizable(), framework::LogLevel::ERRORS);

110

ARM_COMPUTE_EXPECT(!c.info()->is_resizable(), framework::LogLevel::ERRORS);

111

ARM_COMPUTE_EXPECT(!dst.info()->is_resizable(), framework::LogLevel::ERRORS);

112

113

// Fill tensors

114

fill(AccessorType(a), 0);

115

fill(AccessorType(b), 1);

Pablo Tello

2018-10-30 11:18:37 +0000

[diff] [blame]

116

if(!disable_c)

117

{

118

fill(AccessorType(c), 2);

119

}

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

120

121

// Compute GEMM function

gemm.run();

return dst;

}

SimpleTensor<T> compute_reference(const TensorShape &shape_a, const TensorShape &shape_b, const TensorShape &shape_c, const TensorShape &output_shape, float alpha, float beta,

Vidhya Sudhan Loganathan

2018-07-02 09:13:49 +0100

[diff] [blame]

128

DataType data_type)

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

129

{

Gian Marco Iodice

2018-07-26 11:44:03 +0100

[diff] [blame]

130

TensorShape shape_a_to_use = shape_a;

Gian Marco Iodice

2019-07-29 14:27:16 +0100

[diff] [blame^]

131

Gian Marco Iodice

2018-07-26 11:44:03 +0100

[diff] [blame]

132

if(reinterpret_input_as_3d)

133

{

134

// Collapse the second and third dimension if the input is 3D

135

shape_a_to_use.collapse(2U, 1U);

136

}

137

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

138

// Create reference

Gian Marco Iodice

2018-07-26 11:44:03 +0100

[diff] [blame]

139

SimpleTensor<T> a{ shape_a_to_use, data_type, 1 };

Vidhya Sudhan Loganathan

2018-07-02 09:13:49 +0100

[diff] [blame]

140

SimpleTensor<T> b{ shape_b, data_type, 1 };

Gian Marco Iodice

2019-07-29 14:27:16 +0100

[diff] [blame^]

141

SimpleTensor<T> c{ output_shape, data_type, 1 };

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

// Fill reference

fill(a, 0);

fill(b, 1);

Gian Marco Iodice

2019-07-29 14:27:16 +0100

[diff] [blame^]

146

fill(c, 2);

147

148

if(reinterpret_input_as_3d || reinterpret_output_as_3d)

Pablo Tello

2018-10-30 11:18:37 +0000

[diff] [blame]

149

{

Gian Marco Iodice

2019-07-29 14:27:16 +0100

[diff] [blame^]

150

const int n = shape_b[0];

151

const int m = reinterpret_output_as_3d ? output_shape[1] * output_shape[2] : output_shape[1];

152

const int batch_size = reinterpret_output_as_3d ? output_shape[3] : output_shape[2];

153

154

// In case of broadcast, we need simply copy the first into the following "M" ones

155

for(int i = 1; i < m * batch_size; i++)

156

{

157

memcpy(c.data() + i * n, c.data(), n * sizeof(T));

158

}

Pablo Tello

2018-10-30 11:18:37 +0000

[diff] [blame]

159

}

Gian Marco Iodice

2019-07-29 14:27:16 +0100

[diff] [blame^]

160

161

// Setting beta to 0 will effectively disable C for the

162

// computation of the reference: alpha * A * B + 0 * C

163

return reference::gemm<T>(a, b, c, alpha, disable_c ? 0.f : beta);

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

164

}

165

166

TensorType _target{};

167

SimpleTensor<T> _reference{};

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

168

};

169

Gian Marco Iodice

d1f5476

2019-07-19 09:54:47 +0100

[diff] [blame]

170

template <typename TensorType, typename AccessorType, typename T, typename GEMMFunctionType>

171

class GEMMMatrixMultiplyValidationFixture : public framework::Fixture

172

{

173

public:

174

template <typename...>

175

void setup(unsigned int m, unsigned int n, unsigned int k, unsigned int batch_size, float alpha, float beta, bool broadcast_bias, bool fp16_mixed_precision, const ActivationLayerInfo &act_info,

176

DataType data_type, GPUTarget gpu_arch)

177

{

178

// Set the tensor shapes for LHS and RHS matrices

179

const TensorShape lhs_shape(k, m, batch_size);

180

const TensorShape rhs_shape(n, k, batch_size);

181

const TensorShape bias_shape(n,

182

broadcast_bias ? 1 : m,

183

broadcast_bias ? 1 : batch_size);

184

185

_target = compute_target(lhs_shape, rhs_shape, bias_shape, data_type, alpha, beta, broadcast_bias, fp16_mixed_precision, act_info, gpu_arch);

186

_reference = compute_reference(lhs_shape, rhs_shape, bias_shape, data_type, alpha, beta, broadcast_bias, act_info);

}

protected:

template <typename U>

191

void fill(U &&tensor, int i)

192

{

193

std::uniform_real_distribution<> distribution(-1.0f, 1.0f);

194

library->fill(tensor, distribution, i);

195

196

// Fill border with infinity in order to check the presence of NaN values (i.e. inf * 0)

197

std::uniform_real_distribution<> distribution_inf(std::numeric_limits<float>::infinity(), std::numeric_limits<float>::infinity());

198

library->fill_borders_with_garbage(tensor, distribution_inf, i);

199

}

200

201

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, DataType data_type, float alpha, float beta, bool broadcast_bias,

202

bool fp16_mixed_precision, const ActivationLayerInfo &act_info, GPUTarget gpu_arch)

203

{

204

// Create tensors

205

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

206

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

207

TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);

208

TensorType dst;

209

210

const unsigned int m = lhs_shape[1];

211

const unsigned int n = rhs_shape[0];

212

const unsigned int k = lhs_shape[0];

213

GEMMReshapeInfo reshape_info(m, n, k, 1, 1, 0, false, broadcast_bias);

214

215

// The output tensor will be auto-initialized within the function

216

217

// Create and configure function

218

GEMMFunctionType gemm;

219

gemm.configure(gpu_arch, &lhs, &rhs, &bias, &dst, alpha, beta, false, reshape_info, fp16_mixed_precision, act_info);

220

221

ARM_COMPUTE_EXPECT(lhs.info()->is_resizable(), framework::LogLevel::ERRORS);

222

ARM_COMPUTE_EXPECT(rhs.info()->is_resizable(), framework::LogLevel::ERRORS);

223

ARM_COMPUTE_EXPECT(bias.info()->is_resizable(), framework::LogLevel::ERRORS);

224

225

// Allocate tensors

226

lhs.allocator()->allocate();

227

rhs.allocator()->allocate();

228

bias.allocator()->allocate();

229

dst.allocator()->allocate();

230

231

ARM_COMPUTE_EXPECT(!lhs.info()->is_resizable(), framework::LogLevel::ERRORS);

232

ARM_COMPUTE_EXPECT(!rhs.info()->is_resizable(), framework::LogLevel::ERRORS);

233

ARM_COMPUTE_EXPECT(!bias.info()->is_resizable(), framework::LogLevel::ERRORS);

234

ARM_COMPUTE_EXPECT(!dst.info()->is_resizable(), framework::LogLevel::ERRORS);

235

236

// Fill tensors

237

fill(AccessorType(lhs), 0);

238

fill(AccessorType(rhs), 1);

239

fill(AccessorType(bias), 2);

// Compute GEMM

gemm.run();

return dst;

}

SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, DataType data_type, float alpha, float beta, bool broadcast_bias,

248

const ActivationLayerInfo &act_info)

249

{

250

TensorShape dst_shape = lhs_shape;

251

dst_shape[0] = rhs_shape[0];

252

dst_shape[1] = lhs_shape[1];

253

254

// Create reference

255

SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };

256

SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };

257

SimpleTensor<T> bias{ dst_shape, data_type, 1 };

258

259

const int n = rhs_shape[0];

260

const int m = lhs_shape[1];

261

const int batch_size = lhs_shape[2];

// Fill reference

fill(lhs, 0);

fill(rhs, 1);

fill(bias, 2);

if(broadcast_bias)

{

// In case of broadcast, we need simply copy the first into the following "M" ones

271

for(int i = 1; i < m * batch_size; i++)

272

{

273

memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));

}

}

return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);

278

}

279

280

TensorType _target{};

281

SimpleTensor<T> _reference{};

282

};

283

284

template <typename TensorType, typename AccessorType, typename T, typename GEMMFunctionType>

285

class GEMMMatrixMultiply3DValidationFixture : public framework::Fixture

286

{

287

public:

288

template <typename...>

289

void setup(unsigned int m_w, unsigned int m_h, unsigned int n, unsigned int k, unsigned int batch_size, float alpha, float beta, bool broadcast_bias, bool fp16_mixed_precision,

290

const ActivationLayerInfo &act_info, DataType data_type, GPUTarget gpu_arch)

291

{

292

// In case of GEMM3D, m is the product between m_w and m_h

293

const unsigned int m = m_w * m_h;

294

295

// Set the tensor shapes for LHS and RHS matrices

296

const TensorShape lhs_shape(k, m, batch_size);

297

const TensorShape rhs_shape(n, k, batch_size);

298

const TensorShape bias_shape(n, 1, 1);

299

300

_target = compute_target(lhs_shape, rhs_shape, bias_shape, data_type, alpha, beta, m_h, fp16_mixed_precision, act_info, gpu_arch);

301

_reference = compute_reference(lhs_shape, rhs_shape, bias_shape, data_type, alpha, beta, m_h, act_info);

}

protected:

template <typename U>

306

void fill(U &&tensor, int i)

307

{

308

std::uniform_real_distribution<> distribution(-1.0f, 1.0f);

309

library->fill(tensor, distribution, i);

310

}

311

312

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, DataType data_type, float alpha, float beta, unsigned int m_h,

313

bool fp16_mixed_precision, const ActivationLayerInfo &act_info, GPUTarget gpu_arch)

314

{

315

// Create tensors

316

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

317

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

318

TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);

319

TensorType dst;

320

321

const unsigned int m = lhs_shape[1];

322

const unsigned int n = rhs_shape[0];

323

const unsigned int k = lhs_shape[0];

324

GEMMReshapeInfo reshape_info(m, n, k, 1, 1, m_h, false, true);

325

326

// The output tensor will be auto-initialized within the function

327

328

// Create and configure function

329

GEMMFunctionType gemm;

330

gemm.configure(gpu_arch, &lhs, &rhs, &bias, &dst, alpha, beta, false, reshape_info, fp16_mixed_precision, act_info);

331

332

ARM_COMPUTE_EXPECT(lhs.info()->is_resizable(), framework::LogLevel::ERRORS);

333

ARM_COMPUTE_EXPECT(rhs.info()->is_resizable(), framework::LogLevel::ERRORS);

334

ARM_COMPUTE_EXPECT(bias.info()->is_resizable(), framework::LogLevel::ERRORS);

335

336

// Allocate tensors

337

lhs.allocator()->allocate();

338

rhs.allocator()->allocate();

339

bias.allocator()->allocate();

340

dst.allocator()->allocate();

341

342

ARM_COMPUTE_EXPECT(!lhs.info()->is_resizable(), framework::LogLevel::ERRORS);

343

ARM_COMPUTE_EXPECT(!rhs.info()->is_resizable(), framework::LogLevel::ERRORS);

344

ARM_COMPUTE_EXPECT(!bias.info()->is_resizable(), framework::LogLevel::ERRORS);

345

ARM_COMPUTE_EXPECT(!dst.info()->is_resizable(), framework::LogLevel::ERRORS);

346

347

// Fill tensors

348

fill(AccessorType(lhs), 0);

349

fill(AccessorType(rhs), 1);

350

fill(AccessorType(bias), 2);

// Compute GEMM

gemm.run();

return dst;

}

SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, DataType data_type, float alpha, float beta, unsigned int m_h,

359

const ActivationLayerInfo &act_info)

360

{

361

TensorShape dst_shape = lhs_shape;

362

dst_shape.set(0, rhs_shape[0]);

363

dst_shape.set(1, lhs_shape[1] / m_h);

364

dst_shape.set(2, m_h);

365

dst_shape.set(3, lhs_shape[2]);

366

367

// Create reference

368

SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };

369

SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };

370

SimpleTensor<T> bias{ dst_shape, data_type, 1 };

371

372

const int n = rhs_shape[0];

373

const int m = lhs_shape[1];

374

const int batch_size = lhs_shape[2];

// Fill reference

fill(lhs, 0);

fill(rhs, 1);

fill(bias, 2);

// In case of broadcast, we need simply copy the first into the following "M" ones

382

for(int i = 1; i < m * batch_size; i++)

383

{

384

memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));

385

}

386

387

return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);

388

}

389

390

TensorType _target{};

391

SimpleTensor<T> _reference{};

392

};

393

394

template <typename TensorType, typename AccessorType, typename T, typename ReshapeLHSFunctionType, typename ReshapeRHSFunctionType, typename GEMMFunctionType>

395

class GEMMMatrixMultiplyInterleavedTransposedValidationFixture : public framework::Fixture

396

{

397

public:

398

template <typename...>

399

void setup(unsigned int m, unsigned int n, unsigned int k, unsigned int batch_size, float alpha, float beta, unsigned int v0, unsigned int h0, bool broadcast_bias, bool fp16_mixed_precision,

400

const ActivationLayerInfo &act_info, DataType data_type, GPUTarget gpu_arch)

401

{

402

GEMMLHSMatrixInfo lhs_info;

lhs_info.m0 = 4;

lhs_info.k0 = 4;

lhs_info.v0 = v0;

lhs_info.interleave = true;

407

lhs_info.transpose = true;

408

409

GEMMRHSMatrixInfo rhs_info;

410

rhs_info.n0 = 16 / sizeof(T);

411

rhs_info.k0 = 1;

412

rhs_info.h0 = h0;

413

rhs_info.interleave = false;

414

rhs_info.transpose = false;

415

416

// Set the tensor shapes for LHS and RHS matrices

417

const TensorShape lhs_shape(k, m, batch_size);

418

const TensorShape rhs_shape(n, k, batch_size);

419

const TensorShape bias_shape(n,

420

broadcast_bias ? 1 : m,

421

broadcast_bias ? 1 : batch_size);

422

423

_target = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, broadcast_bias, fp16_mixed_precision, act_info, gpu_arch);

424

_reference = compute_reference(lhs_shape, rhs_shape, bias_shape, data_type, alpha, beta, broadcast_bias, act_info);

}

protected:

template <typename U>

429

void fill(U &&tensor, int i)

430

{

431

std::uniform_real_distribution<> distribution(-1.0f, 1.0f);

432

library->fill(tensor, distribution, i);

433

434

// Fill border with infinity in order to check the presence of NaN values (i.e. inf * 0)

435

std::uniform_real_distribution<> distribution_inf(std::numeric_limits<float>::infinity(), std::numeric_limits<float>::infinity());

436

library->fill_borders_with_garbage(tensor, distribution_inf, i);

437

}

438

439

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,

440

DataType data_type, float alpha, float beta, bool broadcast_bias, bool fp16_mixed_precision, const ActivationLayerInfo &act_info, GPUTarget gpu_arch)

441

{

442

// Create tensors

443

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

444

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

445

TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);

446

TensorType lhs_reshaped;

447

TensorType rhs_reshaped;

448

TensorType dst;

449

450

const unsigned int m = lhs_shape[1];

451

const unsigned int n = rhs_shape[0];

452

const unsigned int k = lhs_shape[0];

453

GEMMReshapeInfo reshape_info(m, n, k, rhs_info.h0, lhs_info.v0, 0, false, broadcast_bias);

454

455

// The output tensor will be auto-initialized within the function

456

457

// Create and configure function

458

ReshapeLHSFunctionType reshape_lhs;

459

ReshapeRHSFunctionType reshape_rhs;

460

GEMMFunctionType gemm;

461

reshape_lhs.configure(&lhs, &lhs_reshaped, lhs_info);

462

reshape_rhs.configure(&rhs, &rhs_reshaped, rhs_info);

463

gemm.configure(gpu_arch, &lhs_reshaped, &rhs_reshaped, &bias, &dst, alpha, beta, true, reshape_info, fp16_mixed_precision, act_info);

464

465

ARM_COMPUTE_EXPECT(lhs.info()->is_resizable(), framework::LogLevel::ERRORS);

466

ARM_COMPUTE_EXPECT(rhs.info()->is_resizable(), framework::LogLevel::ERRORS);

467

ARM_COMPUTE_EXPECT(bias.info()->is_resizable(), framework::LogLevel::ERRORS);

468

469

// Allocate tensors

470

lhs.allocator()->allocate();

471

rhs.allocator()->allocate();

472

lhs_reshaped.allocator()->allocate();

473

rhs_reshaped.allocator()->allocate();

474

bias.allocator()->allocate();

475

dst.allocator()->allocate();

476

477

ARM_COMPUTE_EXPECT(!lhs.info()->is_resizable(), framework::LogLevel::ERRORS);

478

ARM_COMPUTE_EXPECT(!rhs.info()->is_resizable(), framework::LogLevel::ERRORS);

479

ARM_COMPUTE_EXPECT(!bias.info()->is_resizable(), framework::LogLevel::ERRORS);

480

ARM_COMPUTE_EXPECT(!lhs_reshaped.info()->is_resizable(), framework::LogLevel::ERRORS);

481

ARM_COMPUTE_EXPECT(!rhs_reshaped.info()->is_resizable(), framework::LogLevel::ERRORS);

482

ARM_COMPUTE_EXPECT(!dst.info()->is_resizable(), framework::LogLevel::ERRORS);

483

484

// Fill tensors

485

fill(AccessorType(lhs), 0);

486

fill(AccessorType(rhs), 1);

487

fill(AccessorType(bias), 2);

// Compute GEMM

reshape_lhs.run();

reshape_rhs.run();

gemm.run();

return dst;

}

SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, DataType data_type, float alpha, float beta, bool broadcast_bias,

498

const ActivationLayerInfo &act_info)

499

{

500

TensorShape dst_shape = lhs_shape;

501

dst_shape[0] = rhs_shape[0];

502

dst_shape[1] = lhs_shape[1];

503

504

// Create reference

505

SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };

506

SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };

507

SimpleTensor<T> bias{ dst_shape, data_type, 1 };

508

509

const int n = rhs_shape[0];

510

const int m = lhs_shape[1];

511

const int batch_size = lhs_shape[2];

// Fill reference

fill(lhs, 0);

fill(rhs, 1);

fill(bias, 2);

if(broadcast_bias)

{

// In case of broadcast, we need simply copy the first into the following "M" ones

521

for(int i = 1; i < m * batch_size; i++)

522

{

523

memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));

}

}

return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);

528

}

529

530

TensorType _target{};

531

SimpleTensor<T> _reference{};

532

};

533

534

template <typename TensorType, typename AccessorType, typename T, typename ReshapeLHSFunctionType, typename ReshapeRHSFunctionType, typename GEMMFunctionType>

535

class GEMMMatrixMultiplyInterleavedTransposed3DValidationFixture : public framework::Fixture

536

{

537

public:

538

template <typename...>

539

void setup(unsigned int m_w, unsigned int m_h, unsigned int n, unsigned int k, unsigned int batch_size, float alpha, float beta, unsigned int v0, unsigned int h0, bool broadcast_bias,

540

bool fp16_mixed_precision, const ActivationLayerInfo &act_info, DataType data_type, GPUTarget gpu_arch)

541

{

542

GEMMLHSMatrixInfo lhs_info;

lhs_info.m0 = 4;

lhs_info.k0 = 4;

lhs_info.v0 = v0;

lhs_info.interleave = true;

547

lhs_info.transpose = true;

548

549

GEMMRHSMatrixInfo rhs_info;

550

rhs_info.n0 = 16 / sizeof(T);

551

rhs_info.k0 = 1;

552

rhs_info.h0 = h0;

553

rhs_info.interleave = false;

554

rhs_info.transpose = false;

555

556

// In case of GEMM3D, m is the product between m_w and m_h

557

const unsigned int m = m_w * m_h;

558

559

// Set the tensor shapes for LHS and RHS matrices

560

const TensorShape lhs_shape(k, m, batch_size);

561

const TensorShape rhs_shape(n, k, batch_size);

562

const TensorShape bias_shape(n, 1, 1);

563

564

_target = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, m_h, fp16_mixed_precision, act_info, gpu_arch);

565

_reference = compute_reference(lhs_shape, rhs_shape, bias_shape, data_type, alpha, beta, m_h, act_info);

}

protected:

template <typename U>

570

void fill(U &&tensor, int i)

571

{

572

std::uniform_real_distribution<> distribution(-1.0f, 1.0f);

573

library->fill(tensor, distribution, i);

574

}

575

576

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,

577

DataType data_type, float alpha, float beta, unsigned int m_h, bool fp16_mixed_precision, const ActivationLayerInfo &act_info, GPUTarget gpu_arch)

578

{

579

// Create tensors

580

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

581

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

582

TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);

583

TensorType lhs_reshaped;

584

TensorType rhs_reshaped;

585

TensorType dst;

586

587

const unsigned int m = lhs_shape[1];

588

const unsigned int n = rhs_shape[0];

589

const unsigned int k = lhs_shape[0];

590

GEMMReshapeInfo reshape_info(m, n, k, rhs_info.h0, lhs_info.v0, m_h, false, true);

591

592

// The output tensor will be auto-initialized within the function

593

594

// Create and configure function

595

ReshapeLHSFunctionType reshape_lhs;

596

ReshapeRHSFunctionType reshape_rhs;

597

GEMMFunctionType gemm;

598

reshape_lhs.configure(&lhs, &lhs_reshaped, lhs_info);

599

reshape_rhs.configure(&rhs, &rhs_reshaped, rhs_info);

600

gemm.configure(gpu_arch, &lhs_reshaped, &rhs_reshaped, &bias, &dst, alpha, beta, true, reshape_info, fp16_mixed_precision, act_info);

601

602

ARM_COMPUTE_EXPECT(lhs.info()->is_resizable(), framework::LogLevel::ERRORS);

603

ARM_COMPUTE_EXPECT(rhs.info()->is_resizable(), framework::LogLevel::ERRORS);

604

ARM_COMPUTE_EXPECT(bias.info()->is_resizable(), framework::LogLevel::ERRORS);

605

606

// Allocate tensors

607

lhs.allocator()->allocate();

608

rhs.allocator()->allocate();

609

lhs_reshaped.allocator()->allocate();

610

rhs_reshaped.allocator()->allocate();

611

bias.allocator()->allocate();

612

dst.allocator()->allocate();

613

614

ARM_COMPUTE_EXPECT(!lhs.info()->is_resizable(), framework::LogLevel::ERRORS);

615

ARM_COMPUTE_EXPECT(!rhs.info()->is_resizable(), framework::LogLevel::ERRORS);

616

ARM_COMPUTE_EXPECT(!lhs_reshaped.info()->is_resizable(), framework::LogLevel::ERRORS);

617

ARM_COMPUTE_EXPECT(!rhs_reshaped.info()->is_resizable(), framework::LogLevel::ERRORS);

618

ARM_COMPUTE_EXPECT(!bias.info()->is_resizable(), framework::LogLevel::ERRORS);

619

ARM_COMPUTE_EXPECT(!dst.info()->is_resizable(), framework::LogLevel::ERRORS);

620

621

// Fill tensors

622

fill(AccessorType(lhs), 0);

623

fill(AccessorType(rhs), 1);

624

fill(AccessorType(bias), 2);

// Compute GEMM

reshape_lhs.run();

reshape_rhs.run();

gemm.run();

return dst;

}

SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, DataType data_type, float alpha, float beta, unsigned int m_h,

635

const ActivationLayerInfo &act_info)

636

{

637

TensorShape dst_shape = lhs_shape;

638

dst_shape.set(0, rhs_shape[0]);

639

dst_shape.set(1, lhs_shape[1] / m_h);

640

dst_shape.set(2, m_h);

641

dst_shape.set(3, lhs_shape[2]);

642

643

// Create reference

644

SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };

645

SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };

646

SimpleTensor<T> bias{ dst_shape, data_type, 1 };

647

648

const int n = rhs_shape[0];

649

const int m = lhs_shape[1];

650

const int batch_size = lhs_shape[2];

// Fill reference

fill(lhs, 0);

fill(rhs, 1);

fill(bias, 2);

// In case of broadcast, we need simply copy the first into the following "M" ones

658

for(int i = 1; i < m * batch_size; i++)

659

{

660

memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));

661

}

662

663

return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);

664

}

665

666

TensorType _target{};

667

SimpleTensor<T> _reference{};

668

};

669

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

670

template <typename TensorType, typename AccessorType, typename T, typename ReshapeLHSFunctionType, typename ReshapeRHSFunctionType, typename GEMMFunctionType>

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

671

class GEMMMatrixMultiplyReshapedValidationFixture : public framework::Fixture

672

{

673

public:

674

template <typename...>

675

void setup(unsigned int m, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0, unsigned int v0, unsigned int h0, bool interleave_lhs,

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

676

bool interleave_rhs, DataType data_type, float alpha, float beta, bool broadcast_bias, const ActivationLayerInfo &act_info)

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

677

{

678

GEMMLHSMatrixInfo lhs_info;

lhs_info.m0 = m0;

lhs_info.k0 = k0;

lhs_info.v0 = v0;

lhs_info.interleave = interleave_lhs;

683

lhs_info.transpose = false;

684

685

GEMMRHSMatrixInfo rhs_info;

rhs_info.n0 = n0;

rhs_info.k0 = k0;

rhs_info.h0 = h0;

rhs_info.interleave = interleave_rhs;

690

rhs_info.transpose = true;

691

692

// Set the tensor shapes for LHS and RHS matrices

693

const TensorShape lhs_shape(k, m, batch_size);

694

const TensorShape rhs_shape(n, k, batch_size);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

695

const TensorShape bias_shape(n,

696

broadcast_bias ? 1 : m,

697

broadcast_bias ? 1 : batch_size);

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

698

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

699

_target = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, broadcast_bias, act_info);

700

_reference = compute_reference(lhs_shape, rhs_shape, bias_shape, data_type, alpha, beta, broadcast_bias, act_info);

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

}

protected:

template <typename U>

705

void fill(U &&tensor, int i)

706

{

707

std::uniform_real_distribution<> distribution(-1.0f, 1.0f);

708

library->fill(tensor, distribution, i);

Gian Marco Iodice

b87b95e

2019-01-21 17:14:31 +0000

[diff] [blame]

709

710

// Fill border with infinity in order to check the presence of NaN values (i.e. inf * 0)

711

std::uniform_real_distribution<> distribution_inf(std::numeric_limits<float>::infinity(), std::numeric_limits<float>::infinity());

712

library->fill_borders_with_garbage(tensor, distribution_inf, i);

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

713

}

714

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

715

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

716

DataType data_type, float alpha, float beta, bool broadcast_bias, const ActivationLayerInfo &act_info)

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

717

{

718

// Create tensors

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

719

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

720

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

721

TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

722

TensorType lhs_reshaped;

723

TensorType rhs_reshaped;

724

TensorType dst;

725

726

const unsigned int M = lhs_shape[1];

727

const unsigned int N = rhs_shape[0];

728

const unsigned int K = lhs_shape[0];

Gian Marco Iodice

2019-06-26 17:18:11 +0100

[diff] [blame]

729

GEMMKernelInfo kernel_info;

kernel_info.m = M;

kernel_info.n = N;

kernel_info.k = K;

kernel_info.depth_output_gemm3d = 0;

734

kernel_info.reinterpret_input_as_3d = false;

735

kernel_info.broadcast_bias = broadcast_bias;

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

736

kernel_info.activation_info = act_info;

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

737

738

// The output tensor will be auto-initialized within the function

739

740

// Create and configure function

741

ReshapeLHSFunctionType reshape_lhs;

742

ReshapeRHSFunctionType reshape_rhs;

743

GEMMFunctionType gemm;

744

reshape_lhs.configure(&lhs, &lhs_reshaped, lhs_info);

745

reshape_rhs.configure(&rhs, &rhs_reshaped, rhs_info);

Gian Marco Iodice

2019-06-26 17:18:11 +0100

[diff] [blame]

746

gemm.configure(&lhs_reshaped, &rhs_reshaped, &bias, &dst, alpha, beta, lhs_info, rhs_info, kernel_info);

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

747

748

ARM_COMPUTE_EXPECT(lhs.info()->is_resizable(), framework::LogLevel::ERRORS);

749

ARM_COMPUTE_EXPECT(rhs.info()->is_resizable(), framework::LogLevel::ERRORS);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

750

ARM_COMPUTE_EXPECT(bias.info()->is_resizable(), framework::LogLevel::ERRORS);

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

751

752

// Allocate tensors

753

lhs.allocator()->allocate();

754

rhs.allocator()->allocate();

755

lhs_reshaped.allocator()->allocate();

756

rhs_reshaped.allocator()->allocate();

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

757

bias.allocator()->allocate();

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

758

dst.allocator()->allocate();

759

760

ARM_COMPUTE_EXPECT(!lhs.info()->is_resizable(), framework::LogLevel::ERRORS);

761

ARM_COMPUTE_EXPECT(!rhs.info()->is_resizable(), framework::LogLevel::ERRORS);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

762

ARM_COMPUTE_EXPECT(!bias.info()->is_resizable(), framework::LogLevel::ERRORS);

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

763

ARM_COMPUTE_EXPECT(!lhs_reshaped.info()->is_resizable(), framework::LogLevel::ERRORS);

764

ARM_COMPUTE_EXPECT(!rhs_reshaped.info()->is_resizable(), framework::LogLevel::ERRORS);

765

ARM_COMPUTE_EXPECT(!dst.info()->is_resizable(), framework::LogLevel::ERRORS);

766

767

// Fill tensors

768

fill(AccessorType(lhs), 0);

769

fill(AccessorType(rhs), 1);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

770

fill(AccessorType(bias), 2);

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

// Compute GEMM

reshape_lhs.run();

reshape_rhs.run();

gemm.run();

return dst;

}

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

780

SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, DataType data_type, float alpha, float beta, bool broadcast_bias,

781

const ActivationLayerInfo &act_info)

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

782

{

783

TensorShape dst_shape = lhs_shape;

784

dst_shape[0] = rhs_shape[0];

785

dst_shape[1] = lhs_shape[1];

786

787

// Create reference

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

788

SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };

789

SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

790

SimpleTensor<T> bias{ dst_shape, data_type, 1 };

791

792

const int n = rhs_shape[0];

793

const int m = lhs_shape[1];

794

const int batch_size = lhs_shape[2];

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

// Fill reference

fill(lhs, 0);

fill(rhs, 1);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

799

fill(bias, 2);

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

800

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

801

if(broadcast_bias)

802

{

803

// In case of broadcast, we need simply copy the first into the following "M" ones

804

for(int i = 1; i < m * batch_size; i++)

805

{

806

memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));

}

}

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

810

return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

811

}

812

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

813

TensorType _target{};

814

SimpleTensor<T> _reference{};

815

};

816

817

template <typename TensorType, typename AccessorType, typename T, typename ReshapeLHSFunctionType, typename ReshapeRHSFunctionType, typename GEMMFunctionType>

818

class GEMMMatrixMultiplyReshaped3DValidationFixture : public framework::Fixture

819

{

820

public:

821

template <typename...>

822

void setup(unsigned int m_w, unsigned int m_h, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0, unsigned int v0, unsigned int h0,

823

bool interleave_lhs,

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

824

bool interleave_rhs, DataType data_type, float alpha, float beta, const ActivationLayerInfo &act_info)

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

825

{

826

GEMMLHSMatrixInfo lhs_info;

lhs_info.m0 = m0;

lhs_info.k0 = k0;

lhs_info.v0 = v0;

lhs_info.interleave = interleave_lhs;

831

lhs_info.transpose = false;

832

833

GEMMRHSMatrixInfo rhs_info;

rhs_info.n0 = n0;

rhs_info.k0 = k0;

rhs_info.h0 = h0;

rhs_info.interleave = interleave_rhs;

838

rhs_info.transpose = true;

839

840

// In case of GEMM3D, m is the product between m_w and m_h

841

const unsigned int m = m_w * m_h;

842

843

// Set the tensor shapes for LHS and RHS matrices

844

const TensorShape lhs_shape(k, m, batch_size);

845

const TensorShape rhs_shape(n, k, batch_size);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

846

const TensorShape bias_shape(n, 1, 1);

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

847

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

848

_target = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, m_h, act_info);

849

_reference = compute_reference(lhs_shape, rhs_shape, bias_shape, data_type, alpha, beta, m_h, act_info);

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

}

protected:

template <typename U>

854

void fill(U &&tensor, int i)

855

{

856

std::uniform_real_distribution<> distribution(-1.0f, 1.0f);

857

library->fill(tensor, distribution, i);

858

}

859

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

860

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

861

DataType data_type, float alpha, float beta, unsigned int m_h, const ActivationLayerInfo &act_info)

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

862

{

863

// Create tensors

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

864

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

865

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

866

TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

867

TensorType lhs_reshaped;

868

TensorType rhs_reshaped;

869

TensorType dst;

870

871

const unsigned int M = lhs_shape[1];

872

const unsigned int N = rhs_shape[0];

873

const unsigned int K = lhs_shape[0];

Gian Marco Iodice

2019-06-26 17:18:11 +0100

[diff] [blame]

874

GEMMKernelInfo kernel_info;

kernel_info.m = M;

kernel_info.n = N;

kernel_info.k = K;

kernel_info.depth_output_gemm3d = m_h;

879

kernel_info.reinterpret_input_as_3d = false;

880

kernel_info.broadcast_bias = true;

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

881

kernel_info.activation_info = act_info;

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

882

883

// The output tensor will be auto-initialized within the function

884

885

// Create and configure function

886

ReshapeLHSFunctionType reshape_lhs;

887

ReshapeRHSFunctionType reshape_rhs;

888

GEMMFunctionType gemm;

889

reshape_lhs.configure(&lhs, &lhs_reshaped, lhs_info);

890

reshape_rhs.configure(&rhs, &rhs_reshaped, rhs_info);

Gian Marco Iodice

2019-06-26 17:18:11 +0100

[diff] [blame]

891

gemm.configure(&lhs_reshaped, &rhs_reshaped, &bias, &dst, alpha, beta, lhs_info, rhs_info, kernel_info);

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

892

893

ARM_COMPUTE_EXPECT(lhs.info()->is_resizable(), framework::LogLevel::ERRORS);

894

ARM_COMPUTE_EXPECT(rhs.info()->is_resizable(), framework::LogLevel::ERRORS);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

895

ARM_COMPUTE_EXPECT(bias.info()->is_resizable(), framework::LogLevel::ERRORS);

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

896

897

// Allocate tensors

898

lhs.allocator()->allocate();

899

rhs.allocator()->allocate();

900

lhs_reshaped.allocator()->allocate();

901

rhs_reshaped.allocator()->allocate();

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

902

bias.allocator()->allocate();

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

903

dst.allocator()->allocate();

904

905

ARM_COMPUTE_EXPECT(!lhs.info()->is_resizable(), framework::LogLevel::ERRORS);

906

ARM_COMPUTE_EXPECT(!rhs.info()->is_resizable(), framework::LogLevel::ERRORS);

907

ARM_COMPUTE_EXPECT(!lhs_reshaped.info()->is_resizable(), framework::LogLevel::ERRORS);

908

ARM_COMPUTE_EXPECT(!rhs_reshaped.info()->is_resizable(), framework::LogLevel::ERRORS);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

909

ARM_COMPUTE_EXPECT(!bias.info()->is_resizable(), framework::LogLevel::ERRORS);

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

910

ARM_COMPUTE_EXPECT(!dst.info()->is_resizable(), framework::LogLevel::ERRORS);

911

912

// Fill tensors

913

fill(AccessorType(lhs), 0);

914

fill(AccessorType(rhs), 1);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

915

fill(AccessorType(bias), 2);

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

// Compute GEMM

reshape_lhs.run();

reshape_rhs.run();

gemm.run();

return dst;

}

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

925

SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, DataType data_type, float alpha, float beta, unsigned int m_h,

926

const ActivationLayerInfo &act_info)

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

927

{

928

TensorShape dst_shape = lhs_shape;

929

dst_shape.set(0, rhs_shape[0]);

930

dst_shape.set(1, lhs_shape[1] / m_h);

931

dst_shape.set(2, m_h);

932

dst_shape.set(3, lhs_shape[2]);

933

934

// Create reference

935

SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };

936

SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

937

SimpleTensor<T> bias{ dst_shape, data_type, 1 };

938

939

const int n = rhs_shape[0];

940

const int m = lhs_shape[1];

941

const int batch_size = lhs_shape[2];

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

// Fill reference

fill(lhs, 0);

fill(rhs, 1);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

946

fill(bias, 2);

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

947

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

948

// In case of broadcast, we need simply copy the first into the following "M" ones

949

for(int i = 1; i < m * batch_size; i++)

950

{

951

memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));

952

}

953

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

954

return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

955

}

956

957

TensorType _target{};

958

SimpleTensor<T> _reference{};

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

959

};

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

960

961

template <typename TensorType, typename AccessorType, typename T, typename ReshapeRHSFunctionType, typename GEMMFunctionType>

962

class GEMMMatrixMultiplyReshapedOnlyRHSValidationFixture : public framework::Fixture

963

{

964

public:

965

template <typename...>

966

void setup(unsigned int m, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0, unsigned int h0,

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

967

bool interleave_rhs, bool transpose_rhs, DataType data_type, float alpha, float beta, bool broadcast_bias, const ActivationLayerInfo &act_info)

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

968

{

969

GEMMLHSMatrixInfo lhs_info;

lhs_info.m0 = m0;

lhs_info.k0 = k0;

GEMMRHSMatrixInfo rhs_info;

rhs_info.n0 = n0;

rhs_info.k0 = k0;

rhs_info.h0 = h0;

rhs_info.interleave = interleave_rhs;

978

rhs_info.transpose = transpose_rhs;

979

980

// Set the tensor shapes for LHS and RHS matrices

981

const TensorShape lhs_shape(k, m, batch_size);

982

const TensorShape rhs_shape(n, k, batch_size);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

983

const TensorShape bias_shape(n,

984

broadcast_bias ? 1 : m,

985

broadcast_bias ? 1 : batch_size);

Georgios Pinitas

2019-05-21 13:32:43 +0100

[diff] [blame]

986

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

987

_target = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, broadcast_bias, act_info);

988

_reference = compute_reference(lhs_shape, rhs_shape, bias_shape, data_type, alpha, beta, broadcast_bias, act_info);

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

}

protected:

template <typename U>

993

void fill(U &&tensor, int i)

994

{

995

std::uniform_real_distribution<> distribution(-1.0f, 1.0f);

996

library->fill(tensor, distribution, i);

997

998

// Fill border with infinity in order to check the presence of NaN values (i.e. inf * 0)

999

std::uniform_real_distribution<> distribution_inf(std::numeric_limits<float>::infinity(), std::numeric_limits<float>::infinity());

1000

library->fill_borders_with_garbage(tensor, distribution_inf, i);

1001

}

1002

Georgios Pinitas

2019-05-21 13:32:43 +0100

[diff] [blame]

1003

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1004

DataType data_type, float alpha, float beta, bool broadcast_bias, const ActivationLayerInfo &act_info)

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1005

{

1006

// Create tensors

Georgios Pinitas

2019-05-21 13:32:43 +0100

[diff] [blame]

1007

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

1008

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

1009

TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1010

TensorType rhs_reshaped;

1011

TensorType dst;

1012

1013

const unsigned int M = lhs_shape[1];

1014

const unsigned int N = rhs_shape[0];

1015

const unsigned int K = lhs_shape[0];

Gian Marco Iodice

2019-06-26 17:18:11 +0100

[diff] [blame]

1016

GEMMKernelInfo kernel_info;

kernel_info.m = M;

kernel_info.n = N;

kernel_info.k = K;

kernel_info.depth_output_gemm3d = 0;

1021

kernel_info.reinterpret_input_as_3d = false;

1022

kernel_info.broadcast_bias = broadcast_bias;

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1023

kernel_info.activation_info = act_info;

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1024

1025

// The output tensor will be auto-initialized within the function

1026

1027

// Create and configure function

1028

ReshapeRHSFunctionType reshape_rhs;

1029

GEMMFunctionType gemm;

1030

reshape_rhs.configure(&rhs, &rhs_reshaped, rhs_info);

Gian Marco Iodice

2019-06-26 17:18:11 +0100

[diff] [blame]

1031

gemm.configure(&lhs, &rhs_reshaped, &bias, &dst, alpha, beta, lhs_info, rhs_info, kernel_info);

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1032

1033

ARM_COMPUTE_EXPECT(lhs.info()->is_resizable(), framework::LogLevel::ERRORS);

1034

ARM_COMPUTE_EXPECT(rhs.info()->is_resizable(), framework::LogLevel::ERRORS);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1035

ARM_COMPUTE_EXPECT(bias.info()->is_resizable(), framework::LogLevel::ERRORS);

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1036

1037

// Allocate tensors

1038

lhs.allocator()->allocate();

1039

rhs.allocator()->allocate();

1040

rhs_reshaped.allocator()->allocate();

Georgios Pinitas

2019-05-21 13:32:43 +0100

[diff] [blame]

1041

bias.allocator()->allocate();

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1042

dst.allocator()->allocate();

1043

1044

ARM_COMPUTE_EXPECT(!lhs.info()->is_resizable(), framework::LogLevel::ERRORS);

1045

ARM_COMPUTE_EXPECT(!rhs.info()->is_resizable(), framework::LogLevel::ERRORS);

1046

ARM_COMPUTE_EXPECT(!rhs_reshaped.info()->is_resizable(), framework::LogLevel::ERRORS);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1047

ARM_COMPUTE_EXPECT(!bias.info()->is_resizable(), framework::LogLevel::ERRORS);

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1048

ARM_COMPUTE_EXPECT(!dst.info()->is_resizable(), framework::LogLevel::ERRORS);

1049

1050

// Fill tensors

1051

fill(AccessorType(lhs), 0);

1052

fill(AccessorType(rhs), 1);

Georgios Pinitas

2019-05-21 13:32:43 +0100

[diff] [blame]

1053

fill(AccessorType(bias), 2);

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

// Compute GEMM

reshape_rhs.run();

gemm.run();

return dst;

}

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1062

SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, DataType data_type, float alpha, float beta, bool broadcast_bias,

1063

const ActivationLayerInfo &act_info)

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1064

{

1065

TensorShape dst_shape = lhs_shape;

1066

dst_shape[0] = rhs_shape[0];

1067

dst_shape[1] = lhs_shape[1];

1068

1069

// Create reference

1070

SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };

1071

SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };

Georgios Pinitas

2019-05-21 13:32:43 +0100

[diff] [blame]

1072

SimpleTensor<T> bias{ dst_shape, data_type, 1 };

1073

1074

const int n = rhs_shape[0];

1075

const int m = lhs_shape[1];

1076

const int batch_size = lhs_shape[2];

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

// Fill reference

fill(lhs, 0);

fill(rhs, 1);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1081

fill(bias, 2);

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1082

Georgios Pinitas

2019-05-21 13:32:43 +0100

[diff] [blame]

1083

if(broadcast_bias)

1084

{

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1085

// In case of broadcast, we need simply copy the first into the following "M" ones

1086

for(int i = 1; i < m * batch_size; i++)

Georgios Pinitas

2019-05-21 13:32:43 +0100

[diff] [blame]

1087

{

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1088

memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));

Georgios Pinitas

2019-05-21 13:32:43 +0100

[diff] [blame]

1089

}

1090

}

Georgios Pinitas

2019-05-21 13:32:43 +0100

[diff] [blame]

1091

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1092

return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1093

}

1094

1095

TensorType _target{};

1096

SimpleTensor<T> _reference{};

1097

};

1098

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1099

template <typename TensorType, typename AccessorType, typename T, typename ReshapeRHSFunctionType, typename GEMMFunctionType>

1100

class GEMMMatrixMultiplyReshapedOnlyRHS3DValidationFixture : public framework::Fixture

1101

{

1102

public:

1103

template <typename...>

1104

void setup(unsigned int m_w, unsigned int m_h, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0, unsigned int h0,

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1105

bool interleave_rhs, bool transpose_rhs, DataType data_type, float alpha, float beta, const ActivationLayerInfo &act_info)

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1106

{

1107

GEMMLHSMatrixInfo lhs_info;

lhs_info.m0 = m0;

lhs_info.k0 = k0;

GEMMRHSMatrixInfo rhs_info;

rhs_info.n0 = n0;

rhs_info.k0 = k0;

rhs_info.h0 = h0;

rhs_info.interleave = interleave_rhs;

1116

rhs_info.transpose = transpose_rhs;

1117

1118

// In case of GEMM3D, m is the product between m_w and m_h

1119

const unsigned int m = m_w * m_h;

1120

1121

// Set the tensor shapes for LHS and RHS matrices

1122

const TensorShape lhs_shape(k, m, batch_size);

1123

const TensorShape rhs_shape(n, k, batch_size);

1124

const TensorShape bias_shape(n, 1, 1);

1125

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1126

_target = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, m_h, act_info);

1127

_reference = compute_reference(lhs_shape, rhs_shape, bias_shape, data_type, alpha, beta, m_h, act_info);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

}

protected:

template <typename U>

1132

void fill(U &&tensor, int i)

1133

{

1134

std::uniform_real_distribution<> distribution(-1.0f, 1.0f);

1135

library->fill(tensor, distribution, i);

1136

}

1137

1138

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,

1139

DataType data_type, float alpha, float beta,

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1140

unsigned int m_h, const ActivationLayerInfo &act_info)

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1141

{

1142

// Create tensors

1143

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

1144

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

1145

TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);

1146

TensorType rhs_reshaped;

1147

TensorType dst;

1148

1149

const unsigned int M = lhs_shape[1];

1150

const unsigned int N = rhs_shape[0];

1151

const unsigned int K = lhs_shape[0];

Gian Marco Iodice

2019-06-26 17:18:11 +0100

[diff] [blame]

1152

GEMMKernelInfo kernel_info;

kernel_info.m = M;

kernel_info.n = N;

kernel_info.k = K;

kernel_info.depth_output_gemm3d = m_h;

1157

kernel_info.reinterpret_input_as_3d = false;

1158

kernel_info.broadcast_bias = true;

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1159

kernel_info.activation_info = act_info;

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1160

1161

// The output tensor will be auto-initialized within the function

1162

1163

// Create and configure function

1164

ReshapeRHSFunctionType reshape_rhs;

1165

GEMMFunctionType gemm;

1166

reshape_rhs.configure(&rhs, &rhs_reshaped, rhs_info);

Gian Marco Iodice

2019-06-26 17:18:11 +0100

[diff] [blame]

1167

gemm.configure(&lhs, &rhs_reshaped, &bias, &dst, alpha, beta, lhs_info, rhs_info, kernel_info);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1168

1169

ARM_COMPUTE_EXPECT(lhs.info()->is_resizable(), framework::LogLevel::ERRORS);

1170

ARM_COMPUTE_EXPECT(rhs.info()->is_resizable(), framework::LogLevel::ERRORS);

1171

ARM_COMPUTE_EXPECT(bias.info()->is_resizable(), framework::LogLevel::ERRORS);

1172

1173

// Allocate tensors

1174

lhs.allocator()->allocate();

1175

rhs.allocator()->allocate();

1176

rhs_reshaped.allocator()->allocate();

1177

bias.allocator()->allocate();

1178

dst.allocator()->allocate();

1179

1180

ARM_COMPUTE_EXPECT(!lhs.info()->is_resizable(), framework::LogLevel::ERRORS);

1181

ARM_COMPUTE_EXPECT(!rhs.info()->is_resizable(), framework::LogLevel::ERRORS);

1182

ARM_COMPUTE_EXPECT(!rhs_reshaped.info()->is_resizable(), framework::LogLevel::ERRORS);

1183

ARM_COMPUTE_EXPECT(!bias.info()->is_resizable(), framework::LogLevel::ERRORS);

1184

ARM_COMPUTE_EXPECT(!dst.info()->is_resizable(), framework::LogLevel::ERRORS);

1185

1186

// Fill tensors

1187

fill(AccessorType(lhs), 0);

1188

fill(AccessorType(rhs), 1);

1189

fill(AccessorType(bias), 2);

// Compute GEMM

reshape_rhs.run();

gemm.run();

return dst;

}

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1198

SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, DataType data_type, float alpha, float beta, unsigned int m_h,

1199

const ActivationLayerInfo &act_info)

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1200

{

1201

TensorShape dst_shape = lhs_shape;

1202

dst_shape.set(0, rhs_shape[0]);

1203

dst_shape.set(1, lhs_shape[1] / m_h);

1204

dst_shape.set(2, m_h);

1205

dst_shape.set(3, lhs_shape[2]);

1206

1207

// Create reference

1208

SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };

1209

SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };

1210

SimpleTensor<T> bias{ dst_shape, data_type, 1 };

1211

1212

const int n = rhs_shape[0];

1213

const int m = lhs_shape[1];

1214

const int batch_size = lhs_shape[2];

// Fill reference

fill(lhs, 0);

fill(rhs, 1);

fill(bias, 2);

// In case of broadcast, we need simply copy the first into the following "M" ones

1222

for(int i = 1; i < m * batch_size; i++)

1223

{

1224

memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));

1225

}

1226

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1227

return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1228

}

1229

1230

TensorType _target{};

1231

SimpleTensor<T> _reference{};

1232

};

1233

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1234

template <typename TensorType, typename AccessorType, typename T, typename GEMMFunctionType>

1235

class GEMMMatrixMultiplyNativeValidationFixture : public framework::Fixture

1236

{

1237

public:

1238

template <typename...>

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1239

void setup(unsigned int m, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0, DataType data_type, float alpha, float beta, bool broadcast_bias,

1240

const ActivationLayerInfo &act_info)

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1241

{

1242

GEMMLHSMatrixInfo lhs_info;

lhs_info.m0 = m0;

lhs_info.k0 = k0;

GEMMRHSMatrixInfo rhs_info;

rhs_info.n0 = n0;

rhs_info.k0 = k0;

// Set the tensor shapes for LHS and RHS matrices

1251

const TensorShape lhs_shape(k, m, batch_size);

1252

const TensorShape rhs_shape(n, k, batch_size);

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

1253

const TensorShape bias_shape(n,

1254

broadcast_bias ? 1 : m,

1255

broadcast_bias ? 1 : batch_size);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1256

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1257

_target = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, broadcast_bias, act_info);

1258

_reference = compute_reference(lhs_shape, rhs_shape, bias_shape, data_type, alpha, beta, broadcast_bias, act_info);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

}

protected:

template <typename U>

1263

void fill(U &&tensor, int i)

1264

{

1265

std::uniform_real_distribution<> distribution(-1.0f, 1.0f);

1266

library->fill(tensor, distribution, i);

1267

1268

// Fill border with infinity in order to check the presence of NaN values (i.e. inf * 0)

1269

std::uniform_real_distribution<> distribution_inf(std::numeric_limits<float>::infinity(), std::numeric_limits<float>::infinity());

1270

library->fill_borders_with_garbage(tensor, distribution_inf, i);

1271

}

1272

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

1273

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1274

DataType data_type, float alpha, float beta, bool broadcast_bias, const ActivationLayerInfo &act_info)

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1275

{

1276

// Create tensors

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

1277

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

1278

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

1279

TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1280

TensorType dst;

1281

1282

const unsigned int M = lhs_shape[1];

1283

const unsigned int N = rhs_shape[0];

1284

const unsigned int K = lhs_shape[0];

Gian Marco Iodice

2019-06-26 17:18:11 +0100

[diff] [blame]

1285

GEMMKernelInfo kernel_info;

kernel_info.m = M;

kernel_info.n = N;

kernel_info.k = K;

kernel_info.depth_output_gemm3d = 0;

1290

kernel_info.reinterpret_input_as_3d = false;

1291

kernel_info.broadcast_bias = broadcast_bias;

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1292

kernel_info.activation_info = act_info;

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1293

1294

// Create and configure function

1295

GEMMFunctionType gemm;

Gian Marco Iodice

2019-06-26 17:18:11 +0100

[diff] [blame]

1296

gemm.configure(&lhs, &rhs, &bias, &dst, alpha, beta, lhs_info, rhs_info, kernel_info);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1297

1298

ARM_COMPUTE_EXPECT(lhs.info()->is_resizable(), framework::LogLevel::ERRORS);

1299

ARM_COMPUTE_EXPECT(rhs.info()->is_resizable(), framework::LogLevel::ERRORS);

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

1300

ARM_COMPUTE_EXPECT(bias.info()->is_resizable(), framework::LogLevel::ERRORS);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1301

1302

// Allocate tensors

1303

lhs.allocator()->allocate();

1304

rhs.allocator()->allocate();

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

1305

bias.allocator()->allocate();

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1306

dst.allocator()->allocate();

1307

1308

ARM_COMPUTE_EXPECT(!lhs.info()->is_resizable(), framework::LogLevel::ERRORS);

1309

ARM_COMPUTE_EXPECT(!rhs.info()->is_resizable(), framework::LogLevel::ERRORS);

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

1310

ARM_COMPUTE_EXPECT(!bias.info()->is_resizable(), framework::LogLevel::ERRORS);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1311

ARM_COMPUTE_EXPECT(!dst.info()->is_resizable(), framework::LogLevel::ERRORS);

1312

1313

// Fill tensors

1314

fill(AccessorType(lhs), 0);

1315

fill(AccessorType(rhs), 1);

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

1316

fill(AccessorType(bias), 2);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

// Compute GEMM

gemm.run();

return dst;

}

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1324

SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, DataType data_type, float alpha, float beta, bool broadcast_bias,

1325

const ActivationLayerInfo &act_info)

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1326

{

1327

TensorShape dst_shape = lhs_shape;

1328

dst_shape[0] = rhs_shape[0];

1329

dst_shape[1] = lhs_shape[1];

1330

1331

// Create reference

1332

SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };

1333

SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

1334

SimpleTensor<T> bias{ dst_shape, data_type, 1 };

1335

1336

const int n = rhs_shape[0];

1337

const int m = lhs_shape[1];

1338

const int batch_size = lhs_shape[2];

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

// Fill reference

fill(lhs, 0);

fill(rhs, 1);

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

1343

fill(bias, 2);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1344

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

1345

if(broadcast_bias)

1346

{

1347

// In case of broadcast, we need simply copy the first into the following "M" ones

1348

for(int i = 1; i < m * batch_size; i++)

1349

{

1350

memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));

}

}

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1354

return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1355

}

1356

1357

TensorType _target{};

1358

SimpleTensor<T> _reference{};

1359

};

1360

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1361

template <typename TensorType, typename AccessorType, typename T, typename GEMMFunctionType>

1362

class GEMMMatrixMultiplyNative3DValidationFixture : public framework::Fixture

1363

{

1364

public:

1365

template <typename...>

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1366

void setup(unsigned int m_w, unsigned int m_h, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0, DataType data_type, float alpha, float beta,

1367

const ActivationLayerInfo &act_info)

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1368

{

1369

GEMMLHSMatrixInfo lhs_info;

lhs_info.m0 = m0;

lhs_info.k0 = k0;

GEMMRHSMatrixInfo rhs_info;

rhs_info.n0 = n0;

rhs_info.k0 = k0;

// In case of GEMM3D, m is the product between m_w and m_h

1378

const unsigned int m = m_w * m_h;

1379

1380

// Set the tensor shapes for LHS and RHS matrices

1381

const TensorShape lhs_shape(k, m, batch_size);

1382

const TensorShape rhs_shape(n, k, batch_size);

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

1383

const TensorShape bias_shape(n, 1, 1);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1384

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1385

_target = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, m_h, act_info);

1386

_reference = compute_reference(lhs_shape, rhs_shape, bias_shape, data_type, alpha, beta, m_h, act_info);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

}

protected:

template <typename U>

1391

void fill(U &&tensor, int i)

1392

{

1393

std::uniform_real_distribution<> distribution(-1.0f, 1.0f);

1394

library->fill(tensor, distribution, i);

1395

}

1396

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

1397

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1398

DataType data_type, float alpha, float beta, unsigned int m_h, const ActivationLayerInfo &act_info)

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1399

{

1400

// Create tensors

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

1401

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

1402

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

1403

TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1404

TensorType dst;

1405

1406

const unsigned int M = lhs_shape[1];

1407

const unsigned int N = rhs_shape[0];

1408

const unsigned int K = lhs_shape[0];

Gian Marco Iodice

2019-06-26 17:18:11 +0100

[diff] [blame]

1409

GEMMKernelInfo kernel_info;

kernel_info.m = M;

kernel_info.n = N;

kernel_info.k = K;

kernel_info.depth_output_gemm3d = m_h;

1414

kernel_info.reinterpret_input_as_3d = false;

1415

kernel_info.broadcast_bias = true;

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1416

kernel_info.activation_info = act_info;

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1417

1418

// The output tensor will be auto-initialized within the function

1419

1420

// Create and configure function

1421

GEMMFunctionType gemm;

Gian Marco Iodice

2019-06-26 17:18:11 +0100

[diff] [blame]

1422

gemm.configure(&lhs, &rhs, &bias, &dst, alpha, beta, lhs_info, rhs_info, kernel_info);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1423

1424

ARM_COMPUTE_EXPECT(lhs.info()->is_resizable(), framework::LogLevel::ERRORS);

1425

ARM_COMPUTE_EXPECT(rhs.info()->is_resizable(), framework::LogLevel::ERRORS);

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

1426

ARM_COMPUTE_EXPECT(bias.info()->is_resizable(), framework::LogLevel::ERRORS);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1427

1428

// Allocate tensors

1429

lhs.allocator()->allocate();

1430

rhs.allocator()->allocate();

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

1431

bias.allocator()->allocate();

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1432

dst.allocator()->allocate();

1433

1434

ARM_COMPUTE_EXPECT(!lhs.info()->is_resizable(), framework::LogLevel::ERRORS);

1435

ARM_COMPUTE_EXPECT(!rhs.info()->is_resizable(), framework::LogLevel::ERRORS);

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

1436

ARM_COMPUTE_EXPECT(!bias.info()->is_resizable(), framework::LogLevel::ERRORS);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1437

ARM_COMPUTE_EXPECT(!dst.info()->is_resizable(), framework::LogLevel::ERRORS);

1438

1439

// Fill tensors

1440

fill(AccessorType(lhs), 0);

1441

fill(AccessorType(rhs), 1);

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

1442

fill(AccessorType(bias), 2);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

// Compute GEMM

gemm.run();

return dst;

}

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1450

SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, DataType data_type, float alpha, float beta, unsigned int m_h,

1451

const ActivationLayerInfo &act_info)

giuros01