Blame - tests/validation/fixtures/GEMMFixture.h - ml/ComputeLibrary

2018-07-26 11:44:03 +0100

[diff] [blame]

48

class GEMMValidationFixture : public framework::Fixture

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

49

{

50

public:

51

template <typename...>

Pablo Tello

2018-10-30 11:18:37 +0000

[diff] [blame]

52

void setup(TensorShape shape_a, TensorShape shape_b, TensorShape shape_c, TensorShape output_shape, float alpha, float beta, bool pretranspose, DataType data_type)

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

53

{

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame^]

54

ARM_COMPUTE_UNUSED(pretranspose);

55

_target = compute_target(shape_a, shape_b, shape_c, output_shape, alpha, beta, data_type);

56

_reference = compute_reference(shape_a, shape_b, output_shape, alpha, beta, data_type);

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

}

protected:

template <typename U>

Pablo Tello

2018-10-30 11:18:37 +0000

[diff] [blame]

61

void fill(U &&tensor, int i, float lo = -1.f, float hi = 1.f)

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

62

{

63

switch(tensor.data_type())

{

case DataType::F16:

case DataType::F32:

{

Pablo Tello

2018-10-30 11:18:37 +0000

[diff] [blame]

68

std::uniform_real_distribution<> distribution(lo, hi);

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

69

library->fill(tensor, distribution, i);

break;

}

default:

library->fill_tensor_uniform(tensor, i);

}

}

TensorType compute_target(const TensorShape &shape_a, const TensorShape &shape_b, const TensorShape &shape_c, const TensorShape &output_shape, float alpha, float beta,

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame^]

78

DataType data_type)

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

79

{

80

// Create tensors

Vidhya Sudhan Loganathan

014333d

2018-07-02 09:13:49 +0100

[diff] [blame]

81

TensorType a = create_tensor<TensorType>(shape_a, data_type, 1);

82

TensorType b = create_tensor<TensorType>(shape_b, data_type, 1);

83

TensorType c = create_tensor<TensorType>(shape_c, data_type, 1);

84

TensorType dst = create_tensor<TensorType>(output_shape, data_type, 1);

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

85

86

// Create and configure function

87

FunctionType gemm;

Isabella Gottardi

8e74f44

2018-03-01 16:42:00 +0000

[diff] [blame]

88

// The GEMMinfo includes the values of the depth in case of reinterpreted 3d output.

Gian Marco Iodice

3139f03

2018-11-05 14:26:32 +0000

[diff] [blame]

89

// If the output shape has the same number of dimensions of the input the method called is a 2D matrix multiplication (depth_output_reinterpreted_as_3D = 0),

Isabella Gottardi

8e74f44

2018-03-01 16:42:00 +0000

[diff] [blame]

90

// in the other case we have to use the reinterpreted version of GEMM (depth_output_reinterpreted_as_3D = depth of the 3D output).

Gian Marco Iodice

2019-07-29 14:27:16 +0100

[diff] [blame]

91

gemm.configure(&a,

92

&b,

93

(disable_c) ? nullptr : &c,

94

&dst,

95

alpha, beta,

96

GEMMInfo(false, false, false, (reinterpret_output_as_3d ? output_shape[2] : 0), reinterpret_input_as_3d, false, GEMMLowpOutputStageInfo(), false, (reinterpret_input_as_3d

97

|| reinterpret_output_as_3d)));

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

98

ARM_COMPUTE_EXPECT(a.info()->is_resizable(), framework::LogLevel::ERRORS);

99

ARM_COMPUTE_EXPECT(b.info()->is_resizable(), framework::LogLevel::ERRORS);

100

ARM_COMPUTE_EXPECT(c.info()->is_resizable(), framework::LogLevel::ERRORS);

101

ARM_COMPUTE_EXPECT(dst.info()->is_resizable(), framework::LogLevel::ERRORS);

102

103

// Allocate tensors

104

a.allocator()->allocate();

105

b.allocator()->allocate();

106

c.allocator()->allocate();

107

dst.allocator()->allocate();

108

109

ARM_COMPUTE_EXPECT(!a.info()->is_resizable(), framework::LogLevel::ERRORS);

110

ARM_COMPUTE_EXPECT(!b.info()->is_resizable(), framework::LogLevel::ERRORS);

111

ARM_COMPUTE_EXPECT(!c.info()->is_resizable(), framework::LogLevel::ERRORS);

112

ARM_COMPUTE_EXPECT(!dst.info()->is_resizable(), framework::LogLevel::ERRORS);

113

114

// Fill tensors

115

fill(AccessorType(a), 0);

116

fill(AccessorType(b), 1);

Pablo Tello

2018-10-30 11:18:37 +0000

[diff] [blame]

117

if(!disable_c)

118

{

119

fill(AccessorType(c), 2);

120

}

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

121

122

// Compute GEMM function

gemm.run();

return dst;

}

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame^]

128

SimpleTensor<T> compute_reference(const TensorShape &shape_a, const TensorShape &shape_b, const TensorShape &output_shape, float alpha, float beta,

Vidhya Sudhan Loganathan

014333d

2018-07-02 09:13:49 +0100

[diff] [blame]

129

DataType data_type)

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

130

{

Gian Marco Iodice

2018-07-26 11:44:03 +0100

[diff] [blame]

131

TensorShape shape_a_to_use = shape_a;

Gian Marco Iodice

2019-07-29 14:27:16 +0100

[diff] [blame]

132

Gian Marco Iodice

2018-07-26 11:44:03 +0100

[diff] [blame]

133

if(reinterpret_input_as_3d)

134

{

135

// Collapse the second and third dimension if the input is 3D

136

shape_a_to_use.collapse(2U, 1U);

137

}

138

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

139

// Create reference

Gian Marco Iodice

2018-07-26 11:44:03 +0100

[diff] [blame]

140

SimpleTensor<T> a{ shape_a_to_use, data_type, 1 };

Vidhya Sudhan Loganathan

014333d

2018-07-02 09:13:49 +0100

[diff] [blame]

141

SimpleTensor<T> b{ shape_b, data_type, 1 };

Gian Marco Iodice

2019-07-29 14:27:16 +0100

[diff] [blame]

142

SimpleTensor<T> c{ output_shape, data_type, 1 };

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

// Fill reference

fill(a, 0);

fill(b, 1);

Gian Marco Iodice

2019-07-29 14:27:16 +0100

[diff] [blame]

147

fill(c, 2);

148

149

if(reinterpret_input_as_3d || reinterpret_output_as_3d)

Pablo Tello

2018-10-30 11:18:37 +0000

[diff] [blame]

150

{

Gian Marco Iodice

2019-07-29 14:27:16 +0100

[diff] [blame]

151

const int n = shape_b[0];

152

const int m = reinterpret_output_as_3d ? output_shape[1] * output_shape[2] : output_shape[1];

153

const int batch_size = reinterpret_output_as_3d ? output_shape[3] : output_shape[2];

154

155

// In case of broadcast, we need simply copy the first into the following "M" ones

156

for(int i = 1; i < m * batch_size; i++)

157

{

158

memcpy(c.data() + i * n, c.data(), n * sizeof(T));

159

}

Pablo Tello

2018-10-30 11:18:37 +0000

[diff] [blame]

160

}

Gian Marco Iodice

2019-07-29 14:27:16 +0100

[diff] [blame]

161

162

// Setting beta to 0 will effectively disable C for the

163

// computation of the reference: alpha * A * B + 0 * C

164

return reference::gemm<T>(a, b, c, alpha, disable_c ? 0.f : beta);

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

165

}

166

167

TensorType _target{};

168

SimpleTensor<T> _reference{};

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

169

};

170

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

171

template <typename TensorType, typename AccessorType, typename T, typename GEMMFunctionType>

172

class GEMMMatrixMultiplyValidationFixture : public framework::Fixture

173

{

174

public:

175

template <typename...>

176

void setup(unsigned int m, unsigned int n, unsigned int k, unsigned int batch_size, float alpha, float beta, bool broadcast_bias, bool fp16_mixed_precision, const ActivationLayerInfo &act_info,

177

DataType data_type, GPUTarget gpu_arch)

178

{

179

// Set the tensor shapes for LHS and RHS matrices

180

const TensorShape lhs_shape(k, m, batch_size);

181

const TensorShape rhs_shape(n, k, batch_size);

182

const TensorShape bias_shape(n,

183

broadcast_bias ? 1 : m,

184

broadcast_bias ? 1 : batch_size);

185

186

_target = compute_target(lhs_shape, rhs_shape, bias_shape, data_type, alpha, beta, broadcast_bias, fp16_mixed_precision, act_info, gpu_arch);

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame^]

187

_reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, broadcast_bias, act_info);

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

}

protected:

template <typename U>

192

void fill(U &&tensor, int i)

193

{

194

std::uniform_real_distribution<> distribution(-1.0f, 1.0f);

195

library->fill(tensor, distribution, i);

196

197

// Fill border with infinity in order to check the presence of NaN values (i.e. inf * 0)

198

std::uniform_real_distribution<> distribution_inf(std::numeric_limits<float>::infinity(), std::numeric_limits<float>::infinity());

199

library->fill_borders_with_garbage(tensor, distribution_inf, i);

200

}

201

202

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, DataType data_type, float alpha, float beta, bool broadcast_bias,

203

bool fp16_mixed_precision, const ActivationLayerInfo &act_info, GPUTarget gpu_arch)

204

{

205

// Create tensors

206

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

207

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

208

TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);

209

TensorType dst;

210

211

const unsigned int m = lhs_shape[1];

212

const unsigned int n = rhs_shape[0];

213

const unsigned int k = lhs_shape[0];

214

GEMMReshapeInfo reshape_info(m, n, k, 1, 1, 0, false, broadcast_bias);

215

216

// The output tensor will be auto-initialized within the function

217

218

// Create and configure function

219

GEMMFunctionType gemm;

220

gemm.configure(gpu_arch, &lhs, &rhs, &bias, &dst, alpha, beta, false, reshape_info, fp16_mixed_precision, act_info);

221

222

ARM_COMPUTE_EXPECT(lhs.info()->is_resizable(), framework::LogLevel::ERRORS);

223

ARM_COMPUTE_EXPECT(rhs.info()->is_resizable(), framework::LogLevel::ERRORS);

224

ARM_COMPUTE_EXPECT(bias.info()->is_resizable(), framework::LogLevel::ERRORS);

225

226

// Allocate tensors

227

lhs.allocator()->allocate();

228

rhs.allocator()->allocate();

229

bias.allocator()->allocate();

230

dst.allocator()->allocate();

231

232

ARM_COMPUTE_EXPECT(!lhs.info()->is_resizable(), framework::LogLevel::ERRORS);

233

ARM_COMPUTE_EXPECT(!rhs.info()->is_resizable(), framework::LogLevel::ERRORS);

234

ARM_COMPUTE_EXPECT(!bias.info()->is_resizable(), framework::LogLevel::ERRORS);

235

ARM_COMPUTE_EXPECT(!dst.info()->is_resizable(), framework::LogLevel::ERRORS);

236

237

// Fill tensors

238

fill(AccessorType(lhs), 0);

239

fill(AccessorType(rhs), 1);

240

fill(AccessorType(bias), 2);

// Compute GEMM

gemm.run();

return dst;

}

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame^]

248

SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, bool broadcast_bias,

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

249

const ActivationLayerInfo &act_info)

250

{

251

TensorShape dst_shape = lhs_shape;

252

dst_shape[0] = rhs_shape[0];

253

dst_shape[1] = lhs_shape[1];

254

255

// Create reference

256

SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };

257

SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };

258

SimpleTensor<T> bias{ dst_shape, data_type, 1 };

259

260

const int n = rhs_shape[0];

261

const int m = lhs_shape[1];

262

const int batch_size = lhs_shape[2];

// Fill reference

fill(lhs, 0);

fill(rhs, 1);

fill(bias, 2);

if(broadcast_bias)

{

// In case of broadcast, we need simply copy the first into the following "M" ones

272

for(int i = 1; i < m * batch_size; i++)

273

{

274

memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));

}

}

return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);

279

}

280

281

TensorType _target{};

282

SimpleTensor<T> _reference{};

283

};

284

285

template <typename TensorType, typename AccessorType, typename T, typename GEMMFunctionType>

286

class GEMMMatrixMultiply3DValidationFixture : public framework::Fixture

287

{

288

public:

289

template <typename...>

290

void setup(unsigned int m_w, unsigned int m_h, unsigned int n, unsigned int k, unsigned int batch_size, float alpha, float beta, bool broadcast_bias, bool fp16_mixed_precision,

291

const ActivationLayerInfo &act_info, DataType data_type, GPUTarget gpu_arch)

292

{

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame^]

293

ARM_COMPUTE_UNUSED(broadcast_bias);

294

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

295

// In case of GEMM3D, m is the product between m_w and m_h

296

const unsigned int m = m_w * m_h;

297

298

// Set the tensor shapes for LHS and RHS matrices

299

const TensorShape lhs_shape(k, m, batch_size);

300

const TensorShape rhs_shape(n, k, batch_size);

301

const TensorShape bias_shape(n, 1, 1);

302

303

_target = compute_target(lhs_shape, rhs_shape, bias_shape, data_type, alpha, beta, m_h, fp16_mixed_precision, act_info, gpu_arch);

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame^]

304

_reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, m_h, act_info);

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

}

protected:

template <typename U>

309

void fill(U &&tensor, int i)

310

{

311

std::uniform_real_distribution<> distribution(-1.0f, 1.0f);

312

library->fill(tensor, distribution, i);

313

}

314

315

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, DataType data_type, float alpha, float beta, unsigned int m_h,

316

bool fp16_mixed_precision, const ActivationLayerInfo &act_info, GPUTarget gpu_arch)

317

{

318

// Create tensors

319

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

320

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

321

TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);

322

TensorType dst;

323

324

const unsigned int m = lhs_shape[1];

325

const unsigned int n = rhs_shape[0];

326

const unsigned int k = lhs_shape[0];

327

GEMMReshapeInfo reshape_info(m, n, k, 1, 1, m_h, false, true);

328

329

// The output tensor will be auto-initialized within the function

330

331

// Create and configure function

332

GEMMFunctionType gemm;

333

gemm.configure(gpu_arch, &lhs, &rhs, &bias, &dst, alpha, beta, false, reshape_info, fp16_mixed_precision, act_info);

334

335

ARM_COMPUTE_EXPECT(lhs.info()->is_resizable(), framework::LogLevel::ERRORS);

336

ARM_COMPUTE_EXPECT(rhs.info()->is_resizable(), framework::LogLevel::ERRORS);

337

ARM_COMPUTE_EXPECT(bias.info()->is_resizable(), framework::LogLevel::ERRORS);

338

339

// Allocate tensors

340

lhs.allocator()->allocate();

341

rhs.allocator()->allocate();

342

bias.allocator()->allocate();

343

dst.allocator()->allocate();

344

345

ARM_COMPUTE_EXPECT(!lhs.info()->is_resizable(), framework::LogLevel::ERRORS);

346

ARM_COMPUTE_EXPECT(!rhs.info()->is_resizable(), framework::LogLevel::ERRORS);

347

ARM_COMPUTE_EXPECT(!bias.info()->is_resizable(), framework::LogLevel::ERRORS);

348

ARM_COMPUTE_EXPECT(!dst.info()->is_resizable(), framework::LogLevel::ERRORS);

349

350

// Fill tensors

351

fill(AccessorType(lhs), 0);

352

fill(AccessorType(rhs), 1);

353

fill(AccessorType(bias), 2);

// Compute GEMM

gemm.run();

return dst;

}

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame^]

361

SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, unsigned int m_h,

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

362

const ActivationLayerInfo &act_info)

363

{

364

TensorShape dst_shape = lhs_shape;

365

dst_shape.set(0, rhs_shape[0]);

366

dst_shape.set(1, lhs_shape[1] / m_h);

367

dst_shape.set(2, m_h);

368

dst_shape.set(3, lhs_shape[2]);

369

370

// Create reference

371

SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };

372

SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };

373

SimpleTensor<T> bias{ dst_shape, data_type, 1 };

374

375

const int n = rhs_shape[0];

376

const int m = lhs_shape[1];

377

const int batch_size = lhs_shape[2];

// Fill reference

fill(lhs, 0);

fill(rhs, 1);

fill(bias, 2);

// In case of broadcast, we need simply copy the first into the following "M" ones

385

for(int i = 1; i < m * batch_size; i++)

386

{

387

memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));

388

}

389

390

return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);

391

}

392

393

TensorType _target{};

394

SimpleTensor<T> _reference{};

395

};

396

397

template <typename TensorType, typename AccessorType, typename T, typename ReshapeLHSFunctionType, typename ReshapeRHSFunctionType, typename GEMMFunctionType>

398

class GEMMMatrixMultiplyInterleavedTransposedValidationFixture : public framework::Fixture

399

{

400

public:

401

template <typename...>

402

void setup(unsigned int m, unsigned int n, unsigned int k, unsigned int batch_size, float alpha, float beta, unsigned int v0, unsigned int h0, bool broadcast_bias, bool fp16_mixed_precision,

403

const ActivationLayerInfo &act_info, DataType data_type, GPUTarget gpu_arch)

404

{

405

GEMMLHSMatrixInfo lhs_info;

lhs_info.m0 = 4;

lhs_info.k0 = 4;

lhs_info.v0 = v0;

lhs_info.interleave = true;

410

lhs_info.transpose = true;

411

412

GEMMRHSMatrixInfo rhs_info;

413

rhs_info.n0 = 16 / sizeof(T);

414

rhs_info.k0 = 1;

415

rhs_info.h0 = h0;

416

rhs_info.interleave = false;

417

rhs_info.transpose = false;

418

419

// Set the tensor shapes for LHS and RHS matrices

420

const TensorShape lhs_shape(k, m, batch_size);

421

const TensorShape rhs_shape(n, k, batch_size);

422

const TensorShape bias_shape(n,

423

broadcast_bias ? 1 : m,

424

broadcast_bias ? 1 : batch_size);

425

426

_target = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, broadcast_bias, fp16_mixed_precision, act_info, gpu_arch);

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame^]

427

_reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, broadcast_bias, act_info);

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

}

protected:

template <typename U>

432

void fill(U &&tensor, int i)

433

{

434

std::uniform_real_distribution<> distribution(-1.0f, 1.0f);

435

library->fill(tensor, distribution, i);

436

437

// Fill border with infinity in order to check the presence of NaN values (i.e. inf * 0)

438

std::uniform_real_distribution<> distribution_inf(std::numeric_limits<float>::infinity(), std::numeric_limits<float>::infinity());

439

library->fill_borders_with_garbage(tensor, distribution_inf, i);

440

}

441

442

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,

443

DataType data_type, float alpha, float beta, bool broadcast_bias, bool fp16_mixed_precision, const ActivationLayerInfo &act_info, GPUTarget gpu_arch)

444

{

445

// Create tensors

446

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

447

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

448

TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);

449

TensorType lhs_reshaped;

450

TensorType rhs_reshaped;

451

TensorType dst;

452

453

const unsigned int m = lhs_shape[1];

454

const unsigned int n = rhs_shape[0];

455

const unsigned int k = lhs_shape[0];

456

GEMMReshapeInfo reshape_info(m, n, k, rhs_info.h0, lhs_info.v0, 0, false, broadcast_bias);

457

458

// The output tensor will be auto-initialized within the function

459

460

// Create and configure function

461

ReshapeLHSFunctionType reshape_lhs;

462

ReshapeRHSFunctionType reshape_rhs;

463

GEMMFunctionType gemm;

464

reshape_lhs.configure(&lhs, &lhs_reshaped, lhs_info);

465

reshape_rhs.configure(&rhs, &rhs_reshaped, rhs_info);

466

gemm.configure(gpu_arch, &lhs_reshaped, &rhs_reshaped, &bias, &dst, alpha, beta, true, reshape_info, fp16_mixed_precision, act_info);

467

468

ARM_COMPUTE_EXPECT(lhs.info()->is_resizable(), framework::LogLevel::ERRORS);

469

ARM_COMPUTE_EXPECT(rhs.info()->is_resizable(), framework::LogLevel::ERRORS);

470

ARM_COMPUTE_EXPECT(bias.info()->is_resizable(), framework::LogLevel::ERRORS);

471

472

// Allocate tensors

473

lhs.allocator()->allocate();

474

rhs.allocator()->allocate();

475

lhs_reshaped.allocator()->allocate();

476

rhs_reshaped.allocator()->allocate();

477

bias.allocator()->allocate();

478

dst.allocator()->allocate();

479

480

ARM_COMPUTE_EXPECT(!lhs.info()->is_resizable(), framework::LogLevel::ERRORS);

481

ARM_COMPUTE_EXPECT(!rhs.info()->is_resizable(), framework::LogLevel::ERRORS);

482

ARM_COMPUTE_EXPECT(!bias.info()->is_resizable(), framework::LogLevel::ERRORS);

483

ARM_COMPUTE_EXPECT(!lhs_reshaped.info()->is_resizable(), framework::LogLevel::ERRORS);

484

ARM_COMPUTE_EXPECT(!rhs_reshaped.info()->is_resizable(), framework::LogLevel::ERRORS);

485

ARM_COMPUTE_EXPECT(!dst.info()->is_resizable(), framework::LogLevel::ERRORS);

486

487

// Fill tensors

488

fill(AccessorType(lhs), 0);

489

fill(AccessorType(rhs), 1);

490

fill(AccessorType(bias), 2);

// Compute GEMM

reshape_lhs.run();

reshape_rhs.run();

gemm.run();

return dst;

}

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame^]

500

SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, bool broadcast_bias,

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

501

const ActivationLayerInfo &act_info)

502

{

503

TensorShape dst_shape = lhs_shape;

504

dst_shape[0] = rhs_shape[0];

505

dst_shape[1] = lhs_shape[1];

506

507

// Create reference

508

SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };

509

SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };

510

SimpleTensor<T> bias{ dst_shape, data_type, 1 };

511

512

const int n = rhs_shape[0];

513

const int m = lhs_shape[1];

514

const int batch_size = lhs_shape[2];

// Fill reference

fill(lhs, 0);

fill(rhs, 1);

fill(bias, 2);

if(broadcast_bias)

{

// In case of broadcast, we need simply copy the first into the following "M" ones

524

for(int i = 1; i < m * batch_size; i++)

525

{

526

memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));

}

}

return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);

531

}

532

533

TensorType _target{};

534

SimpleTensor<T> _reference{};

535

};

536

537

template <typename TensorType, typename AccessorType, typename T, typename ReshapeLHSFunctionType, typename ReshapeRHSFunctionType, typename GEMMFunctionType>

538

class GEMMMatrixMultiplyInterleavedTransposed3DValidationFixture : public framework::Fixture

539

{

540

public:

541

template <typename...>

542

void setup(unsigned int m_w, unsigned int m_h, unsigned int n, unsigned int k, unsigned int batch_size, float alpha, float beta, unsigned int v0, unsigned int h0, bool broadcast_bias,

543

bool fp16_mixed_precision, const ActivationLayerInfo &act_info, DataType data_type, GPUTarget gpu_arch)

544

{

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame^]

545

ARM_COMPUTE_UNUSED(broadcast_bias);

546

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

547

GEMMLHSMatrixInfo lhs_info;

lhs_info.m0 = 4;

lhs_info.k0 = 4;

lhs_info.v0 = v0;

lhs_info.interleave = true;

552

lhs_info.transpose = true;

553

554

GEMMRHSMatrixInfo rhs_info;

555

rhs_info.n0 = 16 / sizeof(T);

556

rhs_info.k0 = 1;

557

rhs_info.h0 = h0;

558

rhs_info.interleave = false;

559

rhs_info.transpose = false;

560

561

// In case of GEMM3D, m is the product between m_w and m_h

562

const unsigned int m = m_w * m_h;

563

564

// Set the tensor shapes for LHS and RHS matrices

565

const TensorShape lhs_shape(k, m, batch_size);

566

const TensorShape rhs_shape(n, k, batch_size);

567

const TensorShape bias_shape(n, 1, 1);

568

569

_target = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, m_h, fp16_mixed_precision, act_info, gpu_arch);

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame^]

570

_reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, m_h, act_info);

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

}

protected:

template <typename U>

575

void fill(U &&tensor, int i)

576

{

577

std::uniform_real_distribution<> distribution(-1.0f, 1.0f);

578

library->fill(tensor, distribution, i);

579

}

580

581

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,

582

DataType data_type, float alpha, float beta, unsigned int m_h, bool fp16_mixed_precision, const ActivationLayerInfo &act_info, GPUTarget gpu_arch)

583

{

584

// Create tensors

585

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

586

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

587

TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);

588

TensorType lhs_reshaped;

589

TensorType rhs_reshaped;

590

TensorType dst;

591

592

const unsigned int m = lhs_shape[1];

593

const unsigned int n = rhs_shape[0];

594

const unsigned int k = lhs_shape[0];

595

GEMMReshapeInfo reshape_info(m, n, k, rhs_info.h0, lhs_info.v0, m_h, false, true);

596

597

// The output tensor will be auto-initialized within the function

598

599

// Create and configure function

600

ReshapeLHSFunctionType reshape_lhs;

601

ReshapeRHSFunctionType reshape_rhs;

602

GEMMFunctionType gemm;

603

reshape_lhs.configure(&lhs, &lhs_reshaped, lhs_info);

604

reshape_rhs.configure(&rhs, &rhs_reshaped, rhs_info);

605

gemm.configure(gpu_arch, &lhs_reshaped, &rhs_reshaped, &bias, &dst, alpha, beta, true, reshape_info, fp16_mixed_precision, act_info);

606

607

ARM_COMPUTE_EXPECT(lhs.info()->is_resizable(), framework::LogLevel::ERRORS);

608

ARM_COMPUTE_EXPECT(rhs.info()->is_resizable(), framework::LogLevel::ERRORS);

609

ARM_COMPUTE_EXPECT(bias.info()->is_resizable(), framework::LogLevel::ERRORS);

610

611

// Allocate tensors

612

lhs.allocator()->allocate();

613

rhs.allocator()->allocate();

614

lhs_reshaped.allocator()->allocate();

615

rhs_reshaped.allocator()->allocate();

616

bias.allocator()->allocate();

617

dst.allocator()->allocate();

618

619

ARM_COMPUTE_EXPECT(!lhs.info()->is_resizable(), framework::LogLevel::ERRORS);

620

ARM_COMPUTE_EXPECT(!rhs.info()->is_resizable(), framework::LogLevel::ERRORS);

621

ARM_COMPUTE_EXPECT(!lhs_reshaped.info()->is_resizable(), framework::LogLevel::ERRORS);

622

ARM_COMPUTE_EXPECT(!rhs_reshaped.info()->is_resizable(), framework::LogLevel::ERRORS);

623

ARM_COMPUTE_EXPECT(!bias.info()->is_resizable(), framework::LogLevel::ERRORS);

624

ARM_COMPUTE_EXPECT(!dst.info()->is_resizable(), framework::LogLevel::ERRORS);

625

626

// Fill tensors

627

fill(AccessorType(lhs), 0);

628

fill(AccessorType(rhs), 1);

629

fill(AccessorType(bias), 2);

// Compute GEMM

reshape_lhs.run();

reshape_rhs.run();

gemm.run();

return dst;

}

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame^]

639

SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, unsigned int m_h,

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

640

const ActivationLayerInfo &act_info)

641

{

642

TensorShape dst_shape = lhs_shape;

643

dst_shape.set(0, rhs_shape[0]);

644

dst_shape.set(1, lhs_shape[1] / m_h);

645

dst_shape.set(2, m_h);

646

dst_shape.set(3, lhs_shape[2]);

647

648

// Create reference

649

SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };

650

SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };

651

SimpleTensor<T> bias{ dst_shape, data_type, 1 };

652

653

const int n = rhs_shape[0];

654

const int m = lhs_shape[1];

655

const int batch_size = lhs_shape[2];

// Fill reference

fill(lhs, 0);

fill(rhs, 1);

fill(bias, 2);

// In case of broadcast, we need simply copy the first into the following "M" ones

663

for(int i = 1; i < m * batch_size; i++)

664

{

665

memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));

666

}

667

668

return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);

669

}

670

671

TensorType _target{};

672

SimpleTensor<T> _reference{};

673

};

674

Gian Marco Iodice

2019-09-27 09:23:15 +0100

[diff] [blame]

675

template <typename TensorType, typename AccessorType, typename T, typename ReshapeLHSFunctionType, typename ReshapeRHSFunctionType, typename GEMMFunctionType, bool fp_mixed_precision = false>

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

676

class GEMMMatrixMultiplyReshapedValidationFixture : public framework::Fixture

677

{

678

public:

679

template <typename...>

680

void setup(unsigned int m, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0, unsigned int v0, unsigned int h0, bool interleave_lhs,

Giorgio Arena

2019-08-01 14:22:12 +0100

[diff] [blame]

681

bool interleave_rhs, DataType data_type, float alpha, float beta, bool broadcast_bias, bool lhs_transpose, const ActivationLayerInfo &act_info)

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

682

{

683

GEMMLHSMatrixInfo lhs_info;

lhs_info.m0 = m0;

lhs_info.k0 = k0;

lhs_info.v0 = v0;

lhs_info.interleave = interleave_lhs;

Giorgio Arena

2019-08-01 14:22:12 +0100

[diff] [blame]

688

lhs_info.transpose = lhs_transpose;

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

689

690

GEMMRHSMatrixInfo rhs_info;

rhs_info.n0 = n0;

rhs_info.k0 = k0;

rhs_info.h0 = h0;

rhs_info.interleave = interleave_rhs;

Giorgio Arena

2019-08-01 14:22:12 +0100

[diff] [blame]

695

rhs_info.transpose = !lhs_transpose;

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

696

697

// Set the tensor shapes for LHS and RHS matrices

698

const TensorShape lhs_shape(k, m, batch_size);

699

const TensorShape rhs_shape(n, k, batch_size);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

700

const TensorShape bias_shape(n,

701

broadcast_bias ? 1 : m,

702

broadcast_bias ? 1 : batch_size);

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

703

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

704

_target = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, broadcast_bias, act_info);

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame^]

705

_reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, broadcast_bias, act_info);

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

}

protected:

template <typename U>

710

void fill(U &&tensor, int i)

711

{

712

std::uniform_real_distribution<> distribution(-1.0f, 1.0f);

713

library->fill(tensor, distribution, i);

Gian Marco Iodice

b87b95e

2019-01-21 17:14:31 +0000

[diff] [blame]

714

715

// Fill border with infinity in order to check the presence of NaN values (i.e. inf * 0)

716

std::uniform_real_distribution<> distribution_inf(std::numeric_limits<float>::infinity(), std::numeric_limits<float>::infinity());

717

library->fill_borders_with_garbage(tensor, distribution_inf, i);

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

718

}

719

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

720

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

721

DataType data_type, float alpha, float beta, bool broadcast_bias, const ActivationLayerInfo &act_info)

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

722

{

723

// Create tensors

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

724

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

725

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

726

TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

727

TensorType lhs_reshaped;

728

TensorType rhs_reshaped;

729

TensorType dst;

730

731

const unsigned int M = lhs_shape[1];

732

const unsigned int N = rhs_shape[0];

733

const unsigned int K = lhs_shape[0];

Gian Marco Iodice

2019-06-26 17:18:11 +0100

[diff] [blame]

734

GEMMKernelInfo kernel_info;

kernel_info.m = M;

kernel_info.n = N;

kernel_info.k = K;

kernel_info.depth_output_gemm3d = 0;

739

kernel_info.reinterpret_input_as_3d = false;

740

kernel_info.broadcast_bias = broadcast_bias;

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

741

kernel_info.activation_info = act_info;

Gian Marco Iodice

2019-09-27 09:23:15 +0100

[diff] [blame]

742

kernel_info.fp_mixed_precision = fp_mixed_precision;

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

743

744

// The output tensor will be auto-initialized within the function

745

746

// Create and configure function

747

ReshapeLHSFunctionType reshape_lhs;

748

ReshapeRHSFunctionType reshape_rhs;

749

GEMMFunctionType gemm;

750

reshape_lhs.configure(&lhs, &lhs_reshaped, lhs_info);

751

reshape_rhs.configure(&rhs, &rhs_reshaped, rhs_info);

Gian Marco Iodice

2019-06-26 17:18:11 +0100

[diff] [blame]

752

gemm.configure(&lhs_reshaped, &rhs_reshaped, &bias, &dst, alpha, beta, lhs_info, rhs_info, kernel_info);

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

753

754

ARM_COMPUTE_EXPECT(lhs.info()->is_resizable(), framework::LogLevel::ERRORS);

755

ARM_COMPUTE_EXPECT(rhs.info()->is_resizable(), framework::LogLevel::ERRORS);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

756

ARM_COMPUTE_EXPECT(bias.info()->is_resizable(), framework::LogLevel::ERRORS);

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

757

758

// Allocate tensors

759

lhs.allocator()->allocate();

760

rhs.allocator()->allocate();

761

lhs_reshaped.allocator()->allocate();

762

rhs_reshaped.allocator()->allocate();

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

763

bias.allocator()->allocate();

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

764

dst.allocator()->allocate();

765

766

ARM_COMPUTE_EXPECT(!lhs.info()->is_resizable(), framework::LogLevel::ERRORS);

767

ARM_COMPUTE_EXPECT(!rhs.info()->is_resizable(), framework::LogLevel::ERRORS);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

768

ARM_COMPUTE_EXPECT(!bias.info()->is_resizable(), framework::LogLevel::ERRORS);

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

769

ARM_COMPUTE_EXPECT(!lhs_reshaped.info()->is_resizable(), framework::LogLevel::ERRORS);

770

ARM_COMPUTE_EXPECT(!rhs_reshaped.info()->is_resizable(), framework::LogLevel::ERRORS);

771

ARM_COMPUTE_EXPECT(!dst.info()->is_resizable(), framework::LogLevel::ERRORS);

772

773

// Fill tensors

774

fill(AccessorType(lhs), 0);

775

fill(AccessorType(rhs), 1);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

776

fill(AccessorType(bias), 2);

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

// Compute GEMM

reshape_lhs.run();

reshape_rhs.run();

gemm.run();

return dst;

}

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame^]

786

SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, bool broadcast_bias,

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

787

const ActivationLayerInfo &act_info)

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

788

{

789

TensorShape dst_shape = lhs_shape;

790

dst_shape[0] = rhs_shape[0];

791

dst_shape[1] = lhs_shape[1];

792

793

// Create reference

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

794

SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };

795

SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

796

SimpleTensor<T> bias{ dst_shape, data_type, 1 };

797

798

const int n = rhs_shape[0];

799

const int m = lhs_shape[1];

800

const int batch_size = lhs_shape[2];

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

// Fill reference

fill(lhs, 0);

fill(rhs, 1);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

805

fill(bias, 2);

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

806

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

807

if(broadcast_bias)

808

{

809

// In case of broadcast, we need simply copy the first into the following "M" ones

810

for(int i = 1; i < m * batch_size; i++)

811

{

812

memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));

}

}

Gian Marco Iodice

2019-09-27 09:23:15 +0100

[diff] [blame]

816

if(fp_mixed_precision)

817

{

818

return reference::activation_layer(reference::gemm_mixed_precision<T>(lhs, rhs, bias, alpha, beta), act_info);

}

else

{

return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);

823

}

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

824

}

825

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

826

TensorType _target{};

827

SimpleTensor<T> _reference{};

828

};

829

Gian Marco Iodice

2019-09-27 09:23:15 +0100

[diff] [blame]

830

template <typename TensorType, typename AccessorType, typename T, typename ReshapeLHSFunctionType, typename ReshapeRHSFunctionType, typename GEMMFunctionType, bool fp_mixed_precision = false>

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

831

class GEMMMatrixMultiplyReshaped3DValidationFixture : public framework::Fixture

832

{

833

public:

834

template <typename...>

835

void setup(unsigned int m_w, unsigned int m_h, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0, unsigned int v0, unsigned int h0,

836

bool interleave_lhs,

Giorgio Arena

2019-08-01 14:22:12 +0100

[diff] [blame]

837

bool interleave_rhs, DataType data_type, float alpha, float beta, bool lhs_transpose, const ActivationLayerInfo &act_info)

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

838

{

839

GEMMLHSMatrixInfo lhs_info;

lhs_info.m0 = m0;

lhs_info.k0 = k0;

lhs_info.v0 = v0;

lhs_info.interleave = interleave_lhs;

Giorgio Arena

2019-08-01 14:22:12 +0100

[diff] [blame]

844

lhs_info.transpose = lhs_transpose;

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

845

846

GEMMRHSMatrixInfo rhs_info;

rhs_info.n0 = n0;

rhs_info.k0 = k0;

rhs_info.h0 = h0;

rhs_info.interleave = interleave_rhs;

Giorgio Arena

2019-08-01 14:22:12 +0100

[diff] [blame]

851

rhs_info.transpose = !lhs_transpose;

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

852

853

// In case of GEMM3D, m is the product between m_w and m_h

854

const unsigned int m = m_w * m_h;

855

856

// Set the tensor shapes for LHS and RHS matrices

857

const TensorShape lhs_shape(k, m, batch_size);

858

const TensorShape rhs_shape(n, k, batch_size);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

859

const TensorShape bias_shape(n, 1, 1);

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

860

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

861

_target = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, m_h, act_info);

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame^]

862

_reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, m_h, act_info);

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

}

protected:

template <typename U>

867

void fill(U &&tensor, int i)

868

{

869

std::uniform_real_distribution<> distribution(-1.0f, 1.0f);

870

library->fill(tensor, distribution, i);

871

}

872

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

873

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

874

DataType data_type, float alpha, float beta, unsigned int m_h, const ActivationLayerInfo &act_info)

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

875

{

876

// Create tensors

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

877

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

878

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

879

TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

880

TensorType lhs_reshaped;

881

TensorType rhs_reshaped;

882

TensorType dst;

883

884

const unsigned int M = lhs_shape[1];

885

const unsigned int N = rhs_shape[0];

886

const unsigned int K = lhs_shape[0];

Gian Marco Iodice

2019-06-26 17:18:11 +0100

[diff] [blame]

887

GEMMKernelInfo kernel_info;

kernel_info.m = M;

kernel_info.n = N;

kernel_info.k = K;

kernel_info.depth_output_gemm3d = m_h;

892

kernel_info.reinterpret_input_as_3d = false;

893

kernel_info.broadcast_bias = true;

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

894

kernel_info.activation_info = act_info;

Gian Marco Iodice

2019-09-27 09:23:15 +0100

[diff] [blame]

895

kernel_info.fp_mixed_precision = fp_mixed_precision;

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

896

897

// The output tensor will be auto-initialized within the function

898

899

// Create and configure function

900

ReshapeLHSFunctionType reshape_lhs;

901

ReshapeRHSFunctionType reshape_rhs;

902

GEMMFunctionType gemm;

903

reshape_lhs.configure(&lhs, &lhs_reshaped, lhs_info);

904

reshape_rhs.configure(&rhs, &rhs_reshaped, rhs_info);

Gian Marco Iodice

2019-06-26 17:18:11 +0100

[diff] [blame]

905

gemm.configure(&lhs_reshaped, &rhs_reshaped, &bias, &dst, alpha, beta, lhs_info, rhs_info, kernel_info);

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

906

907

ARM_COMPUTE_EXPECT(lhs.info()->is_resizable(), framework::LogLevel::ERRORS);

908

ARM_COMPUTE_EXPECT(rhs.info()->is_resizable(), framework::LogLevel::ERRORS);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

909

ARM_COMPUTE_EXPECT(bias.info()->is_resizable(), framework::LogLevel::ERRORS);

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

910

911

// Allocate tensors

912

lhs.allocator()->allocate();

913

rhs.allocator()->allocate();

914

lhs_reshaped.allocator()->allocate();

915

rhs_reshaped.allocator()->allocate();

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

916

bias.allocator()->allocate();

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

917

dst.allocator()->allocate();

918

919

ARM_COMPUTE_EXPECT(!lhs.info()->is_resizable(), framework::LogLevel::ERRORS);

920

ARM_COMPUTE_EXPECT(!rhs.info()->is_resizable(), framework::LogLevel::ERRORS);

921

ARM_COMPUTE_EXPECT(!lhs_reshaped.info()->is_resizable(), framework::LogLevel::ERRORS);

922

ARM_COMPUTE_EXPECT(!rhs_reshaped.info()->is_resizable(), framework::LogLevel::ERRORS);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

923

ARM_COMPUTE_EXPECT(!bias.info()->is_resizable(), framework::LogLevel::ERRORS);

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

924

ARM_COMPUTE_EXPECT(!dst.info()->is_resizable(), framework::LogLevel::ERRORS);

925

926

// Fill tensors

927

fill(AccessorType(lhs), 0);

928

fill(AccessorType(rhs), 1);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

929

fill(AccessorType(bias), 2);

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

// Compute GEMM

reshape_lhs.run();

reshape_rhs.run();

gemm.run();

return dst;

}

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame^]

939

SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, unsigned int m_h,

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

940

const ActivationLayerInfo &act_info)

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

941

{

942

TensorShape dst_shape = lhs_shape;

943

dst_shape.set(0, rhs_shape[0]);

944

dst_shape.set(1, lhs_shape[1] / m_h);

945

dst_shape.set(2, m_h);

946

dst_shape.set(3, lhs_shape[2]);

947

948

// Create reference

949

SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };

950

SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

951

SimpleTensor<T> bias{ dst_shape, data_type, 1 };

952

953

const int n = rhs_shape[0];

954

const int m = lhs_shape[1];

955

const int batch_size = lhs_shape[2];

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

// Fill reference

fill(lhs, 0);

fill(rhs, 1);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

960

fill(bias, 2);

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

961

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

962

// In case of broadcast, we need simply copy the first into the following "M" ones

963

for(int i = 1; i < m * batch_size; i++)

964

{

965

memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));

966

}

967

Gian Marco Iodice

2019-09-27 09:23:15 +0100

[diff] [blame]

968

if(fp_mixed_precision)

969

{

970

return reference::activation_layer(reference::gemm_mixed_precision<T>(lhs, rhs, bias, alpha, beta), act_info);

}

else

{

return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);

975

}

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

976

}

977

978

TensorType _target{};

979

SimpleTensor<T> _reference{};

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

980

};

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

981

982

template <typename TensorType, typename AccessorType, typename T, typename ReshapeRHSFunctionType, typename GEMMFunctionType>

983

class GEMMMatrixMultiplyReshapedOnlyRHSValidationFixture : public framework::Fixture

984

{

985

public:

986

template <typename...>

987

void setup(unsigned int m, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0, unsigned int h0,

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

988

bool interleave_rhs, bool transpose_rhs, DataType data_type, float alpha, float beta, bool broadcast_bias, const ActivationLayerInfo &act_info)

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

989

{

990

GEMMLHSMatrixInfo lhs_info;

lhs_info.m0 = m0;

lhs_info.k0 = k0;

GEMMRHSMatrixInfo rhs_info;

rhs_info.n0 = n0;

rhs_info.k0 = k0;

rhs_info.h0 = h0;

rhs_info.interleave = interleave_rhs;

999

rhs_info.transpose = transpose_rhs;

1000

1001

// Set the tensor shapes for LHS and RHS matrices

1002

const TensorShape lhs_shape(k, m, batch_size);

1003

const TensorShape rhs_shape(n, k, batch_size);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1004

const TensorShape bias_shape(n,

1005

broadcast_bias ? 1 : m,

1006

broadcast_bias ? 1 : batch_size);

Georgios Pinitas

2019-05-21 13:32:43 +0100

[diff] [blame]

1007

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1008

_target = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, broadcast_bias, act_info);

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame^]

1009

_reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, broadcast_bias, act_info);

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

}

protected:

template <typename U>

1014

void fill(U &&tensor, int i)

1015

{

1016

std::uniform_real_distribution<> distribution(-1.0f, 1.0f);

1017

library->fill(tensor, distribution, i);

1018

1019

// Fill border with infinity in order to check the presence of NaN values (i.e. inf * 0)

1020

std::uniform_real_distribution<> distribution_inf(std::numeric_limits<float>::infinity(), std::numeric_limits<float>::infinity());

1021

library->fill_borders_with_garbage(tensor, distribution_inf, i);

1022

}

1023

Georgios Pinitas

2019-05-21 13:32:43 +0100

[diff] [blame]

1024

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1025

DataType data_type, float alpha, float beta, bool broadcast_bias, const ActivationLayerInfo &act_info)

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1026

{

1027

// Create tensors

Georgios Pinitas

2019-05-21 13:32:43 +0100

[diff] [blame]

1028

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

1029

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

1030

TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1031

TensorType rhs_reshaped;

1032

TensorType dst;

1033

1034

const unsigned int M = lhs_shape[1];

1035

const unsigned int N = rhs_shape[0];

1036

const unsigned int K = lhs_shape[0];

Gian Marco Iodice

2019-06-26 17:18:11 +0100

[diff] [blame]

1037

GEMMKernelInfo kernel_info;

kernel_info.m = M;

kernel_info.n = N;

kernel_info.k = K;

kernel_info.depth_output_gemm3d = 0;

1042

kernel_info.reinterpret_input_as_3d = false;

1043

kernel_info.broadcast_bias = broadcast_bias;

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1044

kernel_info.activation_info = act_info;

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1045

1046

// The output tensor will be auto-initialized within the function

1047

1048

// Create and configure function

1049

ReshapeRHSFunctionType reshape_rhs;

1050

GEMMFunctionType gemm;

1051

reshape_rhs.configure(&rhs, &rhs_reshaped, rhs_info);

Gian Marco Iodice

2019-06-26 17:18:11 +0100

[diff] [blame]

1052

gemm.configure(&lhs, &rhs_reshaped, &bias, &dst, alpha, beta, lhs_info, rhs_info, kernel_info);

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1053

1054

ARM_COMPUTE_EXPECT(lhs.info()->is_resizable(), framework::LogLevel::ERRORS);

1055

ARM_COMPUTE_EXPECT(rhs.info()->is_resizable(), framework::LogLevel::ERRORS);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1056

ARM_COMPUTE_EXPECT(bias.info()->is_resizable(), framework::LogLevel::ERRORS);

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1057

1058

// Allocate tensors

1059

lhs.allocator()->allocate();

1060

rhs.allocator()->allocate();

1061

rhs_reshaped.allocator()->allocate();

Georgios Pinitas

2019-05-21 13:32:43 +0100

[diff] [blame]

1062

bias.allocator()->allocate();

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1063

dst.allocator()->allocate();

1064

1065

ARM_COMPUTE_EXPECT(!lhs.info()->is_resizable(), framework::LogLevel::ERRORS);

1066

ARM_COMPUTE_EXPECT(!rhs.info()->is_resizable(), framework::LogLevel::ERRORS);

1067

ARM_COMPUTE_EXPECT(!rhs_reshaped.info()->is_resizable(), framework::LogLevel::ERRORS);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1068

ARM_COMPUTE_EXPECT(!bias.info()->is_resizable(), framework::LogLevel::ERRORS);

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1069

ARM_COMPUTE_EXPECT(!dst.info()->is_resizable(), framework::LogLevel::ERRORS);

1070

1071

// Fill tensors

1072

fill(AccessorType(lhs), 0);

1073

fill(AccessorType(rhs), 1);

Georgios Pinitas

2019-05-21 13:32:43 +0100

[diff] [blame]

1074

fill(AccessorType(bias), 2);

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

// Compute GEMM

reshape_rhs.run();

gemm.run();

return dst;

}

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame^]

1083

SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, bool broadcast_bias,

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1084

const ActivationLayerInfo &act_info)

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1085

{

1086

TensorShape dst_shape = lhs_shape;

1087

dst_shape[0] = rhs_shape[0];

1088

dst_shape[1] = lhs_shape[1];

1089

1090

// Create reference

1091

SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };

1092

SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };

Georgios Pinitas

2019-05-21 13:32:43 +0100

[diff] [blame]

1093

SimpleTensor<T> bias{ dst_shape, data_type, 1 };

1094

1095

const int n = rhs_shape[0];

1096

const int m = lhs_shape[1];

1097

const int batch_size = lhs_shape[2];

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

// Fill reference

fill(lhs, 0);

fill(rhs, 1);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1102

fill(bias, 2);

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1103

Georgios Pinitas

2019-05-21 13:32:43 +0100

[diff] [blame]

1104

if(broadcast_bias)

1105

{

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1106

// In case of broadcast, we need simply copy the first into the following "M" ones

1107

for(int i = 1; i < m * batch_size; i++)

Georgios Pinitas

2019-05-21 13:32:43 +0100

[diff] [blame]

1108

{

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1109

memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));

Georgios Pinitas

2019-05-21 13:32:43 +0100

[diff] [blame]

1110

}

1111

}

Georgios Pinitas

2019-05-21 13:32:43 +0100

[diff] [blame]

1112

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1113

return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1114

}

1115

1116

TensorType _target{};

1117

SimpleTensor<T> _reference{};

1118

};

1119

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1120

template <typename TensorType, typename AccessorType, typename T, typename ReshapeRHSFunctionType, typename GEMMFunctionType>

1121

class GEMMMatrixMultiplyReshapedOnlyRHS3DValidationFixture : public framework::Fixture

1122

{

1123

public:

1124

template <typename...>

1125

void setup(unsigned int m_w, unsigned int m_h, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0, unsigned int h0,

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1126

bool interleave_rhs, bool transpose_rhs, DataType data_type, float alpha, float beta, const ActivationLayerInfo &act_info)

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1127

{

1128

GEMMLHSMatrixInfo lhs_info;

lhs_info.m0 = m0;

lhs_info.k0 = k0;

GEMMRHSMatrixInfo rhs_info;

rhs_info.n0 = n0;

rhs_info.k0 = k0;

rhs_info.h0 = h0;

rhs_info.interleave = interleave_rhs;

1137

rhs_info.transpose = transpose_rhs;

1138

1139

// In case of GEMM3D, m is the product between m_w and m_h

1140

const unsigned int m = m_w * m_h;

1141

1142

// Set the tensor shapes for LHS and RHS matrices

1143

const TensorShape lhs_shape(k, m, batch_size);

1144

const TensorShape rhs_shape(n, k, batch_size);

1145

const TensorShape bias_shape(n, 1, 1);

1146

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1147

_target = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, m_h, act_info);

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame^]

1148

_reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, m_h, act_info);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

}

protected:

template <typename U>

1153

void fill(U &&tensor, int i)

1154

{

1155

std::uniform_real_distribution<> distribution(-1.0f, 1.0f);

1156

library->fill(tensor, distribution, i);

1157

}

1158

1159

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,

1160

DataType data_type, float alpha, float beta,

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1161

unsigned int m_h, const ActivationLayerInfo &act_info)

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1162

{

1163

// Create tensors

1164

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

1165

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

1166

TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);

1167

TensorType rhs_reshaped;

1168

TensorType dst;

1169

1170

const unsigned int M = lhs_shape[1];

1171

const unsigned int N = rhs_shape[0];

1172

const unsigned int K = lhs_shape[0];

Gian Marco Iodice

2019-06-26 17:18:11 +0100

[diff] [blame]

1173

GEMMKernelInfo kernel_info;

kernel_info.m = M;

kernel_info.n = N;

kernel_info.k = K;

kernel_info.depth_output_gemm3d = m_h;

1178

kernel_info.reinterpret_input_as_3d = false;

1179

kernel_info.broadcast_bias = true;

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1180

kernel_info.activation_info = act_info;

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1181

1182

// The output tensor will be auto-initialized within the function

1183

1184

// Create and configure function

1185

ReshapeRHSFunctionType reshape_rhs;

1186

GEMMFunctionType gemm;

1187

reshape_rhs.configure(&rhs, &rhs_reshaped, rhs_info);

Gian Marco Iodice

2019-06-26 17:18:11 +0100

[diff] [blame]

1188

gemm.configure(&lhs, &rhs_reshaped, &bias, &dst, alpha, beta, lhs_info, rhs_info, kernel_info);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1189

1190

ARM_COMPUTE_EXPECT(lhs.info()->is_resizable(), framework::LogLevel::ERRORS);

1191

ARM_COMPUTE_EXPECT(rhs.info()->is_resizable(), framework::LogLevel::ERRORS);

1192

ARM_COMPUTE_EXPECT(bias.info()->is_resizable(), framework::LogLevel::ERRORS);

1193

1194

// Allocate tensors

1195

lhs.allocator()->allocate();

1196

rhs.allocator()->allocate();

1197

rhs_reshaped.allocator()->allocate();

1198

bias.allocator()->allocate();

1199

dst.allocator()->allocate();

1200

1201

ARM_COMPUTE_EXPECT(!lhs.info()->is_resizable(), framework::LogLevel::ERRORS);

1202

ARM_COMPUTE_EXPECT(!rhs.info()->is_resizable(), framework::LogLevel::ERRORS);

1203

ARM_COMPUTE_EXPECT(!rhs_reshaped.info()->is_resizable(), framework::LogLevel::ERRORS);

1204

ARM_COMPUTE_EXPECT(!bias.info()->is_resizable(), framework::LogLevel::ERRORS);

1205

ARM_COMPUTE_EXPECT(!dst.info()->is_resizable(), framework::LogLevel::ERRORS);

1206

1207

// Fill tensors

1208

fill(AccessorType(lhs), 0);

1209

fill(AccessorType(rhs), 1);

1210

fill(AccessorType(bias), 2);

// Compute GEMM

reshape_rhs.run();

gemm.run();

return dst;

}

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame^]

1219

SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, unsigned int m_h,

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1220

const ActivationLayerInfo &act_info)

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1221

{

1222

TensorShape dst_shape = lhs_shape;

1223

dst_shape.set(0, rhs_shape[0]);

1224

dst_shape.set(1, lhs_shape[1] / m_h);

1225

dst_shape.set(2, m_h);

1226

dst_shape.set(3, lhs_shape[2]);

1227

1228

// Create reference

1229

SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };

1230

SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };

1231

SimpleTensor<T> bias{ dst_shape, data_type, 1 };

1232

1233

const int n = rhs_shape[0];

1234

const int m = lhs_shape[1];

1235

const int batch_size = lhs_shape[2];

// Fill reference

fill(lhs, 0);

fill(rhs, 1);

fill(bias, 2);

// In case of broadcast, we need simply copy the first into the following "M" ones

1243

for(int i = 1; i < m * batch_size; i++)

1244

{

1245

memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));

1246

}

1247

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1248

return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1249

}

1250

1251

TensorType _target{};

1252

SimpleTensor<T> _reference{};

1253

};

1254

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1255

template <typename TensorType, typename AccessorType, typename T, typename GEMMFunctionType>

1256

class GEMMMatrixMultiplyNativeValidationFixture : public framework::Fixture

1257

{

1258

public:

1259

template <typename...>

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1260

void setup(unsigned int m, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0, DataType data_type, float alpha, float beta, bool broadcast_bias,

1261

const ActivationLayerInfo &act_info)

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1262

{

1263

GEMMLHSMatrixInfo lhs_info;

lhs_info.m0 = m0;

lhs_info.k0 = k0;

GEMMRHSMatrixInfo rhs_info;

rhs_info.n0 = n0;

rhs_info.k0 = k0;

// Set the tensor shapes for LHS and RHS matrices

1272

const TensorShape lhs_shape(k, m, batch_size);

1273

const TensorShape rhs_shape(n, k, batch_size);

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

1274

const TensorShape bias_shape(n,

1275

broadcast_bias ? 1 : m,

1276

broadcast_bias ? 1 : batch_size);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1277

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1278

_target = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, broadcast_bias, act_info);

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame^]

1279

_reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, broadcast_bias, act_info);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

}

protected:

template <typename U>

1284

void fill(U &&tensor, int i)

1285

{

1286

std::uniform_real_distribution<> distribution(-1.0f, 1.0f);

1287

library->fill(tensor, distribution, i);

1288

1289

// Fill border with infinity in order to check the presence of NaN values (i.e. inf * 0)

1290

std::uniform_real_distribution<> distribution_inf(std::numeric_limits<float>::infinity(), std::numeric_limits<float>::infinity());

1291

library->fill_borders_with_garbage(tensor, distribution_inf, i);

1292

}

1293

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

1294

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1295

DataType data_type, float alpha, float beta, bool broadcast_bias, const ActivationLayerInfo &act_info)

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1296

{

1297

// Create tensors

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

1298

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

1299

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

1300

TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1301

TensorType dst;

1302

1303

const unsigned int M = lhs_shape[1];

1304

const unsigned int N = rhs_shape[0];

1305

const unsigned int K = lhs_shape[0];

Gian Marco Iodice

2019-06-26 17:18:11 +0100

[diff] [blame]

1306

GEMMKernelInfo kernel_info;

kernel_info.m = M;

kernel_info.n = N;

kernel_info.k = K;

kernel_info.depth_output_gemm3d = 0;

1311

kernel_info.reinterpret_input_as_3d = false;

1312

kernel_info.broadcast_bias = broadcast_bias;

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1313

kernel_info.activation_info = act_info;

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1314

1315

// Create and configure function

1316

GEMMFunctionType gemm;

Gian Marco Iodice

2019-06-26 17:18:11 +0100

[diff] [blame]

1317

gemm.configure(&lhs, &rhs, &bias, &dst, alpha, beta, lhs_info, rhs_info, kernel_info);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1318

1319

ARM_COMPUTE_EXPECT(lhs.info()->is_resizable(), framework::LogLevel::ERRORS);

1320

ARM_COMPUTE_EXPECT(rhs.info()->is_resizable(), framework::LogLevel::ERRORS);

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

1321

ARM_COMPUTE_EXPECT(bias.info()->is_resizable(), framework::LogLevel::ERRORS);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1322

1323

// Allocate tensors

1324

lhs.allocator()->allocate();

1325

rhs.allocator()->allocate();

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

1326

bias.allocator()->allocate();

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1327

dst.allocator()->allocate();

1328

1329

ARM_COMPUTE_EXPECT(!lhs.info()->is_resizable(), framework::LogLevel::ERRORS);

1330

ARM_COMPUTE_EXPECT(!rhs.info()->is_resizable(), framework::LogLevel::ERRORS);

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

1331

ARM_COMPUTE_EXPECT(!bias.info()->is_resizable(), framework::LogLevel::ERRORS);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1332

ARM_COMPUTE_EXPECT(!dst.info()->is_resizable(), framework::LogLevel::ERRORS);

1333

1334

// Fill tensors

1335

fill(AccessorType(lhs), 0);

1336

fill(AccessorType(rhs), 1);

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

1337

fill(AccessorType(bias), 2);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

// Compute GEMM

gemm.run();

return dst;

}

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame^]

1345

SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, bool broadcast_bias,

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1346

const ActivationLayerInfo &act_info)

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1347

{

1348

TensorShape dst_shape = lhs_shape;

1349

dst_shape[0] = rhs_shape[0];

1350

dst_shape[1] = lhs_shape[1];

1351

1352

// Create reference

1353

SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };

1354

SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

1355

SimpleTensor<T> bias{ dst_shape, data_type, 1 };

1356

1357

const int n = rhs_shape[0];

1358

const int m = lhs_shape[1];

1359

const int batch_size = lhs_shape[2];

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

// Fill reference

fill(lhs, 0);

fill(rhs, 1);

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

1364

fill(bias, 2);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1365

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

1366

if(broadcast_bias)

1367

{

1368

// In case of broadcast, we need simply copy the first into the following "M" ones

1369

for(int i = 1; i < m * batch_size; i++)

1370

{

1371

memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));

}

}

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1375

return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1376

}

1377

1378

TensorType _target{};

1379

SimpleTensor<T> _reference{};

1380

};

1381

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1382

template <typename TensorType, typename AccessorType, typename T, typename GEMMFunctionType>

1383

class GEMMMatrixMultiplyNative3DValidationFixture : public framework::Fixture

1384

{

1385

public:

1386

template <typename...>

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1387

void setup(unsigned int m_w, unsigned int m_h, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0, DataType data_type, float alpha, float beta,

1388

const ActivationLayerInfo &act_info)

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1389

{

1390

GEMMLHSMatrixInfo lhs_info;

lhs_info.m0 = m0;

lhs_info.k0 = k0;

GEMMRHSMatrixInfo rhs_info;

rhs_info.n0 = n0;

rhs_info.k0 = k0;

// In case of GEMM3D, m is the product between m_w and m_h

1399

const unsigned int m = m_w * m_h;

1400

1401

// Set the tensor shapes for LHS and RHS matrices

1402

const TensorShape lhs_shape(k, m, batch_size);

1403

const TensorShape rhs_shape(n, k, batch_size);

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

1404

const TensorShape bias_shape(n, 1, 1);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1405

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1406

_target = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, m_h, act_info);

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame^]

1407

_reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, m_h, act_info);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

}

protected:

template <typename U>

1412

void fill(U &&tensor, int i)

1413

{

1414

std::uniform_real_distribution<> distribution(-1.0f, 1.0f);

1415

library->fill(tensor, distribution, i);

1416

}

1417

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

1418

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1419

DataType data_type, float alpha, float beta, unsigned int m_h, const ActivationLayerInfo &act_info)

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1420

{

1421

// Create tensors

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

1422

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

1423

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

1424

TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1425

TensorType dst;

1426

1427

const unsigned int M = lhs_shape[1];

1428

const unsigned int N = rhs_shape[0];

1429

const unsigned int K = lhs_shape[0];

Gian Marco Iodice

2019-06-26 17:18:11 +0100

[diff] [blame]

1430

GEMMKernelInfo kernel_info;

kernel_info.m = M;

kernel_info.n = N;

kernel_info.k = K;

kernel_info.depth_output_gemm3d = m_h;

1435

kernel_info.reinterpret_input_as_3d = false;

1436

kernel_info.broadcast_bias = true;

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1437

kernel_info.activation_info = act_info;

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1438

1439

// The output tensor will be auto-initialized within the function

1440

1441

// Create and configure function

1442

GEMMFunctionType gemm;

Gian Marco Iodice

2019-06-26 17:18:11 +0100

[diff] [blame]

1443

gemm.configure(&lhs, &rhs, &bias, &dst, alpha, beta, lhs_info, rhs_info, kernel_info);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1444

1445

ARM_COMPUTE_EXPECT(lhs.info()->is_resizable(), framework::LogLevel::ERRORS);

1446

ARM_COMPUTE_EXPECT(rhs.info()->is_resizable(), framework::LogLevel::ERRORS);

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

1447

ARM_COMPUTE_EXPECT(bias.info()->is_resizable(), framework::LogLevel::ERRORS);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1448

1449

// Allocate tensors

1450

lhs.allocator()->allocate();

1451

rhs.allocator()->allocate();

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

1452

bias.allocator()->allocate();

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1453

dst.allocator()->allocate();

1454

1455

ARM_COMPUTE_EXPECT(!lhs.info()->is_resizable(), framework::LogLevel::ERRORS);

1456

ARM_COMPUTE_EXPECT(!rhs.info()->is_resizable(), framework::LogLevel::ERRORS);

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

1457

ARM_COMPUTE_EXPECT(!bias.info()->is_resizable(), framework::LogLevel::ERRORS);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1458

ARM_COMPUTE_EXPECT(!dst.info()->is_resizable(), framework::LogLevel::ERRORS);

1459

1460

// Fill tensors

1461

fill(AccessorType(lhs), 0);

1462

fill(AccessorType(rhs), 1);

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

1463

fill(AccessorType(bias), 2);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

// Compute GEMM

gemm.run();

return dst;

}

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame^]

1471

SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, unsigned int m_h,

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1472

const ActivationLayerInfo &act_info)

giuros01