Blame - tests/validation/fixtures/GEMMFixture.h - ml/ComputeLibrary

2018-07-26 11:44:03 +0100

[diff] [blame]

48

class GEMMValidationFixture : public framework::Fixture

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

49

{

50

public:

51

template <typename...>

Pablo Tello

2018-10-30 11:18:37 +0000

[diff] [blame]

52

void setup(TensorShape shape_a, TensorShape shape_b, TensorShape shape_c, TensorShape output_shape, float alpha, float beta, bool pretranspose, DataType data_type)

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

53

{

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

54

ARM_COMPUTE_UNUSED(pretranspose);

55

_target = compute_target(shape_a, shape_b, shape_c, output_shape, alpha, beta, data_type);

56

_reference = compute_reference(shape_a, shape_b, output_shape, alpha, beta, data_type);

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

}

protected:

template <typename U>

Pablo Tello

2018-10-30 11:18:37 +0000

[diff] [blame]

61

void fill(U &&tensor, int i, float lo = -1.f, float hi = 1.f)

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

62

{

63

switch(tensor.data_type())

64

{

65

case DataType::F16:

Giorgio Arena

6aeb217

2020-12-15 15:45:43 +0000

[diff] [blame]

66

{

Giorgio Arena

b309fc2

2021-01-05 09:46:16 +0000

[diff] [blame^]

67

arm_compute::utils::uniform_real_distribution_fp16 distribution{ float(lo), float(hi) };

Giorgio Arena

6aeb217

2020-12-15 15:45:43 +0000

[diff] [blame]

68

library->fill(tensor, distribution, i);

69

break;

70

}

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

71

case DataType::F32:

72

{

Giorgio Arena

6aeb217

2020-12-15 15:45:43 +0000

[diff] [blame]

73

std::uniform_real_distribution<float> distribution(lo, hi);

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

74

library->fill(tensor, distribution, i);

break;

}

default:

library->fill_tensor_uniform(tensor, i);

}

}

TensorType compute_target(const TensorShape &shape_a, const TensorShape &shape_b, const TensorShape &shape_c, const TensorShape &output_shape, float alpha, float beta,

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

83

DataType data_type)

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

84

{

85

// Create tensors

Vidhya Sudhan Loganathan

014333d

2018-07-02 09:13:49 +0100

[diff] [blame]

86

TensorType a = create_tensor<TensorType>(shape_a, data_type, 1);

87

TensorType b = create_tensor<TensorType>(shape_b, data_type, 1);

88

TensorType c = create_tensor<TensorType>(shape_c, data_type, 1);

89

TensorType dst = create_tensor<TensorType>(output_shape, data_type, 1);

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

90

91

// Create and configure function

92

FunctionType gemm;

Isabella Gottardi

8e74f44

2018-03-01 16:42:00 +0000

[diff] [blame]

93

// The GEMMinfo includes the values of the depth in case of reinterpreted 3d output.

Gian Marco Iodice

3139f03

2018-11-05 14:26:32 +0000

[diff] [blame]

94

// If the output shape has the same number of dimensions of the input the method called is a 2D matrix multiplication (depth_output_reinterpreted_as_3D = 0),

Isabella Gottardi

8e74f44

2018-03-01 16:42:00 +0000

[diff] [blame]

95

// in the other case we have to use the reinterpreted version of GEMM (depth_output_reinterpreted_as_3D = depth of the 3D output).

Gian Marco Iodice

2019-07-29 14:27:16 +0100

[diff] [blame]

96

gemm.configure(&a,

97

&b,

98

(disable_c) ? nullptr : &c,

99

&dst,

100

alpha, beta,

101

GEMMInfo(false, false, false, (reinterpret_output_as_3d ? output_shape[2] : 0), reinterpret_input_as_3d, false, GEMMLowpOutputStageInfo(), false, (reinterpret_input_as_3d

102

|| reinterpret_output_as_3d)));

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

103

ARM_COMPUTE_EXPECT(a.info()->is_resizable(), framework::LogLevel::ERRORS);

104

ARM_COMPUTE_EXPECT(b.info()->is_resizable(), framework::LogLevel::ERRORS);

105

ARM_COMPUTE_EXPECT(c.info()->is_resizable(), framework::LogLevel::ERRORS);

106

ARM_COMPUTE_EXPECT(dst.info()->is_resizable(), framework::LogLevel::ERRORS);

107

108

// Allocate tensors

109

a.allocator()->allocate();

110

b.allocator()->allocate();

111

c.allocator()->allocate();

112

dst.allocator()->allocate();

113

114

ARM_COMPUTE_EXPECT(!a.info()->is_resizable(), framework::LogLevel::ERRORS);

115

ARM_COMPUTE_EXPECT(!b.info()->is_resizable(), framework::LogLevel::ERRORS);

116

ARM_COMPUTE_EXPECT(!c.info()->is_resizable(), framework::LogLevel::ERRORS);

117

ARM_COMPUTE_EXPECT(!dst.info()->is_resizable(), framework::LogLevel::ERRORS);

118

119

// Fill tensors

120

fill(AccessorType(a), 0);

121

fill(AccessorType(b), 1);

Pablo Tello

2018-10-30 11:18:37 +0000

[diff] [blame]

122

if(!disable_c)

123

{

124

fill(AccessorType(c), 2);

125

}

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

126

127

// Compute GEMM function

gemm.run();

return dst;

}

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

133

SimpleTensor<T> compute_reference(const TensorShape &shape_a, const TensorShape &shape_b, const TensorShape &output_shape, float alpha, float beta,

Vidhya Sudhan Loganathan

014333d

2018-07-02 09:13:49 +0100

[diff] [blame]

134

DataType data_type)

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

135

{

Gian Marco Iodice

2018-07-26 11:44:03 +0100

[diff] [blame]

136

TensorShape shape_a_to_use = shape_a;

Gian Marco Iodice

2019-07-29 14:27:16 +0100

[diff] [blame]

137

Gian Marco Iodice

2018-07-26 11:44:03 +0100

[diff] [blame]

138

if(reinterpret_input_as_3d)

139

{

140

// Collapse the second and third dimension if the input is 3D

141

shape_a_to_use.collapse(2U, 1U);

142

}

143

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

144

// Create reference

Gian Marco Iodice

2018-07-26 11:44:03 +0100

[diff] [blame]

145

SimpleTensor<T> a{ shape_a_to_use, data_type, 1 };

Vidhya Sudhan Loganathan

014333d

2018-07-02 09:13:49 +0100

[diff] [blame]

146

SimpleTensor<T> b{ shape_b, data_type, 1 };

Gian Marco Iodice

2019-07-29 14:27:16 +0100

[diff] [blame]

147

SimpleTensor<T> c{ output_shape, data_type, 1 };

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

// Fill reference

fill(a, 0);

fill(b, 1);

Gian Marco Iodice

2019-07-29 14:27:16 +0100

[diff] [blame]

152

fill(c, 2);

153

154

if(reinterpret_input_as_3d || reinterpret_output_as_3d)

Pablo Tello

2018-10-30 11:18:37 +0000

[diff] [blame]

155

{

Gian Marco Iodice

2019-07-29 14:27:16 +0100

[diff] [blame]

156

const int n = shape_b[0];

157

const int m = reinterpret_output_as_3d ? output_shape[1] * output_shape[2] : output_shape[1];

158

const int batch_size = reinterpret_output_as_3d ? output_shape[3] : output_shape[2];

159

160

// In case of broadcast, we need simply copy the first into the following "M" ones

161

for(int i = 1; i < m * batch_size; i++)

162

{

163

memcpy(c.data() + i * n, c.data(), n * sizeof(T));

164

}

Pablo Tello

2018-10-30 11:18:37 +0000

[diff] [blame]

165

}

Gian Marco Iodice

2019-07-29 14:27:16 +0100

[diff] [blame]

166

167

// Setting beta to 0 will effectively disable C for the

168

// computation of the reference: alpha * A * B + 0 * C

169

return reference::gemm<T>(a, b, c, alpha, disable_c ? 0.f : beta);

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

170

}

171

172

TensorType _target{};

173

SimpleTensor<T> _reference{};

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

174

};

175

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

176

template <typename TensorType, typename AccessorType, typename T, typename GEMMFunctionType>

177

class GEMMMatrixMultiplyValidationFixture : public framework::Fixture

178

{

179

public:

180

template <typename...>

181

void setup(unsigned int m, unsigned int n, unsigned int k, unsigned int batch_size, float alpha, float beta, bool broadcast_bias, bool fp16_mixed_precision, const ActivationLayerInfo &act_info,

182

DataType data_type, GPUTarget gpu_arch)

183

{

184

// Set the tensor shapes for LHS and RHS matrices

185

const TensorShape lhs_shape(k, m, batch_size);

186

const TensorShape rhs_shape(n, k, batch_size);

187

const TensorShape bias_shape(n,

188

broadcast_bias ? 1 : m,

189

broadcast_bias ? 1 : batch_size);

190

191

_target = compute_target(lhs_shape, rhs_shape, bias_shape, data_type, alpha, beta, broadcast_bias, fp16_mixed_precision, act_info, gpu_arch);

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

192

_reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, broadcast_bias, act_info);

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

}

protected:

template <typename U>

197

void fill(U &&tensor, int i)

198

{

199

std::uniform_real_distribution<> distribution(-1.0f, 1.0f);

200

library->fill(tensor, distribution, i);

201

202

// Fill border with infinity in order to check the presence of NaN values (i.e. inf * 0)

203

std::uniform_real_distribution<> distribution_inf(std::numeric_limits<float>::infinity(), std::numeric_limits<float>::infinity());

204

library->fill_borders_with_garbage(tensor, distribution_inf, i);

205

}

206

207

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, DataType data_type, float alpha, float beta, bool broadcast_bias,

208

bool fp16_mixed_precision, const ActivationLayerInfo &act_info, GPUTarget gpu_arch)

209

{

210

// Create tensors

211

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

212

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

213

TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);

214

TensorType dst;

215

216

const unsigned int m = lhs_shape[1];

217

const unsigned int n = rhs_shape[0];

218

const unsigned int k = lhs_shape[0];

219

GEMMReshapeInfo reshape_info(m, n, k, 1, 1, 0, false, broadcast_bias);

220

221

// The output tensor will be auto-initialized within the function

222

223

// Create and configure function

224

GEMMFunctionType gemm;

225

gemm.configure(gpu_arch, &lhs, &rhs, &bias, &dst, alpha, beta, false, reshape_info, fp16_mixed_precision, act_info);

226

227

ARM_COMPUTE_EXPECT(lhs.info()->is_resizable(), framework::LogLevel::ERRORS);

228

ARM_COMPUTE_EXPECT(rhs.info()->is_resizable(), framework::LogLevel::ERRORS);

229

ARM_COMPUTE_EXPECT(bias.info()->is_resizable(), framework::LogLevel::ERRORS);

230

231

// Allocate tensors

232

lhs.allocator()->allocate();

233

rhs.allocator()->allocate();

234

bias.allocator()->allocate();

235

dst.allocator()->allocate();

236

237

ARM_COMPUTE_EXPECT(!lhs.info()->is_resizable(), framework::LogLevel::ERRORS);

238

ARM_COMPUTE_EXPECT(!rhs.info()->is_resizable(), framework::LogLevel::ERRORS);

239

ARM_COMPUTE_EXPECT(!bias.info()->is_resizable(), framework::LogLevel::ERRORS);

240

ARM_COMPUTE_EXPECT(!dst.info()->is_resizable(), framework::LogLevel::ERRORS);

241

242

// Fill tensors

243

fill(AccessorType(lhs), 0);

244

fill(AccessorType(rhs), 1);

245

fill(AccessorType(bias), 2);

// Compute GEMM

gemm.run();

return dst;

}

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

253

SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, bool broadcast_bias,

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

254

const ActivationLayerInfo &act_info)

255

{

256

TensorShape dst_shape = lhs_shape;

257

dst_shape[0] = rhs_shape[0];

258

dst_shape[1] = lhs_shape[1];

259

260

// Create reference

261

SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };

262

SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };

263

SimpleTensor<T> bias{ dst_shape, data_type, 1 };

264

265

const int n = rhs_shape[0];

266

const int m = lhs_shape[1];

267

const int batch_size = lhs_shape[2];

// Fill reference

fill(lhs, 0);

fill(rhs, 1);

fill(bias, 2);

if(broadcast_bias)

{

// In case of broadcast, we need simply copy the first into the following "M" ones

277

for(int i = 1; i < m * batch_size; i++)

278

{

279

memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));

}

}

return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);

284

}

285

286

TensorType _target{};

287

SimpleTensor<T> _reference{};

288

};

289

290

template <typename TensorType, typename AccessorType, typename T, typename GEMMFunctionType>

291

class GEMMMatrixMultiply3DValidationFixture : public framework::Fixture

292

{

293

public:

294

template <typename...>

295

void setup(unsigned int m_w, unsigned int m_h, unsigned int n, unsigned int k, unsigned int batch_size, float alpha, float beta, bool broadcast_bias, bool fp16_mixed_precision,

296

const ActivationLayerInfo &act_info, DataType data_type, GPUTarget gpu_arch)

297

{

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

298

ARM_COMPUTE_UNUSED(broadcast_bias);

299

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

300

// In case of GEMM3D, m is the product between m_w and m_h

301

const unsigned int m = m_w * m_h;

302

303

// Set the tensor shapes for LHS and RHS matrices

304

const TensorShape lhs_shape(k, m, batch_size);

305

const TensorShape rhs_shape(n, k, batch_size);

306

const TensorShape bias_shape(n, 1, 1);

307

308

_target = compute_target(lhs_shape, rhs_shape, bias_shape, data_type, alpha, beta, m_h, fp16_mixed_precision, act_info, gpu_arch);

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

309

_reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, m_h, act_info);

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

}

protected:

template <typename U>

314

void fill(U &&tensor, int i)

315

{

316

std::uniform_real_distribution<> distribution(-1.0f, 1.0f);

317

library->fill(tensor, distribution, i);

318

}

319

320

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, DataType data_type, float alpha, float beta, unsigned int m_h,

321

bool fp16_mixed_precision, const ActivationLayerInfo &act_info, GPUTarget gpu_arch)

322

{

323

// Create tensors

324

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

325

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

326

TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);

327

TensorType dst;

328

329

const unsigned int m = lhs_shape[1];

330

const unsigned int n = rhs_shape[0];

331

const unsigned int k = lhs_shape[0];

332

GEMMReshapeInfo reshape_info(m, n, k, 1, 1, m_h, false, true);

333

334

// The output tensor will be auto-initialized within the function

335

336

// Create and configure function

337

GEMMFunctionType gemm;

338

gemm.configure(gpu_arch, &lhs, &rhs, &bias, &dst, alpha, beta, false, reshape_info, fp16_mixed_precision, act_info);

339

340

ARM_COMPUTE_EXPECT(lhs.info()->is_resizable(), framework::LogLevel::ERRORS);

341

ARM_COMPUTE_EXPECT(rhs.info()->is_resizable(), framework::LogLevel::ERRORS);

342

ARM_COMPUTE_EXPECT(bias.info()->is_resizable(), framework::LogLevel::ERRORS);

343

344

// Allocate tensors

345

lhs.allocator()->allocate();

346

rhs.allocator()->allocate();

347

bias.allocator()->allocate();

348

dst.allocator()->allocate();

349

350

ARM_COMPUTE_EXPECT(!lhs.info()->is_resizable(), framework::LogLevel::ERRORS);

351

ARM_COMPUTE_EXPECT(!rhs.info()->is_resizable(), framework::LogLevel::ERRORS);

352

ARM_COMPUTE_EXPECT(!bias.info()->is_resizable(), framework::LogLevel::ERRORS);

353

ARM_COMPUTE_EXPECT(!dst.info()->is_resizable(), framework::LogLevel::ERRORS);

354

355

// Fill tensors

356

fill(AccessorType(lhs), 0);

357

fill(AccessorType(rhs), 1);

358

fill(AccessorType(bias), 2);

// Compute GEMM

gemm.run();

return dst;

}

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

366

SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, unsigned int m_h,

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

367

const ActivationLayerInfo &act_info)

368

{

369

TensorShape dst_shape = lhs_shape;

370

dst_shape.set(0, rhs_shape[0]);

371

dst_shape.set(1, lhs_shape[1] / m_h);

372

dst_shape.set(2, m_h);

373

dst_shape.set(3, lhs_shape[2]);

374

375

// Create reference

376

SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };

377

SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };

378

SimpleTensor<T> bias{ dst_shape, data_type, 1 };

379

380

const int n = rhs_shape[0];

381

const int m = lhs_shape[1];

382

const int batch_size = lhs_shape[2];

// Fill reference

fill(lhs, 0);

fill(rhs, 1);

fill(bias, 2);

// In case of broadcast, we need simply copy the first into the following "M" ones

390

for(int i = 1; i < m * batch_size; i++)

391

{

392

memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));

393

}

394

395

return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);

396

}

397

398

TensorType _target{};

399

SimpleTensor<T> _reference{};

400

};

401

402

template <typename TensorType, typename AccessorType, typename T, typename ReshapeLHSFunctionType, typename ReshapeRHSFunctionType, typename GEMMFunctionType>

403

class GEMMMatrixMultiplyInterleavedTransposedValidationFixture : public framework::Fixture

404

{

405

public:

406

template <typename...>

407

void setup(unsigned int m, unsigned int n, unsigned int k, unsigned int batch_size, float alpha, float beta, unsigned int v0, unsigned int h0, bool broadcast_bias, bool fp16_mixed_precision,

408

const ActivationLayerInfo &act_info, DataType data_type, GPUTarget gpu_arch)

409

{

410

GEMMLHSMatrixInfo lhs_info;

lhs_info.m0 = 4;

lhs_info.k0 = 4;

lhs_info.v0 = v0;

lhs_info.interleave = true;

415

lhs_info.transpose = true;

416

417

GEMMRHSMatrixInfo rhs_info;

418

rhs_info.n0 = 16 / sizeof(T);

419

rhs_info.k0 = 1;

420

rhs_info.h0 = h0;

421

rhs_info.interleave = false;

422

rhs_info.transpose = false;

423

424

// Set the tensor shapes for LHS and RHS matrices

425

const TensorShape lhs_shape(k, m, batch_size);

426

const TensorShape rhs_shape(n, k, batch_size);

427

const TensorShape bias_shape(n,

428

broadcast_bias ? 1 : m,

429

broadcast_bias ? 1 : batch_size);

430

431

_target = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, broadcast_bias, fp16_mixed_precision, act_info, gpu_arch);

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

432

_reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, broadcast_bias, act_info);

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

}

protected:

template <typename U>

437

void fill(U &&tensor, int i)

438

{

439

std::uniform_real_distribution<> distribution(-1.0f, 1.0f);

440

library->fill(tensor, distribution, i);

441

442

// Fill border with infinity in order to check the presence of NaN values (i.e. inf * 0)

443

std::uniform_real_distribution<> distribution_inf(std::numeric_limits<float>::infinity(), std::numeric_limits<float>::infinity());

444

library->fill_borders_with_garbage(tensor, distribution_inf, i);

445

}

446

447

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,

448

DataType data_type, float alpha, float beta, bool broadcast_bias, bool fp16_mixed_precision, const ActivationLayerInfo &act_info, GPUTarget gpu_arch)

449

{

450

// Create tensors

451

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

452

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

453

TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);

454

TensorType lhs_reshaped;

455

TensorType rhs_reshaped;

456

TensorType dst;

457

458

const unsigned int m = lhs_shape[1];

459

const unsigned int n = rhs_shape[0];

460

const unsigned int k = lhs_shape[0];

461

GEMMReshapeInfo reshape_info(m, n, k, rhs_info.h0, lhs_info.v0, 0, false, broadcast_bias);

462

463

// The output tensor will be auto-initialized within the function

464

465

// Create and configure function

466

ReshapeLHSFunctionType reshape_lhs;

467

ReshapeRHSFunctionType reshape_rhs;

468

GEMMFunctionType gemm;

469

reshape_lhs.configure(&lhs, &lhs_reshaped, lhs_info);

470

reshape_rhs.configure(&rhs, &rhs_reshaped, rhs_info);

471

gemm.configure(gpu_arch, &lhs_reshaped, &rhs_reshaped, &bias, &dst, alpha, beta, true, reshape_info, fp16_mixed_precision, act_info);

472

473

ARM_COMPUTE_EXPECT(lhs.info()->is_resizable(), framework::LogLevel::ERRORS);

474

ARM_COMPUTE_EXPECT(rhs.info()->is_resizable(), framework::LogLevel::ERRORS);

475

ARM_COMPUTE_EXPECT(bias.info()->is_resizable(), framework::LogLevel::ERRORS);

476

477

// Allocate tensors

478

lhs.allocator()->allocate();

479

rhs.allocator()->allocate();

480

lhs_reshaped.allocator()->allocate();

481

rhs_reshaped.allocator()->allocate();

482

bias.allocator()->allocate();

483

dst.allocator()->allocate();

484

485

ARM_COMPUTE_EXPECT(!lhs.info()->is_resizable(), framework::LogLevel::ERRORS);

486

ARM_COMPUTE_EXPECT(!rhs.info()->is_resizable(), framework::LogLevel::ERRORS);

487

ARM_COMPUTE_EXPECT(!bias.info()->is_resizable(), framework::LogLevel::ERRORS);

488

ARM_COMPUTE_EXPECT(!lhs_reshaped.info()->is_resizable(), framework::LogLevel::ERRORS);

489

ARM_COMPUTE_EXPECT(!rhs_reshaped.info()->is_resizable(), framework::LogLevel::ERRORS);

490

ARM_COMPUTE_EXPECT(!dst.info()->is_resizable(), framework::LogLevel::ERRORS);

491

492

// Fill tensors

493

fill(AccessorType(lhs), 0);

494

fill(AccessorType(rhs), 1);

495

fill(AccessorType(bias), 2);

// Compute GEMM

reshape_lhs.run();

reshape_rhs.run();

gemm.run();

return dst;

}

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

505

SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, bool broadcast_bias,

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

506

const ActivationLayerInfo &act_info)

507

{

508

TensorShape dst_shape = lhs_shape;

509

dst_shape[0] = rhs_shape[0];

510

dst_shape[1] = lhs_shape[1];

511

512

// Create reference

513

SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };

514

SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };

515

SimpleTensor<T> bias{ dst_shape, data_type, 1 };

516

517

const int n = rhs_shape[0];

518

const int m = lhs_shape[1];

519

const int batch_size = lhs_shape[2];

// Fill reference

fill(lhs, 0);

fill(rhs, 1);

fill(bias, 2);

if(broadcast_bias)

{

// In case of broadcast, we need simply copy the first into the following "M" ones

529

for(int i = 1; i < m * batch_size; i++)

530

{

531

memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));

}

}

return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);

536

}

537

538

TensorType _target{};

539

SimpleTensor<T> _reference{};

540

};

541

542

template <typename TensorType, typename AccessorType, typename T, typename ReshapeLHSFunctionType, typename ReshapeRHSFunctionType, typename GEMMFunctionType>

543

class GEMMMatrixMultiplyInterleavedTransposed3DValidationFixture : public framework::Fixture

544

{

545

public:

546

template <typename...>

547

void setup(unsigned int m_w, unsigned int m_h, unsigned int n, unsigned int k, unsigned int batch_size, float alpha, float beta, unsigned int v0, unsigned int h0, bool broadcast_bias,

548

bool fp16_mixed_precision, const ActivationLayerInfo &act_info, DataType data_type, GPUTarget gpu_arch)

549

{

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

550

ARM_COMPUTE_UNUSED(broadcast_bias);

551

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

552

GEMMLHSMatrixInfo lhs_info;

lhs_info.m0 = 4;

lhs_info.k0 = 4;

lhs_info.v0 = v0;

lhs_info.interleave = true;

557

lhs_info.transpose = true;

558

559

GEMMRHSMatrixInfo rhs_info;

560

rhs_info.n0 = 16 / sizeof(T);

561

rhs_info.k0 = 1;

562

rhs_info.h0 = h0;

563

rhs_info.interleave = false;

564

rhs_info.transpose = false;

565

566

// In case of GEMM3D, m is the product between m_w and m_h

567

const unsigned int m = m_w * m_h;

568

569

// Set the tensor shapes for LHS and RHS matrices

570

const TensorShape lhs_shape(k, m, batch_size);

571

const TensorShape rhs_shape(n, k, batch_size);

572

const TensorShape bias_shape(n, 1, 1);

573

574

_target = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, m_h, fp16_mixed_precision, act_info, gpu_arch);

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

575

_reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, m_h, act_info);

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

}

protected:

template <typename U>

580

void fill(U &&tensor, int i)

581

{

582

std::uniform_real_distribution<> distribution(-1.0f, 1.0f);

583

library->fill(tensor, distribution, i);

584

}

585

586

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,

587

DataType data_type, float alpha, float beta, unsigned int m_h, bool fp16_mixed_precision, const ActivationLayerInfo &act_info, GPUTarget gpu_arch)

588

{

589

// Create tensors

590

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

591

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

592

TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);

593

TensorType lhs_reshaped;

594

TensorType rhs_reshaped;

595

TensorType dst;

596

597

const unsigned int m = lhs_shape[1];

598

const unsigned int n = rhs_shape[0];

599

const unsigned int k = lhs_shape[0];

600

GEMMReshapeInfo reshape_info(m, n, k, rhs_info.h0, lhs_info.v0, m_h, false, true);

601

602

// The output tensor will be auto-initialized within the function

603

604

// Create and configure function

605

ReshapeLHSFunctionType reshape_lhs;

606

ReshapeRHSFunctionType reshape_rhs;

607

GEMMFunctionType gemm;

608

reshape_lhs.configure(&lhs, &lhs_reshaped, lhs_info);

609

reshape_rhs.configure(&rhs, &rhs_reshaped, rhs_info);

610

gemm.configure(gpu_arch, &lhs_reshaped, &rhs_reshaped, &bias, &dst, alpha, beta, true, reshape_info, fp16_mixed_precision, act_info);

611

612

ARM_COMPUTE_EXPECT(lhs.info()->is_resizable(), framework::LogLevel::ERRORS);

613

ARM_COMPUTE_EXPECT(rhs.info()->is_resizable(), framework::LogLevel::ERRORS);

614

ARM_COMPUTE_EXPECT(bias.info()->is_resizable(), framework::LogLevel::ERRORS);

615

616

// Allocate tensors

617

lhs.allocator()->allocate();

618

rhs.allocator()->allocate();

619

lhs_reshaped.allocator()->allocate();

620

rhs_reshaped.allocator()->allocate();

621

bias.allocator()->allocate();

622

dst.allocator()->allocate();

623

624

ARM_COMPUTE_EXPECT(!lhs.info()->is_resizable(), framework::LogLevel::ERRORS);

625

ARM_COMPUTE_EXPECT(!rhs.info()->is_resizable(), framework::LogLevel::ERRORS);

626

ARM_COMPUTE_EXPECT(!lhs_reshaped.info()->is_resizable(), framework::LogLevel::ERRORS);

627

ARM_COMPUTE_EXPECT(!rhs_reshaped.info()->is_resizable(), framework::LogLevel::ERRORS);

628

ARM_COMPUTE_EXPECT(!bias.info()->is_resizable(), framework::LogLevel::ERRORS);

629

ARM_COMPUTE_EXPECT(!dst.info()->is_resizable(), framework::LogLevel::ERRORS);

630

631

// Fill tensors

632

fill(AccessorType(lhs), 0);

633

fill(AccessorType(rhs), 1);

634

fill(AccessorType(bias), 2);

// Compute GEMM

reshape_lhs.run();

reshape_rhs.run();

gemm.run();

return dst;

}

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

644

SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, unsigned int m_h,

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

645

const ActivationLayerInfo &act_info)

646

{

647

TensorShape dst_shape = lhs_shape;

648

dst_shape.set(0, rhs_shape[0]);

649

dst_shape.set(1, lhs_shape[1] / m_h);

650

dst_shape.set(2, m_h);

651

dst_shape.set(3, lhs_shape[2]);

652

653

// Create reference

654

SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };

655

SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };

656

SimpleTensor<T> bias{ dst_shape, data_type, 1 };

657

658

const int n = rhs_shape[0];

659

const int m = lhs_shape[1];

660

const int batch_size = lhs_shape[2];

// Fill reference

fill(lhs, 0);

fill(rhs, 1);

fill(bias, 2);

// In case of broadcast, we need simply copy the first into the following "M" ones

668

for(int i = 1; i < m * batch_size; i++)

669

{

670

memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));

671

}

672

673

return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);

674

}

675

676

TensorType _target{};

677

SimpleTensor<T> _reference{};

678

};

679

Gian Marco Iodice

2019-09-27 09:23:15 +0100

[diff] [blame]

680

template <typename TensorType, typename AccessorType, typename T, typename ReshapeLHSFunctionType, typename ReshapeRHSFunctionType, typename GEMMFunctionType, bool fp_mixed_precision = false>

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

681

class GEMMMatrixMultiplyReshapedValidationFixture : public framework::Fixture

682

{

683

public:

684

template <typename...>

685

void setup(unsigned int m, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0, unsigned int v0, unsigned int h0, bool interleave_lhs,

Gian Marco Iodice

2020-06-10 17:59:30 +0100

[diff] [blame]

686

bool interleave_rhs, bool export_to_cl_image, DataType data_type, float alpha, float beta, bool broadcast_bias, bool lhs_transpose, const ActivationLayerInfo &act_info)

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

687

{

688

GEMMLHSMatrixInfo lhs_info;

lhs_info.m0 = m0;

lhs_info.k0 = k0;

lhs_info.v0 = v0;

lhs_info.interleave = interleave_lhs;

Giorgio Arena

ae99b6e

2019-08-01 14:22:12 +0100

[diff] [blame]

693

lhs_info.transpose = lhs_transpose;

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

694

695

GEMMRHSMatrixInfo rhs_info;

Gian Marco Iodice

2020-06-10 17:59:30 +0100

[diff] [blame]

rhs_info.n0 = n0;

rhs_info.k0 = k0;

rhs_info.h0 = h0;

rhs_info.interleave = interleave_rhs;

700

rhs_info.transpose = !lhs_transpose;

701

rhs_info.export_to_cl_image = export_to_cl_image;

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

702

703

// Set the tensor shapes for LHS and RHS matrices

704

const TensorShape lhs_shape(k, m, batch_size);

705

const TensorShape rhs_shape(n, k, batch_size);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

706

const TensorShape bias_shape(n,

707

broadcast_bias ? 1 : m,

708

broadcast_bias ? 1 : batch_size);

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

709

Sheri Zhang

2020-11-16 21:17:28 +0000

[diff] [blame]

710

_target = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, broadcast_bias, act_info);

711

if(validate_result)

712

{

713

_reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, broadcast_bias, act_info);

714

}

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

}

protected:

template <typename U>

719

void fill(U &&tensor, int i)

720

{

721

std::uniform_real_distribution<> distribution(-1.0f, 1.0f);

722

library->fill(tensor, distribution, i);

Gian Marco Iodice

b87b95e

2019-01-21 17:14:31 +0000

[diff] [blame]

723

724

// Fill border with infinity in order to check the presence of NaN values (i.e. inf * 0)

725

std::uniform_real_distribution<> distribution_inf(std::numeric_limits<float>::infinity(), std::numeric_limits<float>::infinity());

726

library->fill_borders_with_garbage(tensor, distribution_inf, i);

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

727

}

728

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

729

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

730

DataType data_type, float alpha, float beta, bool broadcast_bias, const ActivationLayerInfo &act_info)

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

731

{

732

// Create tensors

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

733

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

734

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

735

TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

736

TensorType lhs_reshaped;

737

TensorType rhs_reshaped;

738

TensorType dst;

739

740

const unsigned int M = lhs_shape[1];

741

const unsigned int N = rhs_shape[0];

742

const unsigned int K = lhs_shape[0];

Gian Marco Iodice

2019-06-26 17:18:11 +0100

[diff] [blame]

743

GEMMKernelInfo kernel_info;

kernel_info.m = M;

kernel_info.n = N;

kernel_info.k = K;

kernel_info.depth_output_gemm3d = 0;

748

kernel_info.reinterpret_input_as_3d = false;

749

kernel_info.broadcast_bias = broadcast_bias;

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

750

kernel_info.activation_info = act_info;

Gian Marco Iodice

2019-09-27 09:23:15 +0100

[diff] [blame]

751

kernel_info.fp_mixed_precision = fp_mixed_precision;

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

752

753

// The output tensor will be auto-initialized within the function

754

755

// Create and configure function

756

ReshapeLHSFunctionType reshape_lhs;

757

ReshapeRHSFunctionType reshape_rhs;

758

GEMMFunctionType gemm;

Sheri Zhang

2020-11-16 21:17:28 +0000

[diff] [blame]

759

760

validate_result = bool(reshape_rhs.validate(rhs.info(), rhs_reshaped.info(), rhs_info));

761

validate_result = validate_result || !rhs_info.export_to_cl_image;

if(!validate_result)

{

return nullptr;

}

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

767

reshape_lhs.configure(&lhs, &lhs_reshaped, lhs_info);

768

reshape_rhs.configure(&rhs, &rhs_reshaped, rhs_info);

Gian Marco Iodice

2019-06-26 17:18:11 +0100

[diff] [blame]

769

gemm.configure(&lhs_reshaped, &rhs_reshaped, &bias, &dst, alpha, beta, lhs_info, rhs_info, kernel_info);

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

770

771

ARM_COMPUTE_EXPECT(lhs.info()->is_resizable(), framework::LogLevel::ERRORS);

772

ARM_COMPUTE_EXPECT(rhs.info()->is_resizable(), framework::LogLevel::ERRORS);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

773

ARM_COMPUTE_EXPECT(bias.info()->is_resizable(), framework::LogLevel::ERRORS);

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

774

775

// Allocate tensors

776

lhs.allocator()->allocate();

777

rhs.allocator()->allocate();

778

lhs_reshaped.allocator()->allocate();

779

rhs_reshaped.allocator()->allocate();

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

780

bias.allocator()->allocate();

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

781

dst.allocator()->allocate();

782

783

ARM_COMPUTE_EXPECT(!lhs.info()->is_resizable(), framework::LogLevel::ERRORS);

784

ARM_COMPUTE_EXPECT(!rhs.info()->is_resizable(), framework::LogLevel::ERRORS);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

785

ARM_COMPUTE_EXPECT(!bias.info()->is_resizable(), framework::LogLevel::ERRORS);

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

786

ARM_COMPUTE_EXPECT(!lhs_reshaped.info()->is_resizable(), framework::LogLevel::ERRORS);

787

ARM_COMPUTE_EXPECT(!rhs_reshaped.info()->is_resizable(), framework::LogLevel::ERRORS);

788

ARM_COMPUTE_EXPECT(!dst.info()->is_resizable(), framework::LogLevel::ERRORS);

789

790

// Fill tensors

791

fill(AccessorType(lhs), 0);

792

fill(AccessorType(rhs), 1);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

793

fill(AccessorType(bias), 2);

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

// Compute GEMM

reshape_lhs.run();

reshape_rhs.run();

gemm.run();

return dst;

}

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

803

SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, bool broadcast_bias,

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

804

const ActivationLayerInfo &act_info)

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

805

{

806

TensorShape dst_shape = lhs_shape;

807

dst_shape[0] = rhs_shape[0];

808

dst_shape[1] = lhs_shape[1];

809

810

// Create reference

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

811

SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };

812

SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

813

SimpleTensor<T> bias{ dst_shape, data_type, 1 };

814

815

const int n = rhs_shape[0];

816

const int m = lhs_shape[1];

817

const int batch_size = lhs_shape[2];

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

// Fill reference

fill(lhs, 0);

fill(rhs, 1);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

822

fill(bias, 2);

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

823

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

824

if(broadcast_bias)

825

{

826

// In case of broadcast, we need simply copy the first into the following "M" ones

827

for(int i = 1; i < m * batch_size; i++)

828

{

829

memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));

}

}

Gian Marco Iodice

2019-09-27 09:23:15 +0100

[diff] [blame]

833

if(fp_mixed_precision)

834

{

835

return reference::activation_layer(reference::gemm_mixed_precision<T>(lhs, rhs, bias, alpha, beta), act_info);

}

else

{

return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);

840

}

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

841

}

842

Sheri Zhang

2020-11-16 21:17:28 +0000

[diff] [blame]

843

bool validate_result = true;

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

844

TensorType _target{};

845

SimpleTensor<T> _reference{};

846

};

847

Gian Marco Iodice

2019-09-27 09:23:15 +0100

[diff] [blame]

848

template <typename TensorType, typename AccessorType, typename T, typename ReshapeLHSFunctionType, typename ReshapeRHSFunctionType, typename GEMMFunctionType, bool fp_mixed_precision = false>

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

849

class GEMMMatrixMultiplyReshaped3DValidationFixture : public framework::Fixture

850

{

851

public:

852

template <typename...>

853

void setup(unsigned int m_w, unsigned int m_h, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0, unsigned int v0, unsigned int h0,

Gian Marco Iodice

2020-06-10 17:59:30 +0100

[diff] [blame]

854

bool interleave_lhs, bool interleave_rhs, bool export_to_cl_image, DataType data_type, float alpha, float beta, bool lhs_transpose, const ActivationLayerInfo &act_info)

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

855

{

856

GEMMLHSMatrixInfo lhs_info;

lhs_info.m0 = m0;

lhs_info.k0 = k0;

lhs_info.v0 = v0;

lhs_info.interleave = interleave_lhs;

Giorgio Arena

ae99b6e

2019-08-01 14:22:12 +0100

[diff] [blame]

861

lhs_info.transpose = lhs_transpose;

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

862

863

GEMMRHSMatrixInfo rhs_info;

Gian Marco Iodice

2020-06-10 17:59:30 +0100

[diff] [blame]

rhs_info.n0 = n0;

rhs_info.k0 = k0;

rhs_info.h0 = h0;

rhs_info.interleave = interleave_rhs;

868

rhs_info.transpose = !lhs_transpose;

869

rhs_info.export_to_cl_image = export_to_cl_image;

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

870

871

// In case of GEMM3D, m is the product between m_w and m_h

872

const unsigned int m = m_w * m_h;

873

874

// Set the tensor shapes for LHS and RHS matrices

875

const TensorShape lhs_shape(k, m, batch_size);

876

const TensorShape rhs_shape(n, k, batch_size);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

877

const TensorShape bias_shape(n, 1, 1);

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

878

Sheri Zhang

2020-11-16 21:17:28 +0000

[diff] [blame]

879

_target = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, m_h, act_info);

880

if(validate_result)

881

{

882

_reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, m_h, act_info);

883

}

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

}

protected:

template <typename U>

888

void fill(U &&tensor, int i)

889

{

890

std::uniform_real_distribution<> distribution(-1.0f, 1.0f);

891

library->fill(tensor, distribution, i);

892

}

893

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

894

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

895

DataType data_type, float alpha, float beta, unsigned int m_h, const ActivationLayerInfo &act_info)

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

896

{

897

// Create tensors

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

898

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

899

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

900

TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

901

TensorType lhs_reshaped;

902

TensorType rhs_reshaped;

903

TensorType dst;

904

905

const unsigned int M = lhs_shape[1];

906

const unsigned int N = rhs_shape[0];

907

const unsigned int K = lhs_shape[0];

Gian Marco Iodice

2019-06-26 17:18:11 +0100

[diff] [blame]

908

GEMMKernelInfo kernel_info;

kernel_info.m = M;

kernel_info.n = N;

kernel_info.k = K;

kernel_info.depth_output_gemm3d = m_h;

913

kernel_info.reinterpret_input_as_3d = false;

914

kernel_info.broadcast_bias = true;

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

915

kernel_info.activation_info = act_info;

Gian Marco Iodice

2019-09-27 09:23:15 +0100

[diff] [blame]

916

kernel_info.fp_mixed_precision = fp_mixed_precision;

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

917

918

// The output tensor will be auto-initialized within the function

919

920

// Create and configure function

921

ReshapeLHSFunctionType reshape_lhs;

922

ReshapeRHSFunctionType reshape_rhs;

923

GEMMFunctionType gemm;

Sheri Zhang

2020-11-16 21:17:28 +0000

[diff] [blame]

924

925

validate_result = bool(reshape_rhs.validate(rhs.info(), rhs_reshaped.info(), rhs_info));

926

validate_result = validate_result || !rhs_info.export_to_cl_image;

if(!validate_result)

{

return nullptr;

}

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

932

reshape_lhs.configure(&lhs, &lhs_reshaped, lhs_info);

933

reshape_rhs.configure(&rhs, &rhs_reshaped, rhs_info);

Gian Marco Iodice

2019-06-26 17:18:11 +0100

[diff] [blame]

934

gemm.configure(&lhs_reshaped, &rhs_reshaped, &bias, &dst, alpha, beta, lhs_info, rhs_info, kernel_info);

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

935

936

ARM_COMPUTE_EXPECT(lhs.info()->is_resizable(), framework::LogLevel::ERRORS);

937

ARM_COMPUTE_EXPECT(rhs.info()->is_resizable(), framework::LogLevel::ERRORS);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

938

ARM_COMPUTE_EXPECT(bias.info()->is_resizable(), framework::LogLevel::ERRORS);

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

939

940

// Allocate tensors

941

lhs.allocator()->allocate();

942

rhs.allocator()->allocate();

943

lhs_reshaped.allocator()->allocate();

944

rhs_reshaped.allocator()->allocate();

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

945

bias.allocator()->allocate();

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

946

dst.allocator()->allocate();

947

948

ARM_COMPUTE_EXPECT(!lhs.info()->is_resizable(), framework::LogLevel::ERRORS);

949

ARM_COMPUTE_EXPECT(!rhs.info()->is_resizable(), framework::LogLevel::ERRORS);

950

ARM_COMPUTE_EXPECT(!lhs_reshaped.info()->is_resizable(), framework::LogLevel::ERRORS);

951

ARM_COMPUTE_EXPECT(!rhs_reshaped.info()->is_resizable(), framework::LogLevel::ERRORS);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

952

ARM_COMPUTE_EXPECT(!bias.info()->is_resizable(), framework::LogLevel::ERRORS);

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

953

ARM_COMPUTE_EXPECT(!dst.info()->is_resizable(), framework::LogLevel::ERRORS);

954

955

// Fill tensors

956

fill(AccessorType(lhs), 0);

957

fill(AccessorType(rhs), 1);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

958

fill(AccessorType(bias), 2);

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

// Compute GEMM

reshape_lhs.run();

reshape_rhs.run();

gemm.run();

return dst;

}

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

968

SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, unsigned int m_h,

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

969

const ActivationLayerInfo &act_info)

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

970

{

971

TensorShape dst_shape = lhs_shape;

972

dst_shape.set(0, rhs_shape[0]);

973

dst_shape.set(1, lhs_shape[1] / m_h);

974

dst_shape.set(2, m_h);

975

dst_shape.set(3, lhs_shape[2]);

976

977

// Create reference

978

SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };

979

SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

980

SimpleTensor<T> bias{ dst_shape, data_type, 1 };

981

982

const int n = rhs_shape[0];

983

const int m = lhs_shape[1];

984

const int batch_size = lhs_shape[2];

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

// Fill reference

fill(lhs, 0);

fill(rhs, 1);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

989

fill(bias, 2);

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

990

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

991

// In case of broadcast, we need simply copy the first into the following "M" ones

992

for(int i = 1; i < m * batch_size; i++)

993

{

994

memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));

995

}

996

Gian Marco Iodice

2019-09-27 09:23:15 +0100

[diff] [blame]

997

if(fp_mixed_precision)

998

{

999

return reference::activation_layer(reference::gemm_mixed_precision<T>(lhs, rhs, bias, alpha, beta), act_info);

}

else

{

return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);

1004

}

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

1005

}

1006

Sheri Zhang

2020-11-16 21:17:28 +0000

[diff] [blame]

1007

bool validate_result = true;

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

1008

TensorType _target{};

1009

SimpleTensor<T> _reference{};

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

1010

};

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1011

1012

template <typename TensorType, typename AccessorType, typename T, typename ReshapeRHSFunctionType, typename GEMMFunctionType>

1013

class GEMMMatrixMultiplyReshapedOnlyRHSValidationFixture : public framework::Fixture

1014

{

1015

public:

1016

template <typename...>

1017

void setup(unsigned int m, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0, unsigned int h0,

Gian Marco Iodice

781cba7

2020-06-19 16:56:57 +0100

[diff] [blame]

1018

bool interleave_rhs, bool transpose_rhs, bool export_to_cl_image, DataType data_type, float alpha, float beta, bool broadcast_bias, const ActivationLayerInfo &act_info)

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1019

{

1020

GEMMLHSMatrixInfo lhs_info;

lhs_info.m0 = m0;

lhs_info.k0 = k0;

GEMMRHSMatrixInfo rhs_info;

Gian Marco Iodice

781cba7

2020-06-19 16:56:57 +0100

[diff] [blame]

rhs_info.n0 = n0;

rhs_info.k0 = k0;

rhs_info.h0 = h0;

rhs_info.interleave = interleave_rhs;

1029

rhs_info.transpose = transpose_rhs;

1030

rhs_info.export_to_cl_image = export_to_cl_image;

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1031

1032

// Set the tensor shapes for LHS and RHS matrices

1033

const TensorShape lhs_shape(k, m, batch_size);

1034

const TensorShape rhs_shape(n, k, batch_size);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1035

const TensorShape bias_shape(n,

1036

broadcast_bias ? 1 : m,

1037

broadcast_bias ? 1 : batch_size);

Georgios Pinitas

2019-05-21 13:32:43 +0100

[diff] [blame]

1038

Sheri Zhang

2020-11-16 21:17:28 +0000

[diff] [blame]

1039

_target = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, broadcast_bias, act_info);

1040

if(validate_result)

1041

{

1042

_reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, broadcast_bias, act_info);

1043

}

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

}

protected:

template <typename U>

1048

void fill(U &&tensor, int i)

1049

{

1050

std::uniform_real_distribution<> distribution(-1.0f, 1.0f);

1051

library->fill(tensor, distribution, i);

1052

1053

// Fill border with infinity in order to check the presence of NaN values (i.e. inf * 0)

1054

std::uniform_real_distribution<> distribution_inf(std::numeric_limits<float>::infinity(), std::numeric_limits<float>::infinity());

1055

library->fill_borders_with_garbage(tensor, distribution_inf, i);

1056

}

1057

Georgios Pinitas

2019-05-21 13:32:43 +0100

[diff] [blame]

1058

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1059

DataType data_type, float alpha, float beta, bool broadcast_bias, const ActivationLayerInfo &act_info)

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1060

{

1061

// Create tensors

Georgios Pinitas

2019-05-21 13:32:43 +0100

[diff] [blame]

1062

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

1063

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

1064

TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1065

TensorType rhs_reshaped;

1066

TensorType dst;

1067

1068

const unsigned int M = lhs_shape[1];

1069

const unsigned int N = rhs_shape[0];

1070

const unsigned int K = lhs_shape[0];

Gian Marco Iodice

2019-06-26 17:18:11 +0100

[diff] [blame]

1071

GEMMKernelInfo kernel_info;

kernel_info.m = M;

kernel_info.n = N;

kernel_info.k = K;

kernel_info.depth_output_gemm3d = 0;

1076

kernel_info.reinterpret_input_as_3d = false;

1077

kernel_info.broadcast_bias = broadcast_bias;

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1078

kernel_info.activation_info = act_info;

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1079

1080

// The output tensor will be auto-initialized within the function

1081

1082

// Create and configure function

1083

ReshapeRHSFunctionType reshape_rhs;

1084

GEMMFunctionType gemm;

Sheri Zhang

2020-11-16 21:17:28 +0000

[diff] [blame]

1085

1086

validate_result = bool(reshape_rhs.validate(rhs.info(), rhs_reshaped.info(), rhs_info));

1087

validate_result = validate_result || !rhs_info.export_to_cl_image;

if(!validate_result)

{

return nullptr;

}

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1093

reshape_rhs.configure(&rhs, &rhs_reshaped, rhs_info);

Gian Marco Iodice

2019-06-26 17:18:11 +0100

[diff] [blame]

1094

gemm.configure(&lhs, &rhs_reshaped, &bias, &dst, alpha, beta, lhs_info, rhs_info, kernel_info);

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1095

1096

ARM_COMPUTE_EXPECT(lhs.info()->is_resizable(), framework::LogLevel::ERRORS);

1097

ARM_COMPUTE_EXPECT(rhs.info()->is_resizable(), framework::LogLevel::ERRORS);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1098

ARM_COMPUTE_EXPECT(bias.info()->is_resizable(), framework::LogLevel::ERRORS);

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1099

1100

// Allocate tensors

1101

lhs.allocator()->allocate();

1102

rhs.allocator()->allocate();

1103

rhs_reshaped.allocator()->allocate();

Georgios Pinitas

2019-05-21 13:32:43 +0100

[diff] [blame]

1104

bias.allocator()->allocate();

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1105

dst.allocator()->allocate();

1106

1107

ARM_COMPUTE_EXPECT(!lhs.info()->is_resizable(), framework::LogLevel::ERRORS);

1108

ARM_COMPUTE_EXPECT(!rhs.info()->is_resizable(), framework::LogLevel::ERRORS);

1109

ARM_COMPUTE_EXPECT(!rhs_reshaped.info()->is_resizable(), framework::LogLevel::ERRORS);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1110

ARM_COMPUTE_EXPECT(!bias.info()->is_resizable(), framework::LogLevel::ERRORS);

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1111

ARM_COMPUTE_EXPECT(!dst.info()->is_resizable(), framework::LogLevel::ERRORS);

1112

1113

// Fill tensors

1114

fill(AccessorType(lhs), 0);

1115

fill(AccessorType(rhs), 1);

Georgios Pinitas

2019-05-21 13:32:43 +0100

[diff] [blame]

1116

fill(AccessorType(bias), 2);

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

// Compute GEMM

reshape_rhs.run();

gemm.run();

return dst;

}

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

1125

SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, bool broadcast_bias,

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1126

const ActivationLayerInfo &act_info)

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1127

{

1128

TensorShape dst_shape = lhs_shape;

1129

dst_shape[0] = rhs_shape[0];

1130

dst_shape[1] = lhs_shape[1];

1131

1132

// Create reference

1133

SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };

1134

SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };

Georgios Pinitas

2019-05-21 13:32:43 +0100

[diff] [blame]

1135

SimpleTensor<T> bias{ dst_shape, data_type, 1 };

1136

1137

const int n = rhs_shape[0];

1138

const int m = lhs_shape[1];

1139

const int batch_size = lhs_shape[2];

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

// Fill reference

fill(lhs, 0);

fill(rhs, 1);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1144

fill(bias, 2);

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1145

Georgios Pinitas

2019-05-21 13:32:43 +0100

[diff] [blame]

1146

if(broadcast_bias)

1147

{

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1148

// In case of broadcast, we need simply copy the first into the following "M" ones

1149

for(int i = 1; i < m * batch_size; i++)

Georgios Pinitas

2019-05-21 13:32:43 +0100

[diff] [blame]

1150

{

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1151

memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));

Georgios Pinitas

2019-05-21 13:32:43 +0100

[diff] [blame]

1152

}

1153

}

Georgios Pinitas

2019-05-21 13:32:43 +0100

[diff] [blame]

1154

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1155

return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1156

}

1157

Sheri Zhang

2020-11-16 21:17:28 +0000

[diff] [blame]

1158

bool validate_result = true;

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1159

TensorType _target{};

1160

SimpleTensor<T> _reference{};

1161

};

1162

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1163

template <typename TensorType, typename AccessorType, typename T, typename ReshapeRHSFunctionType, typename GEMMFunctionType>

1164

class GEMMMatrixMultiplyReshapedOnlyRHS3DValidationFixture : public framework::Fixture

1165

{

1166

public:

1167

template <typename...>

1168

void setup(unsigned int m_w, unsigned int m_h, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0, unsigned int h0,

Gian Marco Iodice

2020-10-22 16:37:12 +0100

[diff] [blame]

1169

bool interleave_rhs, bool transpose_rhs, bool export_to_cl_image, bool has_pad_y, DataType data_type, float alpha, float beta, const ActivationLayerInfo &act_info)

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1170

{

1171

GEMMLHSMatrixInfo lhs_info;

lhs_info.m0 = m0;

lhs_info.k0 = k0;

GEMMRHSMatrixInfo rhs_info;

Gian Marco Iodice

781cba7

2020-06-19 16:56:57 +0100

[diff] [blame]

rhs_info.n0 = n0;

rhs_info.k0 = k0;

rhs_info.h0 = h0;

rhs_info.interleave = interleave_rhs;

1180

rhs_info.transpose = transpose_rhs;

1181

rhs_info.export_to_cl_image = export_to_cl_image;

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1182

1183

// In case of GEMM3D, m is the product between m_w and m_h

1184

const unsigned int m = m_w * m_h;

1185

1186

// Set the tensor shapes for LHS and RHS matrices

1187

const TensorShape lhs_shape(k, m, batch_size);

1188

const TensorShape rhs_shape(n, k, batch_size);

1189

const TensorShape bias_shape(n, 1, 1);

1190

Sheri Zhang

2020-11-16 21:17:28 +0000

[diff] [blame]

1191

_target = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, m_h, act_info, has_pad_y);

1192

if(validate_result)

1193

{

1194

_reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, m_h, act_info);

1195

}

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

}

protected:

template <typename U>

1200

void fill(U &&tensor, int i)

1201

{

1202

std::uniform_real_distribution<> distribution(-1.0f, 1.0f);

1203

library->fill(tensor, distribution, i);

1204

}

1205

1206

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,

1207

DataType data_type, float alpha, float beta,

Gian Marco Iodice

2020-10-22 16:37:12 +0100

[diff] [blame]

1208

unsigned int m_h, const ActivationLayerInfo &act_info, bool has_pad_y)

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1209

{

1210

// Create tensors

1211

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

1212

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

1213

TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);

1214

TensorType rhs_reshaped;

1215

TensorType dst;

1216

1217

const unsigned int M = lhs_shape[1];

1218

const unsigned int N = rhs_shape[0];

1219

const unsigned int K = lhs_shape[0];

Gian Marco Iodice

2019-06-26 17:18:11 +0100

[diff] [blame]

1220

GEMMKernelInfo kernel_info;

kernel_info.m = M;

kernel_info.n = N;

kernel_info.k = K;

kernel_info.depth_output_gemm3d = m_h;

1225

kernel_info.reinterpret_input_as_3d = false;

1226

kernel_info.broadcast_bias = true;

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1227

kernel_info.activation_info = act_info;

Gian Marco Iodice

2020-10-22 16:37:12 +0100

[diff] [blame]

1228

kernel_info.has_pad_y = has_pad_y;

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1229

1230

// The output tensor will be auto-initialized within the function

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1231

// Create and configure function

1232

ReshapeRHSFunctionType reshape_rhs;

1233

GEMMFunctionType gemm;

Sheri Zhang

2020-11-16 21:17:28 +0000

[diff] [blame]

1234

1235

validate_result = bool(reshape_rhs.validate(rhs.info(), rhs_reshaped.info(), rhs_info));

1236

validate_result = validate_result || !rhs_info.export_to_cl_image;

if(!validate_result)

{

return nullptr;

}

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1242

reshape_rhs.configure(&rhs, &rhs_reshaped, rhs_info);

Gian Marco Iodice

2019-06-26 17:18:11 +0100

[diff] [blame]

1243

gemm.configure(&lhs, &rhs_reshaped, &bias, &dst, alpha, beta, lhs_info, rhs_info, kernel_info);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1244

Gian Marco Iodice

2020-10-22 16:37:12 +0100

[diff] [blame]

1245

if(has_pad_y)

1246

{

1247

// Add dummy padding into lhs to validate has_pad_y path

1248

lhs.info()->extend_padding(PaddingSize(2, 0, 2, 0));

1249

dst.info()->extend_padding(PaddingSize(2, 0, 1, 0));

1250

}

1251

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1252

ARM_COMPUTE_EXPECT(lhs.info()->is_resizable(), framework::LogLevel::ERRORS);

1253

ARM_COMPUTE_EXPECT(rhs.info()->is_resizable(), framework::LogLevel::ERRORS);

1254

ARM_COMPUTE_EXPECT(bias.info()->is_resizable(), framework::LogLevel::ERRORS);

1255

1256

// Allocate tensors

1257

lhs.allocator()->allocate();

1258

rhs.allocator()->allocate();

1259

rhs_reshaped.allocator()->allocate();

1260

bias.allocator()->allocate();

1261

dst.allocator()->allocate();

1262

1263

ARM_COMPUTE_EXPECT(!lhs.info()->is_resizable(), framework::LogLevel::ERRORS);

1264

ARM_COMPUTE_EXPECT(!rhs.info()->is_resizable(), framework::LogLevel::ERRORS);

1265

ARM_COMPUTE_EXPECT(!rhs_reshaped.info()->is_resizable(), framework::LogLevel::ERRORS);

1266

ARM_COMPUTE_EXPECT(!bias.info()->is_resizable(), framework::LogLevel::ERRORS);

1267

ARM_COMPUTE_EXPECT(!dst.info()->is_resizable(), framework::LogLevel::ERRORS);

1268

1269

// Fill tensors

1270

fill(AccessorType(lhs), 0);

1271

fill(AccessorType(rhs), 1);

1272

fill(AccessorType(bias), 2);

// Compute GEMM

reshape_rhs.run();

gemm.run();

return dst;

}

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

1281

SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, unsigned int m_h,

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1282

const ActivationLayerInfo &act_info)

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1283

{

1284

TensorShape dst_shape = lhs_shape;

1285

dst_shape.set(0, rhs_shape[0]);

1286

dst_shape.set(1, lhs_shape[1] / m_h);

1287

dst_shape.set(2, m_h);

1288

dst_shape.set(3, lhs_shape[2]);

1289

1290

// Create reference

1291

SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };

1292

SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };

1293

SimpleTensor<T> bias{ dst_shape, data_type, 1 };

1294

1295

const int n = rhs_shape[0];

1296

const int m = lhs_shape[1];

1297

const int batch_size = lhs_shape[2];

// Fill reference

fill(lhs, 0);

fill(rhs, 1);

fill(bias, 2);

// In case of broadcast, we need simply copy the first into the following "M" ones

1305

for(int i = 1; i < m * batch_size; i++)

1306

{

1307

memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));

1308

}

1309

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1310

return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1311

}

1312

Sheri Zhang

2020-11-16 21:17:28 +0000

[diff] [blame]

1313

bool validate_result = true;

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1314

TensorType _target{};

1315

SimpleTensor<T> _reference{};

1316

};

1317

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1318

template <typename TensorType, typename AccessorType, typename T, typename GEMMFunctionType>

1319

class GEMMMatrixMultiplyNativeValidationFixture : public framework::Fixture

1320

{

1321

public:

1322

template <typename...>

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1323

void setup(unsigned int m, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0, DataType data_type, float alpha, float beta, bool broadcast_bias,

1324

const ActivationLayerInfo &act_info)

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1325

{

1326

GEMMLHSMatrixInfo lhs_info;

lhs_info.m0 = m0;

lhs_info.k0 = k0;

GEMMRHSMatrixInfo rhs_info;

rhs_info.n0 = n0;

rhs_info.k0 = k0;

// Set the tensor shapes for LHS and RHS matrices

1335

const TensorShape lhs_shape(k, m, batch_size);

1336

const TensorShape rhs_shape(n, k, batch_size);

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

1337

const TensorShape bias_shape(n,

1338

broadcast_bias ? 1 : m,

1339

broadcast_bias ? 1 : batch_size);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1340

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1341

_target = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, broadcast_bias, act_info);

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

1342

_reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, broadcast_bias, act_info);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

}

protected:

template <typename U>

1347

void fill(U &&tensor, int i)

1348

{

1349

std::uniform_real_distribution<> distribution(-1.0f, 1.0f);

1350

library->fill(tensor, distribution, i);

1351

1352

// Fill border with infinity in order to check the presence of NaN values (i.e. inf * 0)

1353

std::uniform_real_distribution<> distribution_inf(std::numeric_limits<float>::infinity(), std::numeric_limits<float>::infinity());

1354

library->fill_borders_with_garbage(tensor, distribution_inf, i);

1355

}

1356

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

1357

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1358

DataType data_type, float alpha, float beta, bool broadcast_bias, const ActivationLayerInfo &act_info)

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1359

{

1360

// Create tensors

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

1361

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

1362

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

1363

TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1364

TensorType dst;

1365

1366

const unsigned int M = lhs_shape[1];

1367

const unsigned int N = rhs_shape[0];

1368

const unsigned int K = lhs_shape[0];

Gian Marco Iodice

2019-06-26 17:18:11 +0100

[diff] [blame]

1369

GEMMKernelInfo kernel_info;

kernel_info.m = M;

kernel_info.n = N;

kernel_info.k = K;

kernel_info.depth_output_gemm3d = 0;

1374

kernel_info.reinterpret_input_as_3d = false;

1375

kernel_info.broadcast_bias = broadcast_bias;

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1376

kernel_info.activation_info = act_info;

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1377

1378

// Create and configure function

1379

GEMMFunctionType gemm;

Gian Marco Iodice

2019-06-26 17:18:11 +0100

[diff] [blame]

1380

gemm.configure(&lhs, &rhs, &bias, &dst, alpha, beta, lhs_info, rhs_info, kernel_info);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1381

1382

ARM_COMPUTE_EXPECT(lhs.info()->is_resizable(), framework::LogLevel::ERRORS);

1383

ARM_COMPUTE_EXPECT(rhs.info()->is_resizable(), framework::LogLevel::ERRORS);

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

1384

ARM_COMPUTE_EXPECT(bias.info()->is_resizable(), framework::LogLevel::ERRORS);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1385

1386

// Allocate tensors

1387

lhs.allocator()->allocate();

1388

rhs.allocator()->allocate();

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

1389

bias.allocator()->allocate();

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1390

dst.allocator()->allocate();

1391

1392

ARM_COMPUTE_EXPECT(!lhs.info()->is_resizable(), framework::LogLevel::ERRORS);

1393

ARM_COMPUTE_EXPECT(!rhs.info()->is_resizable(), framework::LogLevel::ERRORS);

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

1394

ARM_COMPUTE_EXPECT(!bias.info()->is_resizable(), framework::LogLevel::ERRORS);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1395

ARM_COMPUTE_EXPECT(!dst.info()->is_resizable(), framework::LogLevel::ERRORS);

1396

1397

// Fill tensors

1398

fill(AccessorType(lhs), 0);

1399

fill(AccessorType(rhs), 1);

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

1400

fill(AccessorType(bias), 2);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

// Compute GEMM

gemm.run();

return dst;

}

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

1408

SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, bool broadcast_bias,

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1409

const ActivationLayerInfo &act_info)

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1410

{

1411

TensorShape dst_shape = lhs_shape;

1412

dst_shape[0] = rhs_shape[0];

1413

dst_shape[1] = lhs_shape[1];

1414

1415

// Create reference

1416

SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };

1417

SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

1418

SimpleTensor<T> bias{ dst_shape, data_type, 1 };

1419

1420

const int n = rhs_shape[0];

1421

const int m = lhs_shape[1];

1422

const int batch_size = lhs_shape[2];

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

// Fill reference

fill(lhs, 0);

fill(rhs, 1);

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

1427

fill(bias, 2);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1428

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

1429

if(broadcast_bias)

1430

{

1431

// In case of broadcast, we need simply copy the first into the following "M" ones

1432

for(int i = 1; i < m * batch_size; i++)

1433

{

1434

memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));

}

}

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1438

return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1439

}

1440

1441

TensorType _target{};

1442

SimpleTensor<T> _reference{};

1443

};

1444

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1445

template <typename TensorType, typename AccessorType, typename T, typename GEMMFunctionType>

1446

class GEMMMatrixMultiplyNative3DValidationFixture : public framework::Fixture

1447

{

1448

public:

1449

template <typename...>

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1450

void setup(unsigned int m_w, unsigned int m_h, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0, DataType data_type, float alpha, float beta,

1451

const ActivationLayerInfo &act_info)

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1452

{

1453

GEMMLHSMatrixInfo lhs_info;

lhs_info.m0 = m0;

lhs_info.k0 = k0;

GEMMRHSMatrixInfo rhs_info;

rhs_info.n0 = n0;

rhs_info.k0 = k0;

// In case of GEMM3D, m is the product between m_w and m_h

1462

const unsigned int m = m_w * m_h;

1463

1464

// Set the tensor shapes for LHS and RHS matrices

1465

const TensorShape lhs_shape(k, m, batch_size);

1466

const TensorShape rhs_shape(n, k, batch_size);

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

1467

const TensorShape bias_shape(n, 1, 1);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1468

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1469

_target = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, m_h, act_info);

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

1470

_reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, m_h, act_info);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

}

protected:

template <typename U>

1475

void fill(U &&tensor, int i)

1476

{

1477

std::uniform_real_distribution<> distribution(-1.0f, 1.0f);

1478

library->fill(tensor, distribution, i);

1479

}

1480

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

1481

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1482

DataType data_type, float alpha, float beta, unsigned int m_h, const ActivationLayerInfo &act_info)

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1483

{

1484

// Create tensors

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

1485

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

1486

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

1487

TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1488

TensorType dst;

1489

1490

const unsigned int M = lhs_shape[1];

1491

const unsigned int N = rhs_shape[0];

1492

const unsigned int K = lhs_shape[0];

Gian Marco Iodice

2019-06-26 17:18:11 +0100

[diff] [blame]

1493

GEMMKernelInfo kernel_info;

kernel_info.m = M;

kernel_info.n = N;

kernel_info.k = K;

kernel_info.depth_output_gemm3d = m_h;

1498

kernel_info.reinterpret_input_as_3d = false;

1499

kernel_info.broadcast_bias = true;

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1500

kernel_info.activation_info = act_info;

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1501

1502

// The output tensor will be auto-initialized within the function

1503

1504

// Create and configure function

1505

GEMMFunctionType gemm;

Gian Marco Iodice

2019-06-26 17:18:11 +0100

[diff] [blame]

1506

gemm.configure(&lhs, &rhs, &bias, &dst, alpha, beta, lhs_info, rhs_info, kernel_info);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1507

1508

ARM_COMPUTE_EXPECT(lhs.info()->is_resizable(), framework::LogLevel::ERRORS);

1509

ARM_COMPUTE_EXPECT(rhs.info()->is_resizable(), framework::LogLevel::ERRORS);

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

1510

ARM_COMPUTE_EXPECT(bias.info()->is_resizable(), framework::LogLevel::ERRORS);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1511

1512

// Allocate tensors

1513

lhs.allocator()->allocate();

1514

rhs.allocator()->allocate();

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

1515

bias.allocator()->allocate();

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1516

dst.allocator()->allocate();

1517

1518

ARM_COMPUTE_EXPECT(!lhs.info()->is_resizable(), framework::LogLevel::ERRORS);

1519

ARM_COMPUTE_EXPECT(!rhs.info()->is_resizable(), framework::LogLevel::ERRORS);

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

1520

ARM_COMPUTE_EXPECT(!bias.info()->is_resizable(), framework::LogLevel::ERRORS);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1521

ARM_COMPUTE_EXPECT(!dst.info()->is_resizable(), framework::LogLevel::ERRORS);

1522

1523

// Fill tensors

1524

fill(AccessorType(lhs), 0);

1525

fill(AccessorType(rhs), 1);

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

1526

fill(AccessorType(bias), 2);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

// Compute GEMM

gemm.run();

return dst;

}

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

1534

SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, unsigned int m_h,

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1535

const ActivationLayerInfo &act_info)

giuros01