/*
 * Copyright (c) 2017-2021 Arm Limited.
 *
 * SPDX-License-Identifier: MIT
 *
 * Permission is hereby granted, free of charge, to any person obtaining a copy
 * of this software and associated documentation files (the "Software"), to
 * deal in the Software without restriction, including without limitation the
 * rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
 * sell copies of the Software, and to permit persons to whom the Software is
 * furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in all
 * copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
 * SOFTWARE.
 */
#ifndef ARM_COMPUTE_TEST_GEMM_FIXTURE
#define ARM_COMPUTE_TEST_GEMM_FIXTURE

#include "arm_compute/core/KernelDescriptors.h"
#include "arm_compute/core/TensorShape.h"
#include "arm_compute/core/Types.h"
#include "arm_compute/core/experimental/IPostOp.h"
#include "src/core/experimental/PostOpUtils.h"
#include "tests/AssetsLibrary.h"
#include "tests/Globals.h"
#include "tests/IAccessor.h"
#include "tests/framework/Asserts.h"
#include "tests/framework/Fixture.h"
#include "tests/validation/Helpers.h"
#include "tests/validation/reference/ActivationLayer.h"
#include "tests/validation/reference/ElementwiseOperations.h"
#include "tests/validation/reference/GEMM.h"
#include "tests/validation/reference/PostOps.h"

#include <random>

namespace arm_compute
{
namespace test
{
namespace validation
{
template <typename TensorType, typename AccessorType, typename FunctionType, typename T, bool disable_c = false, bool reinterpret_input_as_3d = false, bool reinterpret_output_as_3d = false>
class GEMMValidationFixture : public framework::Fixture
{
public:
    template <typename...>
    void setup(TensorShape shape_a, TensorShape shape_b, TensorShape shape_c, TensorShape output_shape, float alpha, float beta, bool pretranspose, DataType data_type)
    {
        ARM_COMPUTE_UNUSED(pretranspose);
        _target    = compute_target(shape_a, shape_b, shape_c, output_shape, alpha, beta, data_type);
        _reference = compute_reference(shape_a, shape_b, output_shape, alpha, beta, data_type);
    }

protected:
    template <typename U>
    void fill(U &&tensor, int i, float lo = -1.f, float hi = 1.f)
    {
        switch(tensor.data_type())
        {
            case DataType::F16:
            {
                arm_compute::utils::uniform_real_distribution_16bit<half> distribution{ float(lo), float(hi) };
                library->fill(tensor, distribution, i);
                break;
            }
            case DataType::F32:
            {
                std::uniform_real_distribution<float> distribution(lo, hi);
                library->fill(tensor, distribution, i);
                break;
            }
            default:
                library->fill_tensor_uniform(tensor, i);
        }
    }

    TensorType compute_target(const TensorShape &shape_a, const TensorShape &shape_b, const TensorShape &shape_c, const TensorShape &output_shape, float alpha, float beta,
                              DataType data_type)
    {
        // Create tensors
        TensorType a   = create_tensor<TensorType>(shape_a, data_type, 1);
        TensorType b   = create_tensor<TensorType>(shape_b, data_type, 1);
        TensorType c   = create_tensor<TensorType>(shape_c, data_type, 1);
        TensorType dst = create_tensor<TensorType>(output_shape, data_type, 1);

        // Create and configure function
        FunctionType gemm;
        // The GEMMInfo includes the value of the depth in case of a reinterpreted 3D output.
        // If the output shape has the same number of dimensions as the input, a 2D matrix multiplication is run (depth_output_reinterpreted_as_3D = 0);
        // otherwise the reinterpreted version of GEMM is used (depth_output_reinterpreted_as_3D = depth of the 3D output).
        gemm.configure(&a,
                       &b,
                       (disable_c) ? nullptr : &c,
                       &dst,
                       alpha, beta,
                       GEMMInfo(false, false, false, (reinterpret_output_as_3d ? output_shape[2] : 0), reinterpret_input_as_3d, false, GEMMLowpOutputStageInfo(), false, false, (reinterpret_input_as_3d
                                || reinterpret_output_as_3d)));
        ARM_COMPUTE_ASSERT(a.info()->is_resizable());
        ARM_COMPUTE_ASSERT(b.info()->is_resizable());
        ARM_COMPUTE_ASSERT(c.info()->is_resizable());
        ARM_COMPUTE_ASSERT(dst.info()->is_resizable());

        add_padding_x({ &a, &b, &c, &dst });

        // Allocate tensors
        a.allocator()->allocate();
        b.allocator()->allocate();
        c.allocator()->allocate();
        dst.allocator()->allocate();

        ARM_COMPUTE_ASSERT(!a.info()->is_resizable());
        ARM_COMPUTE_ASSERT(!b.info()->is_resizable());
        ARM_COMPUTE_ASSERT(!c.info()->is_resizable());
        ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());

        // Fill tensors
        fill(AccessorType(a), 0);
        fill(AccessorType(b), 1);
        if(!disable_c)
        {
            fill(AccessorType(c), 2);
        }

        // Compute GEMM function
        gemm.run();

        return dst;
    }

    SimpleTensor<T> compute_reference(const TensorShape &shape_a, const TensorShape &shape_b, const TensorShape &output_shape, float alpha, float beta,
                                      DataType data_type)
    {
        TensorShape shape_a_to_use = shape_a;

        if(reinterpret_input_as_3d)
        {
            // Collapse the second and third dimension if the input is 3D
            shape_a_to_use.collapse(2U, 1U);
        }

        // Create reference
        SimpleTensor<T> a{ shape_a_to_use, data_type, 1 };
        SimpleTensor<T> b{ shape_b, data_type, 1 };
        SimpleTensor<T> c{ output_shape, data_type, 1 };

        // Fill reference
        fill(a, 0);
        fill(b, 1);
        fill(c, 2);

        if(reinterpret_input_as_3d || reinterpret_output_as_3d)
        {
            const int n          = shape_b[0];
            const int m          = reinterpret_output_as_3d ? output_shape[1] * output_shape[2] : output_shape[1];
            const int batch_size = reinterpret_output_as_3d ? output_shape[3] : output_shape[2];

            // In case of broadcast, we simply need to copy the first row into the following "M" ones
            for(int i = 1; i < m * batch_size; i++)
            {
                memcpy(c.data() + i * n, c.data(), n * sizeof(T));
            }
        }

        // Setting beta to 0 will effectively disable C for the
        // computation of the reference: alpha * A * B + 0 * C
        return reference::gemm<T>(a, b, c, alpha, disable_c ? 0.f : beta);
    }

    TensorType      _target{};
    SimpleTensor<T> _reference{};
};
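
// Usage sketch (illustrative only, not part of this header): a backend test suite typically instantiates the
// fixture above through an alias and drives setup() from a dataset. The CL type names below are an assumption
// about how a caller would wire it up, not something this file defines:
//
//   template <typename T>
//   using CLGEMMFixture = GEMMValidationFixture<CLTensor, CLAccessor, CLGEMM, T>;
//
// The framework then calls setup(shape_a, shape_b, shape_c, output_shape, alpha, beta, pretranspose, data_type)
// for every dataset entry and compares _target against _reference with a data-type dependent tolerance.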

template <typename TensorType, typename AccessorType, typename T, typename GEMMOperatorType>
class GEMMMatrixMultiplyValidationFixture : public framework::Fixture
{
public:
    template <typename...>
    void setup(unsigned int m, unsigned int n, unsigned int k, unsigned int batch_size, float alpha, float beta, bool broadcast_bias, bool fp16_mixed_precision, const ActivationLayerInfo &act_info,
               DataType data_type, GPUTarget gpu_arch)
    {
        // Set the tensor shapes for LHS and RHS matrices
        const TensorShape lhs_shape(k, m, batch_size);
        const TensorShape rhs_shape(n, k, batch_size);
        const TensorShape bias_shape(n,
                                     broadcast_bias ? 1 : m,
                                     broadcast_bias ? 1 : batch_size);

        _target    = compute_target(lhs_shape, rhs_shape, bias_shape, data_type, alpha, beta, broadcast_bias, fp16_mixed_precision, act_info, gpu_arch);
        _reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, broadcast_bias, act_info);
    }

protected:
    template <typename U>
    void fill(U &&tensor, int i)
    {
        static_assert(std::is_floating_point<T>::value || std::is_same<T, half>::value, "Only floating point data types supported.");
        using DistributionType = typename std::conditional<std::is_same<T, half>::value, arm_compute::utils::uniform_real_distribution_16bit<T>, std::uniform_real_distribution<T>>::type;

        DistributionType distribution{ T(-1.0f), T(1.0f) };
        library->fill(tensor, distribution, i);

        // Fill border with infinity in order to check the presence of NaN values (i.e. inf * 0)
        DistributionType distribution_inf{ T(std::numeric_limits<float>::infinity()), T(std::numeric_limits<float>::infinity()) };
        library->fill_borders_with_garbage(tensor, distribution_inf, i);
    }

    TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, DataType data_type, float alpha, float beta, bool broadcast_bias,
                              bool fp16_mixed_precision, const ActivationLayerInfo &act_info, GPUTarget gpu_arch)
    {
        // Create tensors
        TensorType lhs  = create_tensor<TensorType>(lhs_shape, data_type, 1);
        TensorType rhs  = create_tensor<TensorType>(rhs_shape, data_type, 1);
        TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);
        TensorType dst;

        const unsigned int m = lhs_shape[1];
        const unsigned int n = rhs_shape[0];
        const unsigned int k = lhs_shape[0];
        GEMMReshapeInfo reshape_info(m, n, k, 1, 1, 0, false, broadcast_bias);

        // The output tensor will be auto-initialized within the function

        // Create and configure function
        GEMMOperatorType gemm;
        gemm.configure(gpu_arch, lhs.info(), rhs.info(), bias.info(), dst.info(), alpha, beta, false, reshape_info, fp16_mixed_precision, act_info);

        ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());
        ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());
        ARM_COMPUTE_ASSERT(bias.info()->is_resizable());

        add_padding_x({ &lhs, &rhs, &bias, &dst });

        // Allocate tensors
        lhs.allocator()->allocate();
        rhs.allocator()->allocate();
        bias.allocator()->allocate();
        dst.allocator()->allocate();

        ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());
        ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());
        ARM_COMPUTE_ASSERT(!bias.info()->is_resizable());
        ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());

        // Fill tensors
        fill(AccessorType(lhs), 0);
        fill(AccessorType(rhs), 1);
        fill(AccessorType(bias), 2);

        // Compute GEMM
        ITensorPack gemm_pack({ { ACL_SRC_0, &lhs },
            { ACL_SRC_1, &rhs },
            { ACL_SRC_2, &bias },
            { ACL_DST, &dst }
        });
        gemm.run(gemm_pack);

        return dst;
    }

    SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, bool broadcast_bias,
                                      const ActivationLayerInfo &act_info)
    {
        TensorShape dst_shape = lhs_shape;
        dst_shape[0]          = rhs_shape[0];
        dst_shape[1]          = lhs_shape[1];

        // Create reference
        SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };
        SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };
        SimpleTensor<T> bias{ dst_shape, data_type, 1 };

        const int n          = rhs_shape[0];
        const int m          = lhs_shape[1];
        const int batch_size = lhs_shape[2];

        // Fill reference
        fill(lhs, 0);
        fill(rhs, 1);
        fill(bias, 2);

        if(broadcast_bias)
        {
            // In case of broadcast, we simply need to copy the first row into the following "M" ones
            for(int i = 1; i < m * batch_size; i++)
            {
                memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));
            }
        }

        return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);
    }

    TensorType      _target{};
    SimpleTensor<T> _reference{};
};
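
// Shape convention shared by the fixtures in this file: TensorShape lists dimensions as (width, height,
// batches), so for dst = act(alpha * lhs * rhs + beta * bias) with lhs of size M x K and rhs of size K x N:
//   lhs_shape = (k, m, batch_size), rhs_shape = (n, k, batch_size), dst_shape = (n, m, batch_size).
// For example, m = 64, n = 32, k = 128, batch_size = 2 gives lhs_shape = (128, 64, 2) and
// rhs_shape = (32, 128, 2). With broadcast_bias the bias is stored as a single (n, 1, 1) row that
// compute_reference() replicates across the m * batch_size output rows before calling reference::gemm.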

template <typename TensorType, typename AccessorType, typename T, typename GEMMOperatorType>
class GEMMMatrixMultiply3DValidationFixture : public framework::Fixture
{
public:
    template <typename...>
    void setup(unsigned int m_w, unsigned int m_h, unsigned int n, unsigned int k, unsigned int batch_size, float alpha, float beta, bool broadcast_bias, bool fp16_mixed_precision,
               const ActivationLayerInfo &act_info, DataType data_type, GPUTarget gpu_arch)
    {
        ARM_COMPUTE_UNUSED(broadcast_bias);

        // In case of GEMM3D, m is the product between m_w and m_h
        const unsigned int m = m_w * m_h;

        // Set the tensor shapes for LHS and RHS matrices
        const TensorShape lhs_shape(k, m, batch_size);
        const TensorShape rhs_shape(n, k, batch_size);
        const TensorShape bias_shape(n, 1, 1);

        _target    = compute_target(lhs_shape, rhs_shape, bias_shape, data_type, alpha, beta, m_h, fp16_mixed_precision, act_info, gpu_arch);
        _reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, m_h, act_info);
    }

protected:
    template <typename U>
    void fill(U &&tensor, int i)
    {
        static_assert(std::is_floating_point<T>::value || std::is_same<T, half>::value, "Only floating point data types supported.");
        using DistributionType = typename std::conditional<std::is_same<T, half>::value, arm_compute::utils::uniform_real_distribution_16bit<T>, std::uniform_real_distribution<T>>::type;

        DistributionType distribution{ T(-1.0f), T(1.0f) };
        library->fill(tensor, distribution, i);
    }

    TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, DataType data_type, float alpha, float beta, unsigned int m_h,
                              bool fp16_mixed_precision, const ActivationLayerInfo &act_info, GPUTarget gpu_arch)
    {
        // Create tensors
        TensorType lhs  = create_tensor<TensorType>(lhs_shape, data_type, 1);
        TensorType rhs  = create_tensor<TensorType>(rhs_shape, data_type, 1);
        TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);
        TensorType dst;

        const unsigned int m = lhs_shape[1];
        const unsigned int n = rhs_shape[0];
        const unsigned int k = lhs_shape[0];
        GEMMReshapeInfo reshape_info(m, n, k, 1, 1, m_h, false, true);

        // The output tensor will be auto-initialized within the function

        // Create and configure function
        GEMMOperatorType gemm;
        gemm.configure(gpu_arch, lhs.info(), rhs.info(), bias.info(), dst.info(), alpha, beta, false, reshape_info, fp16_mixed_precision, act_info);

        ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());
        ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());
        ARM_COMPUTE_ASSERT(bias.info()->is_resizable());

        add_padding_x({ &lhs, &rhs, &bias, &dst });

        // Allocate tensors
        lhs.allocator()->allocate();
        rhs.allocator()->allocate();
        bias.allocator()->allocate();
        dst.allocator()->allocate();

        ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());
        ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());
        ARM_COMPUTE_ASSERT(!bias.info()->is_resizable());
        ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());

        // Fill tensors
        fill(AccessorType(lhs), 0);
        fill(AccessorType(rhs), 1);
        fill(AccessorType(bias), 2);

        // Compute GEMM
        ITensorPack gemm_pack({ { ACL_SRC_0, &lhs },
            { ACL_SRC_1, &rhs },
            { ACL_SRC_2, &bias },
            { ACL_DST, &dst }
        });
        gemm.run(gemm_pack);

        return dst;
    }

    SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, unsigned int m_h,
                                      const ActivationLayerInfo &act_info)
    {
        TensorShape dst_shape = lhs_shape;
        dst_shape.set(0, rhs_shape[0]);
        dst_shape.set(1, lhs_shape[1] / m_h);
        dst_shape.set(2, m_h);
        dst_shape.set(3, lhs_shape[2]);

        // Create reference
        SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };
        SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };
        SimpleTensor<T> bias{ dst_shape, data_type, 1 };

        const int n          = rhs_shape[0];
        const int m          = lhs_shape[1];
        const int batch_size = lhs_shape[2];

        // Fill reference
        fill(lhs, 0);
        fill(rhs, 1);
        fill(bias, 2);

        // In case of broadcast, we simply need to copy the first row into the following "M" ones
        for(int i = 1; i < m * batch_size; i++)
        {
            memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));
        }

        return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);
    }

    TensorType      _target{};
    SimpleTensor<T> _reference{};
};
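
// GEMM3D note: the "3D" fixtures flatten the two output spatial dimensions into a single M = m_w * m_h for
// the matrix multiplication. compute_reference() declares its destination with the reinterpreted shape
// (n, m_w, m_h, batch_size); since the element ordering of the flattened and reinterpreted layouts is the
// same, the plain 2D reference GEMM is enough to validate the 3D-output path of the target function.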

template <typename TensorType, typename AccessorType, typename T, typename ReshapeLHSOperatorType, typename ReshapeRHSOperatorType, typename GEMMOperatorType>
class GEMMMatrixMultiplyInterleavedTransposedValidationFixture : public framework::Fixture
{
public:
    template <typename...>
    void setup(unsigned int m, unsigned int n, unsigned int k, unsigned int batch_size, float alpha, float beta, unsigned int v0, unsigned int h0, bool broadcast_bias, bool fp16_mixed_precision,
               const ActivationLayerInfo &act_info, DataType data_type, GPUTarget gpu_arch)
    {
        GEMMLHSMatrixInfo lhs_info;
        lhs_info.m0         = 4;
        lhs_info.k0         = 4;
        lhs_info.v0         = v0;
        lhs_info.interleave = true;
        lhs_info.transpose  = true;

        GEMMRHSMatrixInfo rhs_info;
        rhs_info.n0         = 16 / sizeof(T);
        rhs_info.k0         = 1;
        rhs_info.h0         = h0;
        rhs_info.interleave = false;
        rhs_info.transpose  = false;

        // Set the tensor shapes for LHS and RHS matrices
        const TensorShape lhs_shape(k, m, batch_size);
        const TensorShape rhs_shape(n, k, batch_size);
        const TensorShape bias_shape(n,
                                     broadcast_bias ? 1 : m,
                                     broadcast_bias ? 1 : batch_size);

        _target    = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, broadcast_bias, fp16_mixed_precision, act_info, gpu_arch);
        _reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, broadcast_bias, act_info);
    }

protected:
    template <typename U>
    void fill(U &&tensor, int i)
    {
        static_assert(std::is_floating_point<T>::value || std::is_same<T, half>::value, "Only floating point data types supported.");
        using DistributionType = typename std::conditional<std::is_same<T, half>::value, arm_compute::utils::uniform_real_distribution_16bit<T>, std::uniform_real_distribution<T>>::type;

        DistributionType distribution{ T(-1.0f), T(1.0f) };
        library->fill(tensor, distribution, i);

        // Fill border with infinity in order to check the presence of NaN values (i.e. inf * 0)
        DistributionType distribution_inf{ T(std::numeric_limits<float>::infinity()), T(std::numeric_limits<float>::infinity()) };
        library->fill_borders_with_garbage(tensor, distribution_inf, i);
    }

    TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,
                              DataType data_type, float alpha, float beta, bool broadcast_bias, bool fp16_mixed_precision, const ActivationLayerInfo &act_info, GPUTarget gpu_arch)
    {
        // Create tensors
        TensorType lhs  = create_tensor<TensorType>(lhs_shape, data_type, 1);
        TensorType rhs  = create_tensor<TensorType>(rhs_shape, data_type, 1);
        TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);
        TensorType lhs_reshaped;
        TensorType rhs_reshaped;
        TensorType dst;

        const unsigned int m = lhs_shape[1];
        const unsigned int n = rhs_shape[0];
        const unsigned int k = lhs_shape[0];
        GEMMReshapeInfo reshape_info(m, n, k, rhs_info.h0, lhs_info.v0, 0, false, broadcast_bias);

        // The output tensor will be auto-initialized within the function

        // Create and configure function
        ReshapeLHSOperatorType reshape_lhs;
        ReshapeRHSOperatorType reshape_rhs;
        GEMMOperatorType       gemm;
        reshape_lhs.configure(lhs.info(), lhs_reshaped.info(), lhs_info);
        reshape_rhs.configure(rhs.info(), rhs_reshaped.info(), rhs_info);
        gemm.configure(gpu_arch, lhs_reshaped.info(), rhs_reshaped.info(), bias.info(), dst.info(), alpha, beta, true, reshape_info, fp16_mixed_precision, act_info);

        ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());
        ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());
        ARM_COMPUTE_ASSERT(bias.info()->is_resizable());

        // We do not pad when using image as it needs to comply with strict pitch alignment restrictions
        if(!rhs_info.export_to_cl_image)
        {
            add_padding_x({ &lhs, &rhs, &lhs_reshaped, &rhs_reshaped, &bias, &dst });
        }

        // Allocate tensors
        lhs.allocator()->allocate();
        rhs.allocator()->allocate();
        lhs_reshaped.allocator()->allocate();
        rhs_reshaped.allocator()->allocate();
        bias.allocator()->allocate();
        dst.allocator()->allocate();

        ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());
        ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());
        ARM_COMPUTE_ASSERT(!bias.info()->is_resizable());
        ARM_COMPUTE_ASSERT(!lhs_reshaped.info()->is_resizable());
        ARM_COMPUTE_ASSERT(!rhs_reshaped.info()->is_resizable());
        ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());

        // Fill tensors
        fill(AccessorType(lhs), 0);
        fill(AccessorType(rhs), 1);
        fill(AccessorType(bias), 2);

        // Compute GEMM
        ITensorPack reshape_lhs_pack = { { ACL_SRC, &lhs }, { ACL_DST, &lhs_reshaped } };
        reshape_lhs.run(reshape_lhs_pack);
        ITensorPack reshape_rhs_pack = { { ACL_SRC, &rhs }, { ACL_DST, &rhs_reshaped } };
        reshape_rhs.run(reshape_rhs_pack);
        ITensorPack gemm_pack({ { ACL_SRC_0, &lhs_reshaped },
            { ACL_SRC_1, &rhs_reshaped },
            { ACL_SRC_2, &bias },
            { ACL_DST, &dst }
        });
        gemm.run(gemm_pack);

        return dst;
    }

    SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, bool broadcast_bias,
                                      const ActivationLayerInfo &act_info)
    {
        TensorShape dst_shape = lhs_shape;
        dst_shape[0]          = rhs_shape[0];
        dst_shape[1]          = lhs_shape[1];

        // Create reference
        SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };
        SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };
        SimpleTensor<T> bias{ dst_shape, data_type, 1 };

        const int n          = rhs_shape[0];
        const int m          = lhs_shape[1];
        const int batch_size = lhs_shape[2];

        // Fill reference
        fill(lhs, 0);
        fill(rhs, 1);
        fill(bias, 2);

        if(broadcast_bias)
        {
            // In case of broadcast, we simply need to copy the first row into the following "M" ones
            for(int i = 1; i < m * batch_size; i++)
            {
                memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));
            }
        }

        return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);
    }

    TensorType      _target{};
    SimpleTensor<T> _reference{};
};
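
// Reshape parameters used by the interleaved/transposed and reshaped fixtures (a rough summary of the
// GEMMLHSMatrixInfo / GEMMRHSMatrixInfo fields they fill in): m0, n0 and k0 are the block sizes processed
// along M, N and K; v0 is the number of (m0 x k0) vertical blocks interleaved on one row of the reshaped
// LHS, and h0 the number of (k0 x n0) horizontal blocks on one row of the reshaped RHS. The choice
// rhs_info.n0 = 16 / sizeof(T) above keeps each RHS block 16 bytes wide regardless of the element type.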

template <typename TensorType, typename AccessorType, typename T, typename ReshapeLHSOperatorType, typename ReshapeRHSOperatorType, typename GEMMOperatorType>
class GEMMMatrixMultiplyInterleavedTransposed3DValidationFixture : public framework::Fixture
{
public:
    template <typename...>
    void setup(unsigned int m_w, unsigned int m_h, unsigned int n, unsigned int k, unsigned int batch_size, float alpha, float beta, unsigned int v0, unsigned int h0, bool broadcast_bias,
               bool fp16_mixed_precision, const ActivationLayerInfo &act_info, DataType data_type, GPUTarget gpu_arch)
    {
        ARM_COMPUTE_UNUSED(broadcast_bias);

        GEMMLHSMatrixInfo lhs_info;
        lhs_info.m0         = 4;
        lhs_info.k0         = 4;
        lhs_info.v0         = v0;
        lhs_info.interleave = true;
        lhs_info.transpose  = true;

        GEMMRHSMatrixInfo rhs_info;
        rhs_info.n0         = 16 / sizeof(T);
        rhs_info.k0         = 1;
        rhs_info.h0         = h0;
        rhs_info.interleave = false;
        rhs_info.transpose  = false;

        // In case of GEMM3D, m is the product between m_w and m_h
        const unsigned int m = m_w * m_h;

        // Set the tensor shapes for LHS and RHS matrices
        const TensorShape lhs_shape(k, m, batch_size);
        const TensorShape rhs_shape(n, k, batch_size);
        const TensorShape bias_shape(n, 1, 1);

        _target    = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, m_h, fp16_mixed_precision, act_info, gpu_arch);
        _reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, m_h, act_info);
    }

protected:
    template <typename U>
    void fill(U &&tensor, int i)
    {
        static_assert(std::is_floating_point<T>::value || std::is_same<T, half>::value, "Only floating point data types supported.");
        using DistributionType = typename std::conditional<std::is_same<T, half>::value, arm_compute::utils::uniform_real_distribution_16bit<T>, std::uniform_real_distribution<T>>::type;

        DistributionType distribution{ T(-1.0f), T(1.0f) };
        library->fill(tensor, distribution, i);
    }

    TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,
                              DataType data_type, float alpha, float beta, unsigned int m_h, bool fp16_mixed_precision, const ActivationLayerInfo &act_info, GPUTarget gpu_arch)
    {
        // Create tensors
        TensorType lhs  = create_tensor<TensorType>(lhs_shape, data_type, 1);
        TensorType rhs  = create_tensor<TensorType>(rhs_shape, data_type, 1);
        TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);
        TensorType lhs_reshaped;
        TensorType rhs_reshaped;
        TensorType dst;

        const unsigned int m = lhs_shape[1];
        const unsigned int n = rhs_shape[0];
        const unsigned int k = lhs_shape[0];
        GEMMReshapeInfo reshape_info(m, n, k, rhs_info.h0, lhs_info.v0, m_h, false, true);

        // The output tensor will be auto-initialized within the function

        // Create and configure function
        ReshapeLHSOperatorType reshape_lhs;
        ReshapeRHSOperatorType reshape_rhs;
        GEMMOperatorType       gemm;
        reshape_lhs.configure(lhs.info(), lhs_reshaped.info(), lhs_info);
        reshape_rhs.configure(rhs.info(), rhs_reshaped.info(), rhs_info);
        gemm.configure(gpu_arch, lhs_reshaped.info(), rhs_reshaped.info(), bias.info(), dst.info(), alpha, beta, true, reshape_info, fp16_mixed_precision, act_info);

        ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());
        ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());
        ARM_COMPUTE_ASSERT(bias.info()->is_resizable());

        // We do not pad when using image as it needs to comply with strict pitch alignment restrictions
        if(!rhs_info.export_to_cl_image)
        {
            add_padding_x({ &lhs, &rhs, &lhs_reshaped, &rhs_reshaped, &bias, &dst });
        }

        // Allocate tensors
        lhs.allocator()->allocate();
        rhs.allocator()->allocate();
        lhs_reshaped.allocator()->allocate();
        rhs_reshaped.allocator()->allocate();
        bias.allocator()->allocate();
        dst.allocator()->allocate();

        ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());
        ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());
        ARM_COMPUTE_ASSERT(!lhs_reshaped.info()->is_resizable());
        ARM_COMPUTE_ASSERT(!rhs_reshaped.info()->is_resizable());
        ARM_COMPUTE_ASSERT(!bias.info()->is_resizable());
        ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());

        // Fill tensors
        fill(AccessorType(lhs), 0);
        fill(AccessorType(rhs), 1);
        fill(AccessorType(bias), 2);

        // Compute GEMM
        ITensorPack reshape_lhs_pack = { { ACL_SRC, &lhs }, { ACL_DST, &lhs_reshaped } };
        reshape_lhs.run(reshape_lhs_pack);
        ITensorPack reshape_rhs_pack = { { ACL_SRC, &rhs }, { ACL_DST, &rhs_reshaped } };
        reshape_rhs.run(reshape_rhs_pack);
        ITensorPack gemm_pack({ { ACL_SRC_0, &lhs_reshaped },
            { ACL_SRC_1, &rhs_reshaped },
            { ACL_SRC_2, &bias },
            { ACL_DST, &dst }
        });
        gemm.run(gemm_pack);

        return dst;
    }

    SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, unsigned int m_h,
                                      const ActivationLayerInfo &act_info)
    {
        TensorShape dst_shape = lhs_shape;
        dst_shape.set(0, rhs_shape[0]);
        dst_shape.set(1, lhs_shape[1] / m_h);
        dst_shape.set(2, m_h);
        dst_shape.set(3, lhs_shape[2]);

        // Create reference
        SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };
        SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };
        SimpleTensor<T> bias{ dst_shape, data_type, 1 };

        const int n          = rhs_shape[0];
        const int m          = lhs_shape[1];
        const int batch_size = lhs_shape[2];

        // Fill reference
        fill(lhs, 0);
        fill(rhs, 1);
        fill(bias, 2);

        // In case of broadcast, we simply need to copy the first row into the following "M" ones
        for(int i = 1; i < m * batch_size; i++)
        {
            memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));
        }

        return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);
    }

    TensorType      _target{};
    SimpleTensor<T> _reference{};
};

template <typename TensorType, typename AccessorType, typename T, typename ReshapeLHSOperatorType, typename ReshapeRHSOperatorType, typename GEMMOperatorType, bool fp_mixed_precision = false>
class GEMMMatrixMultiplyReshapedValidationFixture : public framework::Fixture
{
public:
    template <typename...>
    void setup(unsigned int m, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0, unsigned int v0, unsigned int h0, bool interleave_lhs,
               bool interleave_rhs, bool export_to_cl_image, DataType data_type, float alpha, float beta, bool broadcast_bias, bool lhs_transpose, const ActivationLayerInfo &act_info)
    {
        GEMMLHSMatrixInfo lhs_info;
        lhs_info.m0         = m0;
        lhs_info.k0         = k0;
        lhs_info.v0         = v0;
        lhs_info.interleave = interleave_lhs;
        lhs_info.transpose  = lhs_transpose;

        GEMMRHSMatrixInfo rhs_info;
        rhs_info.n0                 = n0;
        rhs_info.k0                 = k0;
        rhs_info.h0                 = h0;
        rhs_info.interleave         = interleave_rhs;
        rhs_info.transpose          = !lhs_transpose;
        rhs_info.export_to_cl_image = export_to_cl_image;

        // Set the tensor shapes for LHS and RHS matrices
        const TensorShape lhs_shape(k, m, batch_size);
        const TensorShape rhs_shape(n, k, batch_size);
        const TensorShape bias_shape(n,
                                     broadcast_bias ? 1 : m,
                                     broadcast_bias ? 1 : batch_size);

        _target = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, broadcast_bias, act_info);
        if(validate_result)
        {
            _reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, broadcast_bias, act_info);
        }
    }

protected:
    template <typename U>
    void fill(U &&tensor, int i)
    {
        static_assert(std::is_floating_point<T>::value || std::is_same<T, half>::value, "Only floating point data types supported.");
        using DistributionType = typename std::conditional<std::is_same<T, half>::value, arm_compute::utils::uniform_real_distribution_16bit<T>, std::uniform_real_distribution<T>>::type;

        DistributionType distribution{ T(-1.0f), T(1.0f) };
        library->fill(tensor, distribution, i);

        // Fill border with infinity in order to check the presence of NaN values (i.e. inf * 0)
        DistributionType distribution_inf{ T(std::numeric_limits<float>::infinity()), T(std::numeric_limits<float>::infinity()) };
        library->fill_borders_with_garbage(tensor, distribution_inf, i);
    }

    TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,
                              DataType data_type, float alpha, float beta, bool broadcast_bias, const ActivationLayerInfo &act_info)
    {
        // Create tensors
        TensorType lhs  = create_tensor<TensorType>(lhs_shape, data_type, 1);
        TensorType rhs  = create_tensor<TensorType>(rhs_shape, data_type, 1);
        TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);
        TensorType lhs_reshaped;
        TensorType rhs_reshaped;
        TensorType dst;

        const unsigned int M = lhs_shape[1];
        const unsigned int N = rhs_shape[0];
        const unsigned int K = lhs_shape[0];
        GEMMKernelInfo kernel_info;
        kernel_info.m                       = M;
        kernel_info.n                       = N;
        kernel_info.k                       = K;
        kernel_info.depth_output_gemm3d     = 0;
        kernel_info.reinterpret_input_as_3d = false;
        kernel_info.broadcast_bias          = broadcast_bias;
        kernel_info.activation_info         = act_info;
        kernel_info.fp_mixed_precision      = fp_mixed_precision;

        // The output tensor will be auto-initialized within the function

        // Create and configure function
        ReshapeLHSOperatorType reshape_lhs;
        ReshapeRHSOperatorType reshape_rhs;
        GEMMOperatorType       gemm;

        validate_result = bool(reshape_rhs.validate(rhs.info(), rhs_reshaped.info(), rhs_info));
        validate_result = validate_result || !rhs_info.export_to_cl_image;
        if(!validate_result)
        {
            return nullptr;
        }

        reshape_lhs.configure(lhs.info(), lhs_reshaped.info(), lhs_info);
        reshape_rhs.configure(rhs.info(), rhs_reshaped.info(), rhs_info);
        gemm.configure(lhs_reshaped.info(), rhs_reshaped.info(), bias.info(), dst.info(), alpha, beta, lhs_info, rhs_info, kernel_info);

        ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());
        ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());
        ARM_COMPUTE_ASSERT(bias.info()->is_resizable());

        // We do not pad when using image as it needs to comply with strict pitch alignment restrictions
        if(!rhs_info.export_to_cl_image)
        {
            add_padding_x({ &lhs, &rhs, &lhs_reshaped, &rhs_reshaped, &bias, &dst });
        }

        // Allocate tensors
        lhs.allocator()->allocate();
        rhs.allocator()->allocate();
        lhs_reshaped.allocator()->allocate();
        rhs_reshaped.allocator()->allocate();
        bias.allocator()->allocate();
        dst.allocator()->allocate();

        ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());
        ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());
        ARM_COMPUTE_ASSERT(!bias.info()->is_resizable());
        ARM_COMPUTE_ASSERT(!lhs_reshaped.info()->is_resizable());
        ARM_COMPUTE_ASSERT(!rhs_reshaped.info()->is_resizable());
        ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());

        // Fill tensors
        fill(AccessorType(lhs), 0);
        fill(AccessorType(rhs), 1);
        fill(AccessorType(bias), 2);

        // Compute GEMM
        ITensorPack reshape_lhs_pack = { { ACL_SRC, &lhs }, { ACL_DST, &lhs_reshaped } };
        reshape_lhs.run(reshape_lhs_pack);
        ITensorPack reshape_rhs_pack = { { ACL_SRC, &rhs }, { ACL_DST, &rhs_reshaped } };
        reshape_rhs.run(reshape_rhs_pack);
        ITensorPack gemm_pack({ { ACL_SRC_0, &lhs_reshaped },
            { ACL_SRC_1, &rhs_reshaped },
            { ACL_SRC_2, &bias },
            { ACL_DST, &dst }
        });
        gemm.run(gemm_pack);

        return dst;
    }

    SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, bool broadcast_bias,
                                      const ActivationLayerInfo &act_info)
    {
        TensorShape dst_shape = lhs_shape;
        dst_shape[0]          = rhs_shape[0];
        dst_shape[1]          = lhs_shape[1];

        // Create reference
        SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };
        SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };
        SimpleTensor<T> bias{ dst_shape, data_type, 1 };

        const int n          = rhs_shape[0];
        const int m          = lhs_shape[1];
        const int batch_size = lhs_shape[2];

        // Fill reference
        fill(lhs, 0);
        fill(rhs, 1);
        fill(bias, 2);

        if(broadcast_bias)
        {
            // In case of broadcast, we simply need to copy the first row into the following "M" ones
            for(int i = 1; i < m * batch_size; i++)
            {
                memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));
            }
        }

        if(fp_mixed_precision)
        {
            return reference::activation_layer(reference::gemm_mixed_precision<T>(lhs, rhs, bias, alpha, beta), act_info);
        }
        else
        {
            return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);
        }
    }

    bool            validate_result = true;
    TensorType      _target{};
    SimpleTensor<T> _reference{};
};
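
// Note on validate_result (used by the reshaped fixtures above and below): when export_to_cl_image is
// requested but the RHS reshape operator reports it cannot be supported (reshape_rhs.validate() fails),
// the fixture skips both the target run and the reference computation instead of reporting a failure, so
// the same dataset can be reused on devices with and without OpenCL image support.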

/** (EXPERIMENTAL_POST_OPS)*/
template <typename TensorType, typename AccessorType, typename T, typename ReshapeLHSOperatorType, typename ReshapeRHSOperatorType, typename GEMMOperatorType, bool fp_mixed_precision = false>
class GEMMMatrixMultiplyReshapedWithPostOpsValidationFixture : public framework::Fixture
{
public:
    using PostOpArgBroadcast = std::tuple<bool, bool, bool>; // Instructs the fixture whether to broadcast dimension 0, 1, 2 of each post-op argument
public:
    template <typename...>
    void setup(unsigned int m, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0, unsigned int v0, unsigned int h0, bool interleave_lhs,
               bool interleave_rhs, bool export_to_cl_image, DataType data_type, float alpha, float beta, bool broadcast_bias, bool lhs_transpose, const ActivationLayerInfo &act_info,
               const experimental::PostOpList<PostOpArgBroadcast> &post_ops)
    {
        GEMMLHSMatrixInfo lhs_info;
        lhs_info.m0         = m0;
        lhs_info.k0         = k0;
        lhs_info.v0         = v0;
        lhs_info.interleave = interleave_lhs;
        lhs_info.transpose  = lhs_transpose;

        GEMMRHSMatrixInfo rhs_info;
        rhs_info.n0                 = n0;
        rhs_info.k0                 = k0;
        rhs_info.h0                 = h0;
        rhs_info.interleave         = interleave_rhs;
        rhs_info.transpose          = !lhs_transpose;
        rhs_info.export_to_cl_image = export_to_cl_image;

        // Set the tensor shapes for LHS and RHS matrices
        const TensorShape lhs_shape(k, m, batch_size);
        const TensorShape rhs_shape(n, k, batch_size);
        const TensorShape bias_shape(n,
                                     broadcast_bias ? 1 : m,
                                     broadcast_bias ? 1 : batch_size);
        auto post_ops_with_shapes = experimental::transform_post_op_list_arguments<PostOpArgBroadcast, TensorShape>(post_ops,
                                                                                                                    [ = ](auto broadcast)
        {
            return TensorShape
            {
                std::get<0>(broadcast) ? 1 : n,
                std::get<1>(broadcast) ? 1 : m,
                std::get<2>(broadcast) ? 1 : batch_size,
            };
        });

        _target = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, broadcast_bias, act_info, post_ops_with_shapes);
        if(validate_result)
        {
            _reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, broadcast_bias, act_info, post_ops_with_shapes);
        }
    }

protected:
    template <typename U>
    void fill(U &&tensor, int i)
    {
        static_assert(std::is_floating_point<T>::value || std::is_same<T, half>::value, "Only floating point data types supported.");
        using DistributionType = typename std::conditional<std::is_same<T, half>::value, arm_compute::utils::uniform_real_distribution_16bit<T>, std::uniform_real_distribution<T>>::type;

        DistributionType distribution{ T(-1.0f), T(1.0f) };
        library->fill(tensor, distribution, i);

        // Fill border with infinity in order to check the presence of NaN values (i.e. inf * 0)
        DistributionType distribution_inf{ T(std::numeric_limits<float>::infinity()), T(std::numeric_limits<float>::infinity()) };
        library->fill_borders_with_garbage(tensor, distribution_inf, i);
    }

    TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,
                              DataType data_type, float alpha, float beta, bool broadcast_bias, const ActivationLayerInfo &act_info, const experimental::PostOpList<TensorShape> &post_ops)
    {
        // Create tensors
        TensorType lhs  = create_tensor<TensorType>(lhs_shape, data_type, 1);
        TensorType rhs  = create_tensor<TensorType>(rhs_shape, data_type, 1);
        TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);

        // Create post op tensors and populate post op with them
        std::vector<TensorType> post_op_tensors_holder{};
        auto                    populated_post_ops = experimental::transform_post_op_list_arguments<TensorShape, ITensorInfo *>(post_ops,
                                                                                                                                 [&post_op_tensors_holder, &data_type](auto shape)
        {
            auto t = create_tensor<TensorType>(shape, data_type, 1);
            post_op_tensors_holder.push_back(std::move(t));
            return post_op_tensors_holder.back().info();
        });
        TensorType lhs_reshaped;
        TensorType rhs_reshaped;
        TensorType dst;

        const unsigned int M = lhs_shape[1];
        const unsigned int N = rhs_shape[0];
        const unsigned int K = lhs_shape[0];
        GEMMKernelInfo kernel_info;
        kernel_info.m                       = M;
        kernel_info.n                       = N;
        kernel_info.k                       = K;
        kernel_info.depth_output_gemm3d     = 0;
        kernel_info.reinterpret_input_as_3d = false;
        kernel_info.broadcast_bias          = broadcast_bias;
        kernel_info.activation_info         = act_info;
        kernel_info.fp_mixed_precision      = fp_mixed_precision;
        kernel_info.post_ops                = populated_post_ops;

        // The output tensor will be auto-initialized within the function

        // Create and configure function
        ReshapeLHSOperatorType reshape_lhs;
        ReshapeRHSOperatorType reshape_rhs;
        GEMMOperatorType       gemm;

        validate_result = bool(reshape_rhs.validate(rhs.info(), rhs_reshaped.info(), rhs_info));
        validate_result = validate_result || !rhs_info.export_to_cl_image;
        if(!validate_result)
        {
            return nullptr;
        }

        reshape_lhs.configure(lhs.info(), lhs_reshaped.info(), lhs_info);
        reshape_rhs.configure(rhs.info(), rhs_reshaped.info(), rhs_info);
        gemm.configure(lhs_reshaped.info(), rhs_reshaped.info(), bias.info(), dst.info(), alpha, beta, lhs_info, rhs_info, kernel_info);

        ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());
        ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());
        ARM_COMPUTE_ASSERT(bias.info()->is_resizable());
        for(const auto &tensor : post_op_tensors_holder)
        {
            ARM_COMPUTE_ASSERT(tensor.info()->is_resizable());
        }

        // We do not pad when using image as it needs to comply with strict pitch alignment restrictions
        if(!rhs_info.export_to_cl_image)
        {
            add_padding_x({ &lhs, &rhs, &lhs_reshaped, &rhs_reshaped, &bias, &dst });
            for(auto &tensor : post_op_tensors_holder)
            {
                add_padding_x({ &tensor });
            }
        }

        // Allocate tensors
        lhs.allocator()->allocate();
        rhs.allocator()->allocate();
        lhs_reshaped.allocator()->allocate();
        rhs_reshaped.allocator()->allocate();
        bias.allocator()->allocate();
        dst.allocator()->allocate();
        for(auto &tensor : post_op_tensors_holder)
        {
            tensor.allocator()->allocate();
        }

        ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());
        ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());
        ARM_COMPUTE_ASSERT(!bias.info()->is_resizable());
        ARM_COMPUTE_ASSERT(!lhs_reshaped.info()->is_resizable());
        ARM_COMPUTE_ASSERT(!rhs_reshaped.info()->is_resizable());
        ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());
        for(const auto &tensor : post_op_tensors_holder)
        {
            ARM_COMPUTE_ASSERT(!tensor.info()->is_resizable());
        }

        // Fill tensors
        fill(AccessorType(lhs), 0);
        fill(AccessorType(rhs), 1);
        fill(AccessorType(bias), 2);
        for(size_t i = 0; i < post_op_tensors_holder.size(); ++i)
        {
            fill(AccessorType(post_op_tensors_holder.at(i)), 3 + i);
        }

        // Compute GEMM
        ITensorPack reshape_lhs_pack = { { ACL_SRC, &lhs }, { ACL_DST, &lhs_reshaped } };
        reshape_lhs.run(reshape_lhs_pack);
        ITensorPack reshape_rhs_pack = { { ACL_SRC, &rhs }, { ACL_DST, &rhs_reshaped } };
        reshape_rhs.run(reshape_rhs_pack);
        ITensorPack gemm_pack({ { ACL_SRC_0, &lhs_reshaped },
            { ACL_SRC_1, &rhs_reshaped },
            { ACL_SRC_2, &bias },
            { ACL_DST, &dst }
        });
        for(size_t i = 0; i < post_op_tensors_holder.size(); ++i)
        {
            gemm_pack.add_tensor(experimental::get_post_op_arg_type(i), &post_op_tensors_holder.at(i));
        }
        gemm.run(gemm_pack);

        return dst;
    }

    SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, bool broadcast_bias,
                                      const ActivationLayerInfo &act_info, const experimental::PostOpList<TensorShape> &post_ops)
    {
        TensorShape dst_shape = lhs_shape;
        dst_shape[0]          = rhs_shape[0];
        dst_shape[1]          = lhs_shape[1];

        // Create reference
        SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };
        SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };
        SimpleTensor<T> bias{ dst_shape, data_type, 1 };
        // Create post op tensors and populate post op with them
        auto populated_post_ops = experimental::transform_post_op_list_arguments<TensorShape, SimpleTensor<T>>(post_ops, [&data_type](auto shape)
        {
            return SimpleTensor<T> { shape, data_type, 1 };
        });

        const int n          = rhs_shape[0];
        const int m          = lhs_shape[1];
        const int batch_size = lhs_shape[2];

        // Fill reference
        int tensor_idx = 0;
        fill(lhs, tensor_idx++);
        fill(rhs, tensor_idx++);
        fill(bias, tensor_idx++);
        for(auto &op : populated_post_ops.get_list())
        {
            for(auto tensor : op->arguments())
            {
                fill(*tensor, tensor_idx++);
            }
        }

        if(broadcast_bias)
        {
            // In case of broadcast, we simply need to copy the first row into the following "M" ones
            for(int i = 1; i < m * batch_size; i++)
            {
                memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));
            }
        }

        SimpleTensor<T> out;
        if(fp_mixed_precision)
        {
            out = reference::gemm_mixed_precision<T>(lhs, rhs, bias, alpha, beta);
        }
        else
        {
            out = reference::gemm<T>(lhs, rhs, bias, alpha, beta);
        }
        // Ignore activation info if post ops are used instead
        if(populated_post_ops.size() > 0)
        {
            out = reference::post_ops<T>(out, populated_post_ops);
        }
        else
        {
            out = reference::activation_layer(out, act_info);
        }
        return out;
    }

    bool            validate_result = true;
    TensorType      _target{};
    SimpleTensor<T> _reference{};
};
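
// Post-op argument shapes in the fixture above: each PostOpArgBroadcast entry is a (dim0, dim1, dim2) tuple
// of flags, and a true flag collapses that dimension of the extra post-op input to 1 so the input is
// broadcast against the (n, m, batch_size) GEMM output. For example { false, true, true } produces an
// (n, 1, 1) tensor, i.e. one value per output column shared by every row and batch.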
1178
Georgios Pinitas856f66e2021-04-22 21:13:21 +01001179template <typename TensorType, typename AccessorType, typename T, typename ReshapeLHSOperatorType, typename ReshapeRHSOperatorType, typename GEMMOperatorType, bool fp_mixed_precision = false>
Gian Marco Iodice9382ab32018-12-17 15:12:07 +00001180class GEMMMatrixMultiplyReshaped3DValidationFixture : public framework::Fixture
1181{
1182public:
1183 template <typename...>
1184 void setup(unsigned int m_w, unsigned int m_h, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0, unsigned int v0, unsigned int h0,
1185 bool interleave_lhs, bool interleave_rhs, bool export_to_cl_image, DataType data_type, float alpha, float beta, bool lhs_transpose, const ActivationLayerInfo &act_info)
1186 {
1187 GEMMLHSMatrixInfo lhs_info;
1188 lhs_info.m0 = m0;
1189 lhs_info.k0 = k0;
1190 lhs_info.v0 = v0;
1191 lhs_info.interleave = interleave_lhs;
1192 lhs_info.transpose = lhs_transpose;
1193
1194 GEMMRHSMatrixInfo rhs_info;
1195 rhs_info.n0 = n0;
1196 rhs_info.k0 = k0;
1197 rhs_info.h0 = h0;
1198 rhs_info.interleave = interleave_rhs;
1199 rhs_info.transpose = !lhs_transpose;
1200 rhs_info.export_to_cl_image = export_to_cl_image;
1201
1202 // In case of GEMM3D, m is the product between m_w and m_h
1203 const unsigned int m = m_w * m_h;
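        // For illustration: m_w = 4 and m_h = 3 give m = 12, i.e. a 12-row LHS whose output is later
        // compared against a (n, 4, 3, batch_size) reference (see compute_reference below).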
1204
1205 // Set the tensor shapes for LHS and RHS matrices
1206 const TensorShape lhs_shape(k, m, batch_size);
1207 const TensorShape rhs_shape(n, k, batch_size);
1208 const TensorShape bias_shape(n, 1, 1);
1209
1210 _target = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, m_h, act_info);
1211 if(validate_result)
1212 {
1213 _reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, m_h, act_info);
1214 }
1215 }
1216
1217protected:
1218 template <typename U>
1219 void fill(U &&tensor, int i)
1220 {
1221 static_assert(std::is_floating_point<T>::value || std::is_same<T, half>::value, "Only floating point data types supported.");
1222 using DistributionType = typename std::conditional<std::is_same<T, half>::value, arm_compute::utils::uniform_real_distribution_16bit<T>, std::uniform_real_distribution<T>>::type;
1223
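        // std::uniform_real_distribution is only defined for standard floating point types, so for half we
        // rely on the library's 16-bit uniform real distribution wrapper instead.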
1224 DistributionType distribution{ T(-1.0f), T(1.0f) };
1225 library->fill(tensor, distribution, i);
1226 }
1227
1228 TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,
1229 DataType data_type, float alpha, float beta, unsigned int m_h, const ActivationLayerInfo &act_info)
1230 {
1231 // Create tensors
1232 TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);
1233 TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);
1234 TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);
1235 TensorType lhs_reshaped;
1236 TensorType rhs_reshaped;
1237 TensorType dst;
1238
1239 const unsigned int M = lhs_shape[1];
1240 const unsigned int N = rhs_shape[0];
1241 const unsigned int K = lhs_shape[0];
1242 GEMMKernelInfo kernel_info;
1243 kernel_info.m = M;
1244 kernel_info.n = N;
1245 kernel_info.k = K;
1246 kernel_info.depth_output_gemm3d = m_h;
1247 kernel_info.reinterpret_input_as_3d = false;
1248 kernel_info.broadcast_bias = true;
1249 kernel_info.activation_info = act_info;
1250 kernel_info.fp_mixed_precision = fp_mixed_precision;
1251
1252 // The output tensor will be auto-initialized within the function
1253
1254 // Create and configure function
1255 ReshapeLHSOperatorType reshape_lhs;
1256 ReshapeRHSOperatorType reshape_rhs;
1257 GEMMOperatorType gemm;
1258
1259 validate_result = bool(reshape_rhs.validate(rhs.info(), rhs_reshaped.info(), rhs_info));
1260 validate_result = validate_result || !rhs_info.export_to_cl_image;
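        // If the RHS reshape does not validate (typically because export_to_cl_image was requested but is not
        // supported on the target), return early without configuring anything; since validate_result is false,
        // no reference is computed in setup(), presumably so the calling test treats this configuration as
        // unsupported rather than as a failure.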
1261 if(!validate_result)
1262 {
1263 return nullptr;
1264 }
1265
1266 reshape_lhs.configure(lhs.info(), lhs_reshaped.info(), lhs_info);
1267 reshape_rhs.configure(rhs.info(), rhs_reshaped.info(), rhs_info);
1268 gemm.configure(lhs_reshaped.info(), rhs_reshaped.info(), bias.info(), dst.info(), alpha, beta, lhs_info, rhs_info, kernel_info);
1269
1270 ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());
1271 ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());
1272 ARM_COMPUTE_ASSERT(bias.info()->is_resizable());
1273
1274 // We do not pad when exporting to cl_image, as the tensor needs to comply with strict pitch alignment restrictions
1275 if(!rhs_info.export_to_cl_image)
1276 {
1277 add_padding_x({ &lhs, &rhs, &lhs_reshaped, &rhs_reshaped, &bias, &dst });
1278 }
1279
1280 // Allocate tensors
1281 lhs.allocator()->allocate();
1282 rhs.allocator()->allocate();
1283 lhs_reshaped.allocator()->allocate();
1284 rhs_reshaped.allocator()->allocate();
1285 bias.allocator()->allocate();
1286 dst.allocator()->allocate();
1287
1288 ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());
1289 ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());
1290 ARM_COMPUTE_ASSERT(!lhs_reshaped.info()->is_resizable());
1291 ARM_COMPUTE_ASSERT(!rhs_reshaped.info()->is_resizable());
1292 ARM_COMPUTE_ASSERT(!bias.info()->is_resizable());
1293 ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());
1294
1295 // Fill tensors
1296 fill(AccessorType(lhs), 0);
1297 fill(AccessorType(rhs), 1);
1298 fill(AccessorType(bias), 2);
1299
1300 // Compute GEMM
1301 ITensorPack reshape_lhs_pack = { { ACL_SRC, &lhs }, { ACL_DST, &lhs_reshaped } };
1302 reshape_lhs.run(reshape_lhs_pack);
1303 ITensorPack reshape_rhs_pack = { { ACL_SRC, &rhs }, { ACL_DST, &rhs_reshaped } };
1304 reshape_rhs.run(reshape_rhs_pack);
1305 ITensorPack gemm_pack({ { ACL_SRC_0, &lhs_reshaped },
1306 { ACL_SRC_1, &rhs_reshaped },
1307 { ACL_SRC_2, &bias },
1308 { ACL_DST, &dst }
1309 });
1310 gemm.run(gemm_pack);
1311
1312 return dst;
1313 }
1314
1315 SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, unsigned int m_h,
1316 const ActivationLayerInfo &act_info)
1317 {
1318 TensorShape dst_shape = lhs_shape;
1319 dst_shape.set(0, rhs_shape[0]);
1320 dst_shape.set(1, lhs_shape[1] / m_h);
1321 dst_shape.set(2, m_h);
1322 dst_shape.set(3, lhs_shape[2]);
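        // lhs_shape[1] holds m = m_w * m_h, so dividing by m_h recovers m_w for dimension 1 of the 3D-reinterpreted output.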
1323
1324 // Create reference
1325 SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };
1326 SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };
1327 SimpleTensor<T> bias{ dst_shape, data_type, 1 };
1328
1329 const int n = rhs_shape[0];
1330 const int m = lhs_shape[1];
1331 const int batch_size = lhs_shape[2];
1332
1333 // Fill reference
1334 fill(lhs, 0);
1335 fill(rhs, 1);
1336 fill(bias, 2);
1337
1338 // In case of broadcast, we simply need to copy the first row into the following "M" ones
1339 for(int i = 1; i < m * batch_size; i++)
1340 {
1341 memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));
1342 }
1343
1344 if(fp_mixed_precision)
1345 {
1346 return reference::activation_layer(reference::gemm_mixed_precision<T>(lhs, rhs, bias, alpha, beta), act_info);
1347 }
1348 else
1349 {
1350 return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);
1351 }
1352 }
1353
1354 bool validate_result = true;
1355 TensorType _target{};
1356 SimpleTensor<T> _reference{};
1357};
1358
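/** Fixture for GEMM where only the RHS matrix is reshaped (and optionally exported to a cl_image), while the LHS is consumed as-is. */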
1359template <typename TensorType, typename AccessorType, typename T, typename ReshapeRHSOperatorType, typename GEMMOperatorType>
1360class GEMMMatrixMultiplyReshapedOnlyRHSValidationFixture : public framework::Fixture
1361{
1362public:
1363 template <typename...>
1364 void setup(unsigned int m, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0, unsigned int h0,
1365 bool interleave_rhs, bool transpose_rhs, bool export_to_cl_image, DataType data_type, float alpha, float beta, bool broadcast_bias, const ActivationLayerInfo &act_info)
1366 {
1367 GEMMLHSMatrixInfo lhs_info;
1368 lhs_info.m0 = m0;
1369 lhs_info.k0 = k0;
1370
1371 GEMMRHSMatrixInfo rhs_info;
1372 rhs_info.n0 = n0;
1373 rhs_info.k0 = k0;
1374 rhs_info.h0 = h0;
1375 rhs_info.interleave = interleave_rhs;
1376 rhs_info.transpose = transpose_rhs;
1377 rhs_info.export_to_cl_image = export_to_cl_image;
1378
1379 // Set the tensor shapes for LHS and RHS matrices
1380 const TensorShape lhs_shape(k, m, batch_size);
1381 const TensorShape rhs_shape(n, k, batch_size);
1382 const TensorShape bias_shape(n,
1383 broadcast_bias ? 1 : m,
1384 broadcast_bias ? 1 : batch_size);
1385
1386 _target = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, broadcast_bias, act_info);
1387 if(validate_result)
1388 {
1389 _reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, broadcast_bias, act_info);
1390 }
1391 }
1392
1393protected:
1394 template <typename U>
1395 void fill(U &&tensor, int i)
1396 {
1397 static_assert(std::is_floating_point<T>::value || std::is_same<T, half>::value, "Only floating point data types supported.");
1398 using DistributionType = typename std::conditional<std::is_same<T, half>::value, arm_compute::utils::uniform_real_distribution_16bit<T>, std::uniform_real_distribution<T>>::type;
1399
1400 DistributionType distribution{ T(-1.0f), T(1.0f) };
1401 library->fill(tensor, distribution, i);
1402
1403 // Fill border with infinity in order to check the presence of NaN values (i.e. inf * 0)
1404 DistributionType distribution_inf{ T(std::numeric_limits<float>::infinity()), T(std::numeric_limits<float>::infinity()) };
1405 library->fill_borders_with_garbage(tensor, distribution_inf, i);
1406 }
1407
1408 TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,
1409 DataType data_type, float alpha, float beta, bool broadcast_bias, const ActivationLayerInfo &act_info)
1410 {
1411 // Create tensors
1412 TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);
1413 TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);
1414 TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);
1415 TensorType rhs_reshaped;
1416 TensorType dst;
1417
1418 const unsigned int M = lhs_shape[1];
1419 const unsigned int N = rhs_shape[0];
1420 const unsigned int K = lhs_shape[0];
1421 GEMMKernelInfo kernel_info;
1422 kernel_info.m = M;
1423 kernel_info.n = N;
1424 kernel_info.k = K;
1425 kernel_info.depth_output_gemm3d = 0;
1426 kernel_info.reinterpret_input_as_3d = false;
1427 kernel_info.broadcast_bias = broadcast_bias;
1428 kernel_info.activation_info = act_info;
1429
1430 // The output tensor will be auto-initialized within the function
1431
1432 // Create and configure function
1433 ReshapeRHSOperatorType reshape_rhs;
1434 GEMMOperatorType gemm;
1435
1436 validate_result = bool(reshape_rhs.validate(rhs.info(), rhs_reshaped.info(), rhs_info));
1437 validate_result = validate_result || !rhs_info.export_to_cl_image;
1438 if(!validate_result)
1439 {
1440 return nullptr;
1441 }
1442
1443 reshape_rhs.configure(rhs.info(), rhs_reshaped.info(), rhs_info);
1444 gemm.configure(lhs.info(), rhs_reshaped.info(), bias.info(), dst.info(), alpha, beta, lhs_info, rhs_info, kernel_info);
1445
1446 ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());
1447 ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());
1448 ARM_COMPUTE_ASSERT(bias.info()->is_resizable());
1449
1450 // We do not pad when exporting to cl_image, as the tensor needs to comply with strict pitch alignment restrictions
1451 if(!rhs_info.export_to_cl_image)
1452 {
1453 add_padding_x({ &lhs, &rhs, &rhs_reshaped, &bias, &dst });
1454 }
1455
1456 // Allocate tensors
1457 lhs.allocator()->allocate();
1458 rhs.allocator()->allocate();
1459 rhs_reshaped.allocator()->allocate();
1460 bias.allocator()->allocate();
1461 dst.allocator()->allocate();
1462
1463 ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());
1464 ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());
1465 ARM_COMPUTE_ASSERT(!rhs_reshaped.info()->is_resizable());
1466 ARM_COMPUTE_ASSERT(!bias.info()->is_resizable());
1467 ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());
1468
1469 // Fill tensors
1470 fill(AccessorType(lhs), 0);
1471 fill(AccessorType(rhs), 1);
1472 fill(AccessorType(bias), 2);
1473
1474 // Compute GEMM
1475 ITensorPack reshape_rhs_pack = { { ACL_SRC, &rhs }, { ACL_DST, &rhs_reshaped } };
1476 reshape_rhs.run(reshape_rhs_pack);
1477 ITensorPack gemm_pack({ { ACL_SRC_0, &lhs },
1478 { ACL_SRC_1, &rhs_reshaped },
1479 { ACL_SRC_2, &bias },
1480 { ACL_DST, &dst }
1481 });
1482 gemm.run(gemm_pack);
1483
1484 return dst;
1485 }
1486
1487 SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, bool broadcast_bias,
1488 const ActivationLayerInfo &act_info)
1489 {
1490 TensorShape dst_shape = lhs_shape;
1491 dst_shape[0] = rhs_shape[0];
1492 dst_shape[1] = lhs_shape[1];
1493
1494 // Create reference
1495 SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };
1496 SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };
1497 SimpleTensor<T> bias{ dst_shape, data_type, 1 };
1498
1499 const int n = rhs_shape[0];
1500 const int m = lhs_shape[1];
1501 const int batch_size = lhs_shape[2];
1502
1503 // Fill reference
1504 fill(lhs, 0);
1505 fill(rhs, 1);
1506 fill(bias, 2);
1507
1508 if(broadcast_bias)
1509 {
1510 // In case of broadcast, we simply need to copy the first row into the following "M" ones
1511 for(int i = 1; i < m * batch_size; i++)
1512 {
1513 memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));
1514 }
1515 }
1516
1517 return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);
1518 }
1519
1520 bool validate_result = true;
1521 TensorType _target{};
1522 SimpleTensor<T> _reference{};
1523};
1524
1525/** Fixture for GEMM with only the RHS reshaped and a fused post op list (EXPERIMENTAL_POST_OPS) */
1526template <typename TensorType, typename AccessorType, typename T, typename ReshapeRHSOperatorType, typename GEMMOperatorType>
1527class GEMMMatrixMultiplyReshapedOnlyRHSWithPostOpsValidationFixture : public framework::Fixture
1528{
1529public:
1530 using PostOpArgBroadcast = std::tuple<bool, bool, bool>; // Instructs the fixture whether broadcasting is needed in dimensions 0, 1 and 2 of each PostOp argument
1531 template <typename...>
1532 void setup(unsigned int m, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0, unsigned int h0,
1533 bool interleave_rhs, bool transpose_rhs, bool export_to_cl_image, DataType data_type, float alpha, float beta, bool broadcast_bias, const ActivationLayerInfo &act_info,
1534 const experimental::PostOpList<PostOpArgBroadcast> &post_ops)
1535 {
1536 GEMMLHSMatrixInfo lhs_info;
1537 lhs_info.m0 = m0;
1538 lhs_info.k0 = k0;
1539
1540 GEMMRHSMatrixInfo rhs_info;
1541 rhs_info.n0 = n0;
1542 rhs_info.k0 = k0;
1543 rhs_info.h0 = h0;
1544 rhs_info.interleave = interleave_rhs;
1545 rhs_info.transpose = transpose_rhs;
1546 rhs_info.export_to_cl_image = export_to_cl_image;
1547
1548 // Set the tensor shapes for LHS and RHS matrices
1549 const TensorShape lhs_shape(k, m, batch_size);
1550 const TensorShape rhs_shape(n, k, batch_size);
1551 const TensorShape bias_shape(n,
1552 broadcast_bias ? 1 : m,
1553 broadcast_bias ? 1 : batch_size);
1554 auto post_ops_with_shapes = experimental::transform_post_op_list_arguments<PostOpArgBroadcast, TensorShape>(post_ops,
1555 [ = ](auto broadcast)
1556 {
1557 return TensorShape
1558 {
1559 std::get<0>(broadcast) ? 1 : n,
1560 std::get<1>(broadcast) ? 1 : m,
1561 std::get<2>(broadcast) ? 1 : batch_size,
1562 };
1563 });
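        // For illustration: broadcast flags (false, true, true) describe a per-row post op argument of shape
        // (n, 1, 1), while (false, false, false) describes a full (n, m, batch_size) tensor.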
1564
1565 _target = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, broadcast_bias, act_info, post_ops_with_shapes);
1566 if(validate_result)
1567 {
1568 _reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, broadcast_bias, act_info, post_ops_with_shapes);
1569 }
1570 }
1571
1572protected:
1573 template <typename U>
1574 void fill(U &&tensor, int i)
1575 {
1576 static_assert(std::is_floating_point<T>::value || std::is_same<T, half>::value, "Only floating point data types supported.");
1577 using DistributionType = typename std::conditional<std::is_same<T, half>::value, arm_compute::utils::uniform_real_distribution_16bit<T>, std::uniform_real_distribution<T>>::type;
1578
1579 DistributionType distribution{ T(-1.0f), T(1.0f) };
1580 library->fill(tensor, distribution, i);
1581
1582 // Fill border with infinity in order to check the presence of NaN values (i.e. inf * 0)
1583 DistributionType distribution_inf{ T(std::numeric_limits<float>::infinity()), T(std::numeric_limits<float>::infinity()) };
1584 library->fill_borders_with_garbage(tensor, distribution_inf, i);
1585 }
1586
1587 TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,
1588 DataType data_type, float alpha, float beta, bool broadcast_bias, const ActivationLayerInfo &act_info, const experimental::PostOpList<TensorShape> &post_ops)
1589 {
1590 // Create tensors
1591 TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);
1592 TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);
1593 TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);
1594 TensorType rhs_reshaped;
1595 TensorType dst;
1596 // Create post op tensors and populate post op with them
1597 std::vector<TensorType> post_op_tensors_holder{};
1598 auto populated_post_ops = experimental::transform_post_op_list_arguments<TensorShape, ITensorInfo *>(post_ops,
1599 [&post_op_tensors_holder, &data_type](auto shape)
1600 {
1601 auto t = create_tensor<TensorType>(shape, data_type, 1);
1602 post_op_tensors_holder.push_back(std::move(t));
1603 return post_op_tensors_holder.back().info();
1604 });
1605
1606 const unsigned int M = lhs_shape[1];
1607 const unsigned int N = rhs_shape[0];
1608 const unsigned int K = lhs_shape[0];
1609 GEMMKernelInfo kernel_info;
1610 kernel_info.m = M;
1611 kernel_info.n = N;
1612 kernel_info.k = K;
1613 kernel_info.depth_output_gemm3d = 0;
1614 kernel_info.reinterpret_input_as_3d = false;
1615 kernel_info.broadcast_bias = broadcast_bias;
1616 kernel_info.activation_info = act_info;
1617 kernel_info.post_ops = populated_post_ops;
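        // Only the post op argument infos travel to the kernel through GEMMKernelInfo::post_ops; the tensors
        // themselves are bound at run time through the ITensorPack (see gemm_pack below).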
1618
1619 // The output tensor will be auto-initialized within the function
1620
1621 // Create and configure function
1622 ReshapeRHSOperatorType reshape_rhs;
1623 GEMMOperatorType gemm;
1624
1625 validate_result = bool(reshape_rhs.validate(rhs.info(), rhs_reshaped.info(), rhs_info));
1626 validate_result = validate_result || !rhs_info.export_to_cl_image;
1627 if(!validate_result)
1628 {
1629 return nullptr;
1630 }
1631
1632 reshape_rhs.configure(rhs.info(), rhs_reshaped.info(), rhs_info);
1633 gemm.configure(lhs.info(), rhs_reshaped.info(), bias.info(), dst.info(), alpha, beta, lhs_info, rhs_info, kernel_info);
1634
1635 ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());
1636 ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());
1637 ARM_COMPUTE_ASSERT(bias.info()->is_resizable());
1638 for(const auto &tensor : post_op_tensors_holder)
1639 {
1640 ARM_COMPUTE_ASSERT(tensor.info()->is_resizable());
1641 }
1642
1643 // We do not pad when exporting to cl_image, as the tensor needs to comply with strict pitch alignment restrictions
1644 if(!rhs_info.export_to_cl_image)
1645 {
1646 add_padding_x({ &lhs, &rhs, &rhs_reshaped, &bias, &dst });
1647 for(auto &tensor : post_op_tensors_holder)
1648 {
1649 add_padding_x({ &tensor });
1650 }
1651 }
1652
1653 // Allocate tensors
1654 lhs.allocator()->allocate();
1655 rhs.allocator()->allocate();
1656 rhs_reshaped.allocator()->allocate();
1657 bias.allocator()->allocate();
1658 dst.allocator()->allocate();
1659 for(auto &tensor : post_op_tensors_holder)
1660 {
1661 tensor.allocator()->allocate();
1662 }
1663
1664 ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());
1665 ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());
1666 ARM_COMPUTE_ASSERT(!rhs_reshaped.info()->is_resizable());
1667 ARM_COMPUTE_ASSERT(!bias.info()->is_resizable());
1668 ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());
1669 for(const auto &tensor : post_op_tensors_holder)
1670 {
1671 ARM_COMPUTE_ASSERT(!tensor.info()->is_resizable());
1672 }
1673
1674 // Fill tensors
1675 fill(AccessorType(lhs), 0);
1676 fill(AccessorType(rhs), 1);
1677 fill(AccessorType(bias), 2);
1678 for(size_t i = 0; i < post_op_tensors_holder.size(); ++i)
1679 {
1680 fill(AccessorType(post_op_tensors_holder.at(i)), 3 + i);
1681 }
1682
1683 // Compute GEMM
1684 ITensorPack reshape_rhs_pack = { { ACL_SRC, &rhs }, { ACL_DST, &rhs_reshaped } };
1685 reshape_rhs.run(reshape_rhs_pack);
1686 ITensorPack gemm_pack({ { ACL_SRC_0, &lhs },
1687 { ACL_SRC_1, &rhs_reshaped },
1688 { ACL_SRC_2, &bias },
1689 { ACL_DST, &dst }
1690 });
1691 for(size_t i = 0; i < post_op_tensors_holder.size(); ++i)
1692 {
1693 gemm_pack.add_tensor(experimental::get_post_op_arg_type(i), &post_op_tensors_holder.at(i));
1694 }
1695 gemm.run(gemm_pack);
1696
1697 return dst;
1698 }
1699
1700 SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, bool broadcast_bias,
1701 const ActivationLayerInfo &act_info, const experimental::PostOpList<TensorShape> &post_ops)
1702 {
1703 TensorShape dst_shape = lhs_shape;
1704 dst_shape[0] = rhs_shape[0];
1705 dst_shape[1] = lhs_shape[1];
1706
1707 // Create reference
1708 SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };
1709 SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };
1710 SimpleTensor<T> bias{ dst_shape, data_type, 1 };
1711 // Create post op tensors and populate post op with them
1712 auto populated_post_ops = experimental::transform_post_op_list_arguments<TensorShape, SimpleTensor<T>>(post_ops, [&data_type](auto shape)
1713 {
1714 return SimpleTensor<T> { shape, data_type, 1 };
1715 });
1716
1717 const int n = rhs_shape[0];
1718 const int m = lhs_shape[1];
1719 const int batch_size = lhs_shape[2];
1720
1721 // Fill reference
1722 int tensor_idx = 0;
1723 fill(lhs, tensor_idx++);
1724 fill(rhs, tensor_idx++);
1725 fill(bias, tensor_idx++);
1726 for(auto &op : populated_post_ops.get_list())
1727 {
1728 for(auto tensor : op->arguments())
1729 {
1730 fill(*tensor, tensor_idx++);
1731 }
1732 }
1733
1734 if(broadcast_bias)
1735 {
1736 // In case of broadcast, we simply need to copy the first row into the following "M" ones
1737 for(int i = 1; i < m * batch_size; i++)
1738 {
1739 memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));
1740 }
1741 }
1742
1743 SimpleTensor<T> out;
1744 out = reference::gemm<T>(lhs, rhs, bias, alpha, beta);
1745 // Ignore activation info if post ops are used instead
1746 if(populated_post_ops.size() > 0)
1747 {
1748 out = reference::post_ops<T>(out, populated_post_ops);
1749 }
1750 else
1751 {
1752 out = reference::activation_layer(out, act_info);
1753 }
1754 return out;
1755 }
1756
1757 bool validate_result = true;
1758 TensorType _target{};
1759 SimpleTensor<T> _reference{};
1760};
1761
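/** Fixture for GEMM with only the RHS reshaped, the output reinterpreted as a 3D tensor (GEMM3D), and optional coverage of the has_pad_y path. */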
1762template <typename TensorType, typename AccessorType, typename T, typename ReshapeRHSOperatorType, typename GEMMOperatorType>
1763class GEMMMatrixMultiplyReshapedOnlyRHS3DValidationFixture : public framework::Fixture
1764{
1765public:
1766 template <typename...>
1767 void setup(unsigned int m_w, unsigned int m_h, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0, unsigned int h0,
1768 bool interleave_rhs, bool transpose_rhs, bool export_to_cl_image, bool has_pad_y, DataType data_type, float alpha, float beta, const ActivationLayerInfo &act_info)
1769 {
1770 GEMMLHSMatrixInfo lhs_info;
1771 lhs_info.m0 = m0;
1772 lhs_info.k0 = k0;
1773
1774 GEMMRHSMatrixInfo rhs_info;
1775 rhs_info.n0 = n0;
1776 rhs_info.k0 = k0;
1777 rhs_info.h0 = h0;
1778 rhs_info.interleave = interleave_rhs;
1779 rhs_info.transpose = transpose_rhs;
1780 rhs_info.export_to_cl_image = export_to_cl_image;
1781
1782 // In case of GEMM3D, m is the product between m_w and m_h
1783 const unsigned int m = m_w * m_h;
1784
1785 // Set the tensor shapes for LHS and RHS matrices
1786 const TensorShape lhs_shape(k, m, batch_size);
1787 const TensorShape rhs_shape(n, k, batch_size);
1788 const TensorShape bias_shape(n, 1, 1);
1789
1790 _target = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, m_h, act_info, has_pad_y);
1791 if(validate_result)
1792 {
1793 _reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, m_h, act_info);
1794 }
1795 }
1796
1797protected:
1798 template <typename U>
1799 void fill(U &&tensor, int i)
1800 {
1801 static_assert(std::is_floating_point<T>::value || std::is_same<T, half>::value, "Only floating point data types supported.");
1802 using DistributionType = typename std::conditional<std::is_same<T, half>::value, arm_compute::utils::uniform_real_distribution_16bit<T>, std::uniform_real_distribution<T>>::type;
1803
1804 DistributionType distribution{ T(-1.0f), T(1.0f) };
1805 library->fill(tensor, distribution, i);
1806 }
1807
1808 TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,
1809 DataType data_type, float alpha, float beta,
1810 unsigned int m_h, const ActivationLayerInfo &act_info, bool has_pad_y)
1811 {
1812 // Create tensors
1813 TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);
1814 TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);
1815 TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);
1816 TensorType rhs_reshaped;
1817 TensorType dst;
1818
1819 const unsigned int M = lhs_shape[1];
1820 const unsigned int N = rhs_shape[0];
1821 const unsigned int K = lhs_shape[0];
1822 GEMMKernelInfo kernel_info;
1823 kernel_info.m = M;
1824 kernel_info.n = N;
1825 kernel_info.k = K;
1826 kernel_info.depth_output_gemm3d = m_h;
1827 kernel_info.reinterpret_input_as_3d = false;
1828 kernel_info.broadcast_bias = true;
1829 kernel_info.activation_info = act_info;
1830 kernel_info.has_pad_y = has_pad_y;
1831
1832 // The output tensor will be auto-initialized within the function
1833 // Create and configure function
1834 ReshapeRHSOperatorType reshape_rhs;
1835 GEMMOperatorType gemm;
1836
1837 validate_result = bool(reshape_rhs.validate(rhs.info(), rhs_reshaped.info(), rhs_info));
1838 validate_result = validate_result || !rhs_info.export_to_cl_image;
1839 if(!validate_result)
1840 {
1841 return nullptr;
1842 }
1843
1844 reshape_rhs.configure(rhs.info(), rhs_reshaped.info(), rhs_info);
1845 gemm.configure(lhs.info(), rhs_reshaped.info(), bias.info(), dst.info(), alpha, beta, lhs_info, rhs_info, kernel_info);
1846
1847 if(has_pad_y)
1848 {
1849 // Add dummy padding into lhs to validate has_pad_y path
1850 lhs.info()->extend_padding(PaddingSize(2, 0, 2, 0));
1851 dst.info()->extend_padding(PaddingSize(2, 0, 1, 0));
1852 }
1853
1854 ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());
1855 ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());
1856 ARM_COMPUTE_ASSERT(bias.info()->is_resizable());
1857
1858 // We do not pad when exporting to cl_image, as the tensor needs to comply with strict pitch alignment restrictions
1859 if(!rhs_info.export_to_cl_image)
1860 {
1861 add_padding_x({ &lhs, &rhs, &rhs_reshaped, &bias, &dst });
1862 }
1863
1864 // Allocate tensors
1865 lhs.allocator()->allocate();
1866 rhs.allocator()->allocate();
1867 rhs_reshaped.allocator()->allocate();
1868 bias.allocator()->allocate();
1869 dst.allocator()->allocate();
1870
1871 ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());
1872 ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());
1873 ARM_COMPUTE_ASSERT(!rhs_reshaped.info()->is_resizable());
1874 ARM_COMPUTE_ASSERT(!bias.info()->is_resizable());
1875 ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());
1876
1877 // Fill tensors
1878 fill(AccessorType(lhs), 0);
1879 fill(AccessorType(rhs), 1);
1880 fill(AccessorType(bias), 2);
1881
1882 // Compute GEMM
1883 ITensorPack reshape_rhs_pack = { { ACL_SRC, &rhs }, { ACL_DST, &rhs_reshaped } };
1884 reshape_rhs.run(reshape_rhs_pack);
1885 ITensorPack gemm_pack({ { ACL_SRC_0, &lhs },
1886 { ACL_SRC_1, &rhs_reshaped },
1887 { ACL_SRC_2, &bias },
1888 { ACL_DST, &dst }
1889 });
1890 gemm.run(gemm_pack);
1891
1892 return dst;
1893 }
1894
1895 SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, unsigned int m_h,
1896 const ActivationLayerInfo &act_info)
1897 {
1898 TensorShape dst_shape = lhs_shape;
1899 dst_shape.set(0, rhs_shape[0]);
1900 dst_shape.set(1, lhs_shape[1] / m_h);
1901 dst_shape.set(2, m_h);
1902 dst_shape.set(3, lhs_shape[2]);
1903
1904 // Create reference
1905 SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };
1906 SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };
1907 SimpleTensor<T> bias{ dst_shape, data_type, 1 };
1908
1909 const int n = rhs_shape[0];
1910 const int m = lhs_shape[1];
1911 const int batch_size = lhs_shape[2];
1912
1913 // Fill reference
1914 fill(lhs, 0);
1915 fill(rhs, 1);
1916 fill(bias, 2);
1917
1918 // In case of broadcast, we simply need to copy the first row into the following "M" ones
1919 for(int i = 1; i < m * batch_size; i++)
1920 {
1921 memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));
1922 }
1923
1924 return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);
1925 }
1926
1927 bool validate_result = true;
1928 TensorType _target{};
1929 SimpleTensor<T> _reference{};
1930};
1931
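/** Fixture for the native GEMM kernel: LHS and RHS are consumed directly, without any reshape pass. */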
1932template <typename TensorType, typename AccessorType, typename T, typename GEMMOperatorType>
1933class GEMMMatrixMultiplyNativeValidationFixture : public framework::Fixture
1934{
1935public:
1936 template <typename...>
1937 void setup(unsigned int m, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0, DataType data_type, float alpha, float beta, bool broadcast_bias,
1938 const ActivationLayerInfo &act_info)
1939 {
1940 GEMMLHSMatrixInfo lhs_info;
1941 lhs_info.m0 = m0;
1942 lhs_info.k0 = k0;
1943
1944 GEMMRHSMatrixInfo rhs_info;
1945 rhs_info.n0 = n0;
1946 rhs_info.k0 = k0;
1947
1948 // Set the tensor shapes for LHS and RHS matrices
1949 const TensorShape lhs_shape(k, m, batch_size);
1950 const TensorShape rhs_shape(n, k, batch_size);
1951 const TensorShape bias_shape(n,
1952 broadcast_bias ? 1 : m,
1953 broadcast_bias ? 1 : batch_size);
1954
1955 _target = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, broadcast_bias, act_info);
1956 _reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, broadcast_bias, act_info);
1957 }
1958
1959protected:
1960 template <typename U>
1961 void fill(U &&tensor, int i)
1962 {
1963 static_assert(std::is_floating_point<T>::value || std::is_same<T, half>::value, "Only floating point data types supported.");
1964 using DistributionType = typename std::conditional<std::is_same<T, half>::value, arm_compute::utils::uniform_real_distribution_16bit<T>, std::uniform_real_distribution<T>>::type;
1965
1966 DistributionType distribution{ T(-1.0f), T(1.0f) };
1967 library->fill(tensor, distribution, i);
1968
1969 // Fill border with infinity in order to check the presence of NaN values (i.e. inf * 0)
1970 DistributionType distribution_inf{ T(std::numeric_limits<float>::infinity()), T(std::numeric_limits<float>::infinity()) };
1971 library->fill_borders_with_garbage(tensor, distribution_inf, i);
1972 }
1973
1974 TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,
1975 DataType data_type, float alpha, float beta, bool broadcast_bias, const ActivationLayerInfo &act_info)
1976 {
1977 // Create tensors
1978 TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);
1979 TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);
1980 TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);
1981 TensorType dst;
1982
1983 const unsigned int M = lhs_shape[1];
1984 const unsigned int N = rhs_shape[0];
1985 const unsigned int K = lhs_shape[0];
1986 GEMMKernelInfo kernel_info;
1987 kernel_info.m = M;
1988 kernel_info.n = N;
1989 kernel_info.k = K;
1990 kernel_info.depth_output_gemm3d = 0;
1991 kernel_info.reinterpret_input_as_3d = false;
1992 kernel_info.broadcast_bias = broadcast_bias;
1993 kernel_info.activation_info = act_info;
1994
1995 // Create and configure function
1996 GEMMOperatorType gemm;
1997 gemm.configure(lhs.info(), rhs.info(), bias.info(), dst.info(), alpha, beta, lhs_info, rhs_info, kernel_info);
1998
1999 ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());
2000 ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());
2001 ARM_COMPUTE_ASSERT(bias.info()->is_resizable());
2002
2003 add_padding_x({ &lhs, &rhs, &bias, &dst });
2004
2005 // Allocate tensors
2006 lhs.allocator()->allocate();
2007 rhs.allocator()->allocate();
2008 bias.allocator()->allocate();
2009 dst.allocator()->allocate();
2010
2011 ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());
2012 ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());
2013 ARM_COMPUTE_ASSERT(!bias.info()->is_resizable());
2014 ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());
2015
2016 // Fill tensors
2017 fill(AccessorType(lhs), 0);
2018 fill(AccessorType(rhs), 1);
2019 fill(AccessorType(bias), 2);
2020
2021 // Compute GEMM
2022 ITensorPack gemm_pack({ { ACL_SRC_0, &lhs },
2023 { ACL_SRC_1, &rhs },
2024 { ACL_SRC_2, &bias },
2025 { ACL_DST, &dst }
2026 });
2027 gemm.run(gemm_pack);
2028
2029 return dst;
2030 }
2031
2032 SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, bool broadcast_bias,
2033 const ActivationLayerInfo &act_info)
2034 {
2035 TensorShape dst_shape = lhs_shape;
2036 dst_shape[0] = rhs_shape[0];
2037 dst_shape[1] = lhs_shape[1];
2038
2039 // Create reference
2040 SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };
2041 SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };
2042 SimpleTensor<T> bias{ dst_shape, data_type, 1 };
2043
2044 const int n = rhs_shape[0];
2045 const int m = lhs_shape[1];
2046 const int batch_size = lhs_shape[2];
2047
2048 // Fill reference
2049 fill(lhs, 0);
2050 fill(rhs, 1);
2051 fill(bias, 2);
2052
2053 if(broadcast_bias)
2054 {
2055 // In case of broadcast, we simply need to copy the first row into the following "M" ones
2056 for(int i = 1; i < m * batch_size; i++)
2057 {
2058 memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));
2059 }
2060 }
2061
2062 return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);
2063 }
2064
2065 TensorType _target{};
2066 SimpleTensor<T> _reference{};
2067};
2068
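/** Fixture for the native GEMM kernel with a fused post op list (EXPERIMENTAL_POST_OPS) */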
2069template <typename TensorType, typename AccessorType, typename T, typename GEMMOperatorType>
2070class GEMMMatrixMultiplyNativeWithPostOpsValidationFixture : public framework::Fixture
2071{
2072public:
2073 using PostOpArgBroadcast = std::tuple<bool, bool, bool>; // Instructs the fixture whether broadcasting is needed in dimensions 0, 1 and 2 of each PostOp argument
2074public:
2075 template <typename...>
2076 void setup(unsigned int m, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0, DataType data_type, float alpha, float beta, bool broadcast_bias,
2077 const ActivationLayerInfo &act_info, const experimental::PostOpList<PostOpArgBroadcast> &post_ops)
2078 {
2079 GEMMLHSMatrixInfo lhs_info;
2080 lhs_info.m0 = m0;
2081 lhs_info.k0 = k0;
2082
2083 GEMMRHSMatrixInfo rhs_info;
2084 rhs_info.n0 = n0;
2085 rhs_info.k0 = k0;
2086
2087 // Set the tensor shapes for LHS and RHS matrices
2088 const TensorShape lhs_shape(k, m, batch_size);
2089 const TensorShape rhs_shape(n, k, batch_size);
2090 const TensorShape bias_shape(n,
2091 broadcast_bias ? 1 : m,
2092 broadcast_bias ? 1 : batch_size);
2093 const auto post_ops_with_shapes = experimental::transform_post_op_list_arguments<PostOpArgBroadcast, TensorShape>(post_ops,
2094 [ = ](auto broadcast)
2095 {
2096 return TensorShape
2097 {
2098 std::get<0>(broadcast) ? 1 : n,
2099 std::get<1>(broadcast) ? 1 : m,
2100 std::get<2>(broadcast) ? 1 : batch_size,
2101 };
2102 });
2103
2104 _target = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, broadcast_bias, act_info, post_ops_with_shapes);
2105 _reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, broadcast_bias, act_info, post_ops_with_shapes);
2106 }
2107
2108protected:
2109 template <typename U>
2110 void fill(U &&tensor, int i)
2111 {
2112 static_assert(std::is_floating_point<T>::value || std::is_same<T, half>::value, "Only floating point data types supported.");
2113 using DistributionType = typename std::conditional<std::is_same<T, half>::value, arm_compute::utils::uniform_real_distribution_16bit<T>, std::uniform_real_distribution<T>>::type;
2114
2115 DistributionType distribution{ T(-1.0f), T(1.0f) };
2116 library->fill(tensor, distribution, i);
2117
2118 // Fill border with infinity in order to check the presence of NaN values (i.e. inf * 0)
2119 DistributionType distribution_inf{ T(std::numeric_limits<float>::infinity()), T(std::numeric_limits<float>::infinity()) };
2120 library->fill_borders_with_garbage(tensor, distribution_inf, i);
2121 }
2122
2123 TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,
2124 DataType data_type, float alpha, float beta, bool broadcast_bias, const ActivationLayerInfo &act_info, const experimental::PostOpList<TensorShape> &post_ops)
2125 {
2126 // Create tensors
2127 TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);
2128 TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);
2129 TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);
2130 TensorType dst;
2131 // Create post op tensors and populate post op with them
2132 std::vector<TensorType> post_op_tensors_holder{};
2133 auto populated_post_ops = experimental::transform_post_op_list_arguments<TensorShape, ITensorInfo *>(post_ops,
2134 [&post_op_tensors_holder, &data_type](auto shape)
2135 {
2136 auto t = create_tensor<TensorType>(shape, data_type, 1);
2137 post_op_tensors_holder.push_back(std::move(t));
2138 return post_op_tensors_holder.back().info();
2139 });
2140
2141 const unsigned int M = lhs_shape[1];
2142 const unsigned int N = rhs_shape[0];
2143 const unsigned int K = lhs_shape[0];
2144 GEMMKernelInfo kernel_info;
2145 kernel_info.m = M;
2146 kernel_info.n = N;
2147 kernel_info.k = K;
2148 kernel_info.depth_output_gemm3d = 0;
2149 kernel_info.reinterpret_input_as_3d = false;
2150 kernel_info.broadcast_bias = broadcast_bias;
2151 kernel_info.activation_info = act_info;
2152 kernel_info.post_ops = populated_post_ops;
2153
2154 // Create and configure function
2155 GEMMOperatorType gemm;
2156 gemm.configure(lhs.info(), rhs.info(), bias.info(), dst.info(), alpha, beta, lhs_info, rhs_info, kernel_info);
2157
2158 ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());
2159 ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());
2160 ARM_COMPUTE_ASSERT(bias.info()->is_resizable());
2161 for(const auto &tensor : post_op_tensors_holder)
2162 {
2163 ARM_COMPUTE_ASSERT(tensor.info()->is_resizable());
2164 }
2165
2166 add_padding_x({ &lhs, &rhs, &bias, &dst });
2167 for(auto &tensor : post_op_tensors_holder)
2168 {
2169 add_padding_x({ &tensor });
2170 }
2171
2172 // Allocate tensors
2173 lhs.allocator()->allocate();
2174 rhs.allocator()->allocate();
2175 bias.allocator()->allocate();
2176 dst.allocator()->allocate();
2177 for(auto &tensor : post_op_tensors_holder)
2178 {
2179 tensor.allocator()->allocate();
2180 }
2181
2182 ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());
2183 ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());
2184 ARM_COMPUTE_ASSERT(!bias.info()->is_resizable());
2185 ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());
2186 for(const auto &tensor : post_op_tensors_holder)
2187 {
2188 ARM_COMPUTE_ASSERT(!tensor.info()->is_resizable());
2189 }
2190
2191 // Fill tensors
2192 fill(AccessorType(lhs), 0);
2193 fill(AccessorType(rhs), 1);
2194 fill(AccessorType(bias), 2);
2195 for(size_t i = 0; i < post_op_tensors_holder.size(); ++i)
2196 {
2197 fill(AccessorType(post_op_tensors_holder.at(i)), 3 + i);
2198 }
2199
2200 // Compute GEMM
2201 ITensorPack gemm_pack({ { ACL_SRC_0, &lhs },
2202 { ACL_SRC_1, &rhs },
2203 { ACL_SRC_2, &bias },
2204 { ACL_DST, &dst }
2205 });
2206 for(size_t i = 0; i < post_op_tensors_holder.size(); ++i)
2207 {
2208 gemm_pack.add_tensor(experimental::get_post_op_arg_type(i), &post_op_tensors_holder.at(i));
2209 }
2210 gemm.run(gemm_pack);
2211
2212 return dst;
2213 }
2214
2215 SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, bool broadcast_bias,
2216 const ActivationLayerInfo &act_info, const experimental::PostOpList<TensorShape> &post_ops)
2217 {
2218 TensorShape dst_shape = lhs_shape;
2219 dst_shape[0] = rhs_shape[0];
2220 dst_shape[1] = lhs_shape[1];
2221
2222 // Create reference
2223 SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };
2224 SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };
2225 SimpleTensor<T> bias{ dst_shape, data_type, 1 };
2226 // Create post op tensors and populate post op with them
2227 auto populated_post_ops = experimental::transform_post_op_list_arguments<TensorShape, SimpleTensor<T>>(post_ops, [&data_type](auto shape)
2228 {
2229 return SimpleTensor<T> { shape, data_type, 1 };
2230 });
2231
2232 const int n = rhs_shape[0];
2233 const int m = lhs_shape[1];
2234 const int batch_size = lhs_shape[2];
2235
2236 // Fill reference
2237 int tensor_idx = 0;
2238 fill(lhs, tensor_idx++);
2239 fill(rhs, tensor_idx++);
2240 fill(bias, tensor_idx++);
2241 for(auto &op : populated_post_ops.get_list())
2242 {
2243 for(auto tensor : op->arguments())
2244 {
2245 fill(*tensor, tensor_idx++);
2246 }
2247 }
2248
2249 if(broadcast_bias)
2250 {
2251 // In case of broadcast, we simply need to copy the first row into the following "M" ones
2252 for(int i = 1; i < m * batch_size; i++)
2253 {
2254 memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));
2255 }
2256 }
2257
2258 SimpleTensor<T> out;
2259 out = reference::gemm<T>(lhs, rhs, bias, alpha, beta);
2260 // Ignore activation info if post ops are used instead
2261 if(populated_post_ops.size() > 0)
2262 {
2263 out = reference::post_ops<T>(out, populated_post_ops);
2264 }
2265 else
2266 {
2267 out = reference::activation_layer(out, act_info);
2268 }
2269 return out;
2270 }
2271
2272 TensorType _target{};
2273 SimpleTensor<T> _reference{};
2274};
2275
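/** Fixture for the native GEMM kernel with the output reinterpreted as a 3D tensor (GEMM3D). */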
2276template <typename TensorType, typename AccessorType, typename T, typename GEMMOperatorType>
2277class GEMMMatrixMultiplyNative3DValidationFixture : public framework::Fixture
2278{
2279public:
2280 template <typename...>
2281 void setup(unsigned int m_w, unsigned int m_h, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0, DataType data_type, float alpha, float beta,
2282 const ActivationLayerInfo &act_info)
2283 {
2284 GEMMLHSMatrixInfo lhs_info;
2285 lhs_info.m0 = m0;
2286 lhs_info.k0 = k0;
2287
2288 GEMMRHSMatrixInfo rhs_info;
2289 rhs_info.n0 = n0;
2290 rhs_info.k0 = k0;
2291
2292 // In case of GEMM3D, m is the product between m_w and m_h
2293 const unsigned int m = m_w * m_h;
2294
2295 // Set the tensor shapes for LHS and RHS matrices
2296 const TensorShape lhs_shape(k, m, batch_size);
2297 const TensorShape rhs_shape(n, k, batch_size);
2298 const TensorShape bias_shape(n, 1, 1);
2299
2300 _target = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, m_h, act_info);
2301 _reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, m_h, act_info);
2302 }
2303
2304protected:
2305 template <typename U>
2306 void fill(U &&tensor, int i)
2307 {
2308 static_assert(std::is_floating_point<T>::value || std::is_same<T, half>::value, "Only floating point data types supported.");
2309 using DistributionType = typename std::conditional<std::is_same<T, half>::value, arm_compute::utils::uniform_real_distribution_16bit<T>, std::uniform_real_distribution<T>>::type;
2310
2311 DistributionType distribution{ T(-1.0f), T(1.0f) };
2312 library->fill(tensor, distribution, i);
2313 }
2314
2315 TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,
2316 DataType data_type, float alpha, float beta, unsigned int m_h, const ActivationLayerInfo &act_info)
2317 {
2318 // Create tensors
2319 TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);
2320 TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);
2321 TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);
2322 TensorType dst;
2323
2324 const unsigned int M = lhs_shape[1];
2325 const unsigned int N = rhs_shape[0];
2326 const unsigned int K = lhs_shape[0];
2327 GEMMKernelInfo kernel_info;
2328 kernel_info.m = M;
2329 kernel_info.n = N;
2330 kernel_info.k = K;
2331 kernel_info.depth_output_gemm3d = m_h;
2332 kernel_info.reinterpret_input_as_3d = false;
2333 kernel_info.broadcast_bias = true;
2334 kernel_info.activation_info = act_info;
2335
2336 // The output tensor will be auto-initialized within the function
2337
2338 // Create and configure function
2339 GEMMOperatorType gemm;
2340 gemm.configure(lhs.info(), rhs.info(), bias.info(), dst.info(), alpha, beta, lhs_info, rhs_info, kernel_info);
2341
2342 ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());
2343 ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());
2344 ARM_COMPUTE_ASSERT(bias.info()->is_resizable());
2345
2346 add_padding_x({ &lhs, &rhs, &bias, &dst });
2347
2348 // Allocate tensors
2349 lhs.allocator()->allocate();
2350 rhs.allocator()->allocate();
2351 bias.allocator()->allocate();
2352 dst.allocator()->allocate();
2353
2354 ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());
2355 ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());
2356 ARM_COMPUTE_ASSERT(!bias.info()->is_resizable());
2357 ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());
2358
2359 // Fill tensors
2360 fill(AccessorType(lhs), 0);
2361 fill(AccessorType(rhs), 1);
2362 fill(AccessorType(bias), 2);
2363
2364 // Compute GEMM
2365 ITensorPack gemm_pack({ { ACL_SRC_0, &lhs },
2366 { ACL_SRC_1, &rhs },
2367 { ACL_SRC_2, &bias },
2368 { ACL_DST, &dst }
2369 });
2370 gemm.run(gemm_pack);
2371
2372 return dst;
2373 }
2374
2375 SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, unsigned int m_h,
2376 const ActivationLayerInfo &act_info)
2377 {
2378 TensorShape dst_shape = lhs_shape;
2379 dst_shape.set(0, rhs_shape[0]);
2380 dst_shape.set(1, lhs_shape[1] / m_h);
2381 dst_shape.set(2, m_h);
2382 dst_shape.set(3, lhs_shape[2]);
2383
2384 // Create reference
2385 SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };
2386 SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };
2387 SimpleTensor<T> bias{ dst_shape, data_type, 1 };
2388
2389 const int n = rhs_shape[0];
2390 const int m = lhs_shape[1];
2391 const int batch_size = lhs_shape[2];
2392
2393 // Fill reference
2394 fill(lhs, 0);
2395 fill(rhs, 1);
2396 fill(bias, 2);
2397
2398 // In case of broadcast, we simply need to copy the first row into the following "M" ones
2399 for(int i = 1; i < m * batch_size; i++)
2400 {
2401 memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));
2402 }
2403
2404 return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);
2405 }
2406
2407 TensorType _target{};
2408 SimpleTensor<T> _reference{};
2409};
2410
2411} // namespace validation
2412} // namespace test
2413} // namespace arm_compute
2414#endif /* ARM_COMPUTE_TEST_GEMM_FIXTURE */