Blame - tests/validation/fixtures/GEMMFixture.h - ml/ComputeLibrary

2018-07-26 11:44:03 +0100

[diff] [blame]

52

class GEMMValidationFixture : public framework::Fixture

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

53

{

54

public:

55

template <typename...>

Pablo Tello

2018-10-30 11:18:37 +0000

[diff] [blame]

56

void setup(TensorShape shape_a, TensorShape shape_b, TensorShape shape_c, TensorShape output_shape, float alpha, float beta, bool pretranspose, DataType data_type)

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

57

{

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

58

ARM_COMPUTE_UNUSED(pretranspose);

59

_target = compute_target(shape_a, shape_b, shape_c, output_shape, alpha, beta, data_type);

60

_reference = compute_reference(shape_a, shape_b, output_shape, alpha, beta, data_type);

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

}

protected:

template <typename U>

Pablo Tello

2018-10-30 11:18:37 +0000

[diff] [blame]

65

void fill(U &&tensor, int i, float lo = -1.f, float hi = 1.f)

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

66

{

67

switch(tensor.data_type())

68

{

69

case DataType::F16:

Giorgio Arena

6aeb217

2020-12-15 15:45:43 +0000

[diff] [blame]

70

{

Giorgio Arena

a8e2aeb

2021-01-06 11:34:57 +0000

[diff] [blame]

71

arm_compute::utils::uniform_real_distribution_16bit<half> distribution{ float(lo), float(hi) };

Giorgio Arena

6aeb217

2020-12-15 15:45:43 +0000

[diff] [blame]

72

library->fill(tensor, distribution, i);

73

break;

74

}

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

75

case DataType::F32:

76

{

Giorgio Arena

6aeb217

2020-12-15 15:45:43 +0000

[diff] [blame]

77

std::uniform_real_distribution<float> distribution(lo, hi);

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

78

library->fill(tensor, distribution, i);

break;

}

default:

library->fill_tensor_uniform(tensor, i);

}

}

TensorType compute_target(const TensorShape &shape_a, const TensorShape &shape_b, const TensorShape &shape_c, const TensorShape &output_shape, float alpha, float beta,

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

87

DataType data_type)

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

88

{

89

// Create tensors

Vidhya Sudhan Loganathan

014333d

2018-07-02 09:13:49 +0100

[diff] [blame]

90

TensorType a = create_tensor<TensorType>(shape_a, data_type, 1);

91

TensorType b = create_tensor<TensorType>(shape_b, data_type, 1);

92

TensorType c = create_tensor<TensorType>(shape_c, data_type, 1);

93

TensorType dst = create_tensor<TensorType>(output_shape, data_type, 1);

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

94

95

// Create and configure function

96

FunctionType gemm;

Isabella Gottardi

8e74f44

2018-03-01 16:42:00 +0000

[diff] [blame]

97

// The GEMMinfo includes the values of the depth in case of reinterpreted 3d output.

Gian Marco Iodice

3139f03

2018-11-05 14:26:32 +0000

[diff] [blame]

98

// If the output shape has the same number of dimensions of the input the method called is a 2D matrix multiplication (depth_output_reinterpreted_as_3D = 0),

Isabella Gottardi

8e74f44

2018-03-01 16:42:00 +0000

[diff] [blame]

99

// in the other case we have to use the reinterpreted version of GEMM (depth_output_reinterpreted_as_3D = depth of the 3D output).

Gian Marco Iodice

2019-07-29 14:27:16 +0100

[diff] [blame]

100

gemm.configure(&a,

101

&b,

102

(disable_c) ? nullptr : &c,

103

&dst,

104

alpha, beta,

Georgios Pinitas

4ee8b15

2021-07-16 16:16:43 +0100

[diff] [blame]

105

GEMMInfo(false, false, false, (reinterpret_output_as_3d ? output_shape[2] : 0), reinterpret_input_as_3d, false, GEMMLowpOutputStageInfo(), false, false, (reinterpret_input_as_3d

Gian Marco Iodice

2019-07-29 14:27:16 +0100

[diff] [blame]

106

|| reinterpret_output_as_3d)));

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

107

ARM_COMPUTE_ASSERT(a.info()->is_resizable());

108

ARM_COMPUTE_ASSERT(b.info()->is_resizable());

109

ARM_COMPUTE_ASSERT(c.info()->is_resizable());

110

ARM_COMPUTE_ASSERT(dst.info()->is_resizable());

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

111

Giorgio Arena

2021-03-25 14:54:50 +0000

[diff] [blame]

112

add_padding_x({ &a, &b, &c, &dst });

113

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

114

// Allocate tensors

115

a.allocator()->allocate();

116

b.allocator()->allocate();

117

c.allocator()->allocate();

118

dst.allocator()->allocate();

119

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

120

ARM_COMPUTE_ASSERT(!a.info()->is_resizable());

121

ARM_COMPUTE_ASSERT(!b.info()->is_resizable());

122

ARM_COMPUTE_ASSERT(!c.info()->is_resizable());

123

ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

124

125

// Fill tensors

126

fill(AccessorType(a), 0);

127

fill(AccessorType(b), 1);

Pablo Tello

2018-10-30 11:18:37 +0000

[diff] [blame]

128

if(!disable_c)

129

{

130

fill(AccessorType(c), 2);

131

}

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

132

133

// Compute GEMM function

gemm.run();

return dst;

}

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

139

SimpleTensor<T> compute_reference(const TensorShape &shape_a, const TensorShape &shape_b, const TensorShape &output_shape, float alpha, float beta,

Vidhya Sudhan Loganathan

014333d

2018-07-02 09:13:49 +0100

[diff] [blame]

140

DataType data_type)

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

141

{

Gian Marco Iodice

2018-07-26 11:44:03 +0100

[diff] [blame]

142

TensorShape shape_a_to_use = shape_a;

Gian Marco Iodice

2019-07-29 14:27:16 +0100

[diff] [blame]

143

Gian Marco Iodice

2018-07-26 11:44:03 +0100

[diff] [blame]

144

if(reinterpret_input_as_3d)

145

{

146

// Collapse the second and third dimension if the input is 3D

147

shape_a_to_use.collapse(2U, 1U);

148

}

149

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

150

// Create reference

Gian Marco Iodice

2018-07-26 11:44:03 +0100

[diff] [blame]

151

SimpleTensor<T> a{ shape_a_to_use, data_type, 1 };

Vidhya Sudhan Loganathan

014333d

2018-07-02 09:13:49 +0100

[diff] [blame]

152

SimpleTensor<T> b{ shape_b, data_type, 1 };

Gian Marco Iodice

2019-07-29 14:27:16 +0100

[diff] [blame]

153

SimpleTensor<T> c{ output_shape, data_type, 1 };

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

// Fill reference

fill(a, 0);

fill(b, 1);

Gian Marco Iodice

2019-07-29 14:27:16 +0100

[diff] [blame]

158

fill(c, 2);

159

160

if(reinterpret_input_as_3d || reinterpret_output_as_3d)

Pablo Tello

2018-10-30 11:18:37 +0000

[diff] [blame]

161

{

Gian Marco Iodice

2019-07-29 14:27:16 +0100

[diff] [blame]

162

const int n = shape_b[0];

163

const int m = reinterpret_output_as_3d ? output_shape[1] * output_shape[2] : output_shape[1];

164

const int batch_size = reinterpret_output_as_3d ? output_shape[3] : output_shape[2];

165

166

// In case of broadcast, we need simply copy the first into the following "M" ones

167

for(int i = 1; i < m * batch_size; i++)

168

{

169

memcpy(c.data() + i * n, c.data(), n * sizeof(T));

170

}

Pablo Tello

2018-10-30 11:18:37 +0000

[diff] [blame]

171

}

Gian Marco Iodice

2019-07-29 14:27:16 +0100

[diff] [blame]

172

173

// Setting beta to 0 will effectively disable C for the

174

// computation of the reference: alpha * A * B + 0 * C

175

return reference::gemm<T>(a, b, c, alpha, disable_c ? 0.f : beta);

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

176

}

177

178

TensorType _target{};

179

SimpleTensor<T> _reference{};

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

180

};

181

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

182

template <typename TensorType, typename AccessorType, typename T, typename GEMMOperatorType>

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

183

class GEMMMatrixMultiplyValidationFixture : public framework::Fixture

184

{

185

public:

186

template <typename...>

187

void setup(unsigned int m, unsigned int n, unsigned int k, unsigned int batch_size, float alpha, float beta, bool broadcast_bias, bool fp16_mixed_precision, const ActivationLayerInfo &act_info,

188

DataType data_type, GPUTarget gpu_arch)

189

{

190

// Set the tensor shapes for LHS and RHS matrices

191

const TensorShape lhs_shape(k, m, batch_size);

192

const TensorShape rhs_shape(n, k, batch_size);

193

const TensorShape bias_shape(n,

194

broadcast_bias ? 1 : m,

195

broadcast_bias ? 1 : batch_size);

196

197

_target = compute_target(lhs_shape, rhs_shape, bias_shape, data_type, alpha, beta, broadcast_bias, fp16_mixed_precision, act_info, gpu_arch);

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

198

_reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, broadcast_bias, act_info);

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

}

protected:

template <typename U>

203

void fill(U &&tensor, int i)

204

{

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

205

static_assert(std::is_floating_point<T>::value || std::is_same<T, half>::value, "Only floating point data types supported.");

Giorgio Arena

2021-01-08 10:37:15 +0000

[diff] [blame]

206

using DistributionType = typename std::conditional<std::is_same<T, half>::value, arm_compute::utils::uniform_real_distribution_16bit<T>, std::uniform_real_distribution<T>>::type;

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

207

208

DistributionType distribution{ T(-1.0f), T(1.0f) };

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

209

library->fill(tensor, distribution, i);

210

211

// Fill border with infinity in order to check the presence of NaN values (i.e. inf * 0)

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

212

DistributionType distribution_inf{ T(std::numeric_limits<float>::infinity()), T(std::numeric_limits<float>::infinity()) };

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

213

library->fill_borders_with_garbage(tensor, distribution_inf, i);

214

}

215

216

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, DataType data_type, float alpha, float beta, bool broadcast_bias,

217

bool fp16_mixed_precision, const ActivationLayerInfo &act_info, GPUTarget gpu_arch)

218

{

219

// Create tensors

220

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

221

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

222

TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);

223

TensorType dst;

224

225

const unsigned int m = lhs_shape[1];

226

const unsigned int n = rhs_shape[0];

227

const unsigned int k = lhs_shape[0];

228

GEMMReshapeInfo reshape_info(m, n, k, 1, 1, 0, false, broadcast_bias);

229

230

// The output tensor will be auto-initialized within the function

231

232

// Create and configure function

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

233

GEMMOperatorType gemm;

234

gemm.configure(gpu_arch, lhs.info(), rhs.info(), bias.info(), dst.info(), alpha, beta, false, reshape_info, fp16_mixed_precision, act_info);

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

235

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

236

ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());

237

ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());

238

ARM_COMPUTE_ASSERT(bias.info()->is_resizable());

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

239

Giorgio Arena

2021-03-25 14:54:50 +0000

[diff] [blame]

240

add_padding_x({ &lhs, &rhs, &bias, &dst });

241

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

242

// Allocate tensors

243

lhs.allocator()->allocate();

244

rhs.allocator()->allocate();

245

bias.allocator()->allocate();

246

dst.allocator()->allocate();

247

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

248

ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());

249

ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());

250

ARM_COMPUTE_ASSERT(!bias.info()->is_resizable());

251

ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

252

253

// Fill tensors

254

fill(AccessorType(lhs), 0);

255

fill(AccessorType(rhs), 1);

256

fill(AccessorType(bias), 2);

257

258

// Compute GEMM

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

259

ITensorPack gemm_pack({ { ACL_SRC_0, &lhs },

260

{ ACL_SRC_1, &rhs },

261

{ ACL_SRC_2, &bias },

262

{ ACL_DST, &dst }

263

});

264

gemm.run(gemm_pack);

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

return dst;

}

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

269

SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, bool broadcast_bias,

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

270

const ActivationLayerInfo &act_info)

271

{

272

TensorShape dst_shape = lhs_shape;

273

dst_shape[0] = rhs_shape[0];

274

dst_shape[1] = lhs_shape[1];

275

276

// Create reference

277

SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };

278

SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };

279

SimpleTensor<T> bias{ dst_shape, data_type, 1 };

280

281

const int n = rhs_shape[0];

282

const int m = lhs_shape[1];

283

const int batch_size = lhs_shape[2];

// Fill reference

fill(lhs, 0);

fill(rhs, 1);

fill(bias, 2);

if(broadcast_bias)

{

// In case of broadcast, we need simply copy the first into the following "M" ones

293

for(int i = 1; i < m * batch_size; i++)

294

{

295

memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));

}

}

return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);

300

}

301

302

TensorType _target{};

303

SimpleTensor<T> _reference{};

304

};

305

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

306

template <typename TensorType, typename AccessorType, typename T, typename GEMMOperatorType>

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

307

class GEMMMatrixMultiply3DValidationFixture : public framework::Fixture

308

{

309

public:

310

template <typename...>

311

void setup(unsigned int m_w, unsigned int m_h, unsigned int n, unsigned int k, unsigned int batch_size, float alpha, float beta, bool broadcast_bias, bool fp16_mixed_precision,

312

const ActivationLayerInfo &act_info, DataType data_type, GPUTarget gpu_arch)

313

{

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

314

ARM_COMPUTE_UNUSED(broadcast_bias);

315

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

316

// In case of GEMM3D, m is the product between m_w and m_h

317

const unsigned int m = m_w * m_h;

318

319

// Set the tensor shapes for LHS and RHS matrices

320

const TensorShape lhs_shape(k, m, batch_size);

321

const TensorShape rhs_shape(n, k, batch_size);

322

const TensorShape bias_shape(n, 1, 1);

323

324

_target = compute_target(lhs_shape, rhs_shape, bias_shape, data_type, alpha, beta, m_h, fp16_mixed_precision, act_info, gpu_arch);

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

325

_reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, m_h, act_info);

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

}

protected:

template <typename U>

330

void fill(U &&tensor, int i)

331

{

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

332

static_assert(std::is_floating_point<T>::value || std::is_same<T, half>::value, "Only floating point data types supported.");

Giorgio Arena

2021-01-08 10:37:15 +0000

[diff] [blame]

333

using DistributionType = typename std::conditional<std::is_same<T, half>::value, arm_compute::utils::uniform_real_distribution_16bit<T>, std::uniform_real_distribution<T>>::type;

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

334

335

DistributionType distribution{ T(-1.0f), T(1.0f) };

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

336

library->fill(tensor, distribution, i);

337

}

338

339

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, DataType data_type, float alpha, float beta, unsigned int m_h,

340

bool fp16_mixed_precision, const ActivationLayerInfo &act_info, GPUTarget gpu_arch)

341

{

342

// Create tensors

343

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

344

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

345

TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);

346

TensorType dst;

347

348

const unsigned int m = lhs_shape[1];

349

const unsigned int n = rhs_shape[0];

350

const unsigned int k = lhs_shape[0];

351

GEMMReshapeInfo reshape_info(m, n, k, 1, 1, m_h, false, true);

352

353

// The output tensor will be auto-initialized within the function

354

355

// Create and configure function

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

356

GEMMOperatorType gemm;

357

gemm.configure(gpu_arch, lhs.info(), rhs.info(), bias.info(), dst.info(), alpha, beta, false, reshape_info, fp16_mixed_precision, act_info);

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

358

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

359

ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());

360

ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());

361

ARM_COMPUTE_ASSERT(bias.info()->is_resizable());

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

362

Giorgio Arena

2021-03-25 14:54:50 +0000

[diff] [blame]

363

add_padding_x({ &lhs, &rhs, &bias, &dst });

364

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

365

// Allocate tensors

366

lhs.allocator()->allocate();

367

rhs.allocator()->allocate();

368

bias.allocator()->allocate();

369

dst.allocator()->allocate();

370

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

371

ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());

372

ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());

373

ARM_COMPUTE_ASSERT(!bias.info()->is_resizable());

374

ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

375

376

// Fill tensors

377

fill(AccessorType(lhs), 0);

378

fill(AccessorType(rhs), 1);

379

fill(AccessorType(bias), 2);

380

381

// Compute GEMM

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

382

ITensorPack gemm_pack({ { ACL_SRC_0, &lhs },

383

{ ACL_SRC_1, &rhs },

384

{ ACL_SRC_2, &bias },

385

{ ACL_DST, &dst }

386

});

387

gemm.run(gemm_pack);

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

return dst;

}

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

392

SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, unsigned int m_h,

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

393

const ActivationLayerInfo &act_info)

394

{

395

TensorShape dst_shape = lhs_shape;

396

dst_shape.set(0, rhs_shape[0]);

397

dst_shape.set(1, lhs_shape[1] / m_h);

398

dst_shape.set(2, m_h);

399

dst_shape.set(3, lhs_shape[2]);

400

401

// Create reference

402

SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };

403

SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };

404

SimpleTensor<T> bias{ dst_shape, data_type, 1 };

405

406

const int n = rhs_shape[0];

407

const int m = lhs_shape[1];

408

const int batch_size = lhs_shape[2];

// Fill reference

fill(lhs, 0);

fill(rhs, 1);

fill(bias, 2);

// In case of broadcast, we need simply copy the first into the following "M" ones

416

for(int i = 1; i < m * batch_size; i++)

417

{

418

memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));

419

}

420

421

return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);

422

}

423

424

TensorType _target{};

425

SimpleTensor<T> _reference{};

426

};

427

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

428

template <typename TensorType, typename AccessorType, typename T, typename ReshapeLHSOperatorType, typename ReshapeRHSOperatorType, typename GEMMOperatorType>

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

429

class GEMMMatrixMultiplyInterleavedTransposedValidationFixture : public framework::Fixture

430

{

431

public:

432

template <typename...>

433

void setup(unsigned int m, unsigned int n, unsigned int k, unsigned int batch_size, float alpha, float beta, unsigned int v0, unsigned int h0, bool broadcast_bias, bool fp16_mixed_precision,

434

const ActivationLayerInfo &act_info, DataType data_type, GPUTarget gpu_arch)

435

{

436

GEMMLHSMatrixInfo lhs_info;

lhs_info.m0 = 4;

lhs_info.k0 = 4;

lhs_info.v0 = v0;

lhs_info.interleave = true;

441

lhs_info.transpose = true;

442

443

GEMMRHSMatrixInfo rhs_info;

444

rhs_info.n0 = 16 / sizeof(T);

445

rhs_info.k0 = 1;

446

rhs_info.h0 = h0;

447

rhs_info.interleave = false;

448

rhs_info.transpose = false;

449

450

// Set the tensor shapes for LHS and RHS matrices

451

const TensorShape lhs_shape(k, m, batch_size);

452

const TensorShape rhs_shape(n, k, batch_size);

453

const TensorShape bias_shape(n,

454

broadcast_bias ? 1 : m,

455

broadcast_bias ? 1 : batch_size);

456

457

_target = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, broadcast_bias, fp16_mixed_precision, act_info, gpu_arch);

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

458

_reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, broadcast_bias, act_info);

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

}

protected:

template <typename U>

463

void fill(U &&tensor, int i)

464

{

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

465

static_assert(std::is_floating_point<T>::value || std::is_same<T, half>::value, "Only floating point data types supported.");

Giorgio Arena

2021-01-08 10:37:15 +0000

[diff] [blame]

466

using DistributionType = typename std::conditional<std::is_same<T, half>::value, arm_compute::utils::uniform_real_distribution_16bit<T>, std::uniform_real_distribution<T>>::type;

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

467

468

DistributionType distribution{ T(-1.0f), T(1.0f) };

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

469

library->fill(tensor, distribution, i);

470

471

// Fill border with infinity in order to check the presence of NaN values (i.e. inf * 0)

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

472

DistributionType distribution_inf{ T(std::numeric_limits<float>::infinity()), T(std::numeric_limits<float>::infinity()) };

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

473

library->fill_borders_with_garbage(tensor, distribution_inf, i);

474

}

475

476

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,

477

DataType data_type, float alpha, float beta, bool broadcast_bias, bool fp16_mixed_precision, const ActivationLayerInfo &act_info, GPUTarget gpu_arch)

478

{

479

// Create tensors

480

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

481

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

482

TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);

483

TensorType lhs_reshaped;

484

TensorType rhs_reshaped;

485

TensorType dst;

486

487

const unsigned int m = lhs_shape[1];

488

const unsigned int n = rhs_shape[0];

489

const unsigned int k = lhs_shape[0];

490

GEMMReshapeInfo reshape_info(m, n, k, rhs_info.h0, lhs_info.v0, 0, false, broadcast_bias);

491

492

// The output tensor will be auto-initialized within the function

493

494

// Create and configure function

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

495

ReshapeLHSOperatorType reshape_lhs;

496

ReshapeRHSOperatorType reshape_rhs;

497

GEMMOperatorType gemm;

498

reshape_lhs.configure(lhs.info(), lhs_reshaped.info(), lhs_info);

499

reshape_rhs.configure(rhs.info(), rhs_reshaped.info(), rhs_info);

500

gemm.configure(gpu_arch, lhs_reshaped.info(), rhs_reshaped.info(), bias.info(), dst.info(), alpha, beta, true, reshape_info, fp16_mixed_precision, act_info);

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

501

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

502

ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());

503

ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());

504

ARM_COMPUTE_ASSERT(bias.info()->is_resizable());

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

505

Georgios Pinitas

2021-04-13 13:35:58 +0100

[diff] [blame]

506

// We do not pad when using image as it needs to comply to strict pitch alignment restrictions

Giorgio Arena

2021-03-25 14:54:50 +0000

[diff] [blame]

507

if(!rhs_info.export_to_cl_image)

508

{

509

add_padding_x({ &lhs, &rhs, &lhs_reshaped, &rhs_reshaped, &bias, &dst });

510

}

511

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

512

// Allocate tensors

513

lhs.allocator()->allocate();

514

rhs.allocator()->allocate();

515

lhs_reshaped.allocator()->allocate();

516

rhs_reshaped.allocator()->allocate();

517

bias.allocator()->allocate();

518

dst.allocator()->allocate();

519

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

520

ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());

521

ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());

522

ARM_COMPUTE_ASSERT(!bias.info()->is_resizable());

523

ARM_COMPUTE_ASSERT(!lhs_reshaped.info()->is_resizable());

524

ARM_COMPUTE_ASSERT(!rhs_reshaped.info()->is_resizable());

525

ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

526

527

// Fill tensors

528

fill(AccessorType(lhs), 0);

529

fill(AccessorType(rhs), 1);

530

fill(AccessorType(bias), 2);

531

532

// Compute GEMM

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

533

ITensorPack reshape_lhs_pack = { { ACL_SRC, &lhs }, { ACL_DST, &lhs_reshaped } };

534

reshape_lhs.run(reshape_lhs_pack);

535

ITensorPack reshape_rhs_pack = { { ACL_SRC, &rhs }, { ACL_DST, &rhs_reshaped } };

536

reshape_rhs.run(reshape_rhs_pack);

537

ITensorPack gemm_pack({ { ACL_SRC_0, &lhs_reshaped },

538

{ ACL_SRC_1, &rhs_reshaped },

539

{ ACL_SRC_2, &bias },

540

{ ACL_DST, &dst }

541

});

542

gemm.run(gemm_pack);

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

return dst;

}

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

547

SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, bool broadcast_bias,

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

548

const ActivationLayerInfo &act_info)

549

{

550

TensorShape dst_shape = lhs_shape;

551

dst_shape[0] = rhs_shape[0];

552

dst_shape[1] = lhs_shape[1];

553

554

// Create reference

555

SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };

556

SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };

557

SimpleTensor<T> bias{ dst_shape, data_type, 1 };

558

559

const int n = rhs_shape[0];

560

const int m = lhs_shape[1];

561

const int batch_size = lhs_shape[2];

// Fill reference

fill(lhs, 0);

fill(rhs, 1);

fill(bias, 2);

if(broadcast_bias)

{

// In case of broadcast, we need simply copy the first into the following "M" ones

571

for(int i = 1; i < m * batch_size; i++)

572

{

573

memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));

}

}

return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);

578

}

579

580

TensorType _target{};

581

SimpleTensor<T> _reference{};

582

};

583

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

584

template <typename TensorType, typename AccessorType, typename T, typename ReshapeLHSOperatorType, typename ReshapeRHSOperatorType, typename GEMMOperatorType>

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

585

class GEMMMatrixMultiplyInterleavedTransposed3DValidationFixture : public framework::Fixture

586

{

587

public:

588

template <typename...>

589

void setup(unsigned int m_w, unsigned int m_h, unsigned int n, unsigned int k, unsigned int batch_size, float alpha, float beta, unsigned int v0, unsigned int h0, bool broadcast_bias,

590

bool fp16_mixed_precision, const ActivationLayerInfo &act_info, DataType data_type, GPUTarget gpu_arch)

591

{

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

592

ARM_COMPUTE_UNUSED(broadcast_bias);

593

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

594

GEMMLHSMatrixInfo lhs_info;

lhs_info.m0 = 4;

lhs_info.k0 = 4;

lhs_info.v0 = v0;

lhs_info.interleave = true;

599

lhs_info.transpose = true;

600

601

GEMMRHSMatrixInfo rhs_info;

602

rhs_info.n0 = 16 / sizeof(T);

603

rhs_info.k0 = 1;

604

rhs_info.h0 = h0;

605

rhs_info.interleave = false;

606

rhs_info.transpose = false;

607

608

// In case of GEMM3D, m is the product between m_w and m_h

609

const unsigned int m = m_w * m_h;

610

611

// Set the tensor shapes for LHS and RHS matrices

612

const TensorShape lhs_shape(k, m, batch_size);

613

const TensorShape rhs_shape(n, k, batch_size);

614

const TensorShape bias_shape(n, 1, 1);

615

616

_target = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, m_h, fp16_mixed_precision, act_info, gpu_arch);

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

617

_reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, m_h, act_info);

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

}

protected:

template <typename U>

622

void fill(U &&tensor, int i)

623

{

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

624

static_assert(std::is_floating_point<T>::value || std::is_same<T, half>::value, "Only floating point data types supported.");

Giorgio Arena

2021-01-08 10:37:15 +0000

[diff] [blame]

625

using DistributionType = typename std::conditional<std::is_same<T, half>::value, arm_compute::utils::uniform_real_distribution_16bit<T>, std::uniform_real_distribution<T>>::type;

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

626

627

DistributionType distribution{ T(-1.0f), T(1.0f) };

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

628

library->fill(tensor, distribution, i);

629

}

630

631

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,

632

DataType data_type, float alpha, float beta, unsigned int m_h, bool fp16_mixed_precision, const ActivationLayerInfo &act_info, GPUTarget gpu_arch)

633

{

634

// Create tensors

635

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

636

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

637

TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);

638

TensorType lhs_reshaped;

639

TensorType rhs_reshaped;

640

TensorType dst;

641

642

const unsigned int m = lhs_shape[1];

643

const unsigned int n = rhs_shape[0];

644

const unsigned int k = lhs_shape[0];

645

GEMMReshapeInfo reshape_info(m, n, k, rhs_info.h0, lhs_info.v0, m_h, false, true);

646

647

// The output tensor will be auto-initialized within the function

648

649

// Create and configure function

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

650

ReshapeLHSOperatorType reshape_lhs;

651

ReshapeRHSOperatorType reshape_rhs;

652

GEMMOperatorType gemm;

653

reshape_lhs.configure(lhs.info(), lhs_reshaped.info(), lhs_info);

654

reshape_rhs.configure(rhs.info(), rhs_reshaped.info(), rhs_info);

655

gemm.configure(gpu_arch, lhs_reshaped.info(), rhs_reshaped.info(), bias.info(), dst.info(), alpha, beta, true, reshape_info, fp16_mixed_precision, act_info);

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

656

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

657

ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());

658

ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());

659

ARM_COMPUTE_ASSERT(bias.info()->is_resizable());

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

660

Georgios Pinitas

2021-04-13 13:35:58 +0100

[diff] [blame]

661

// We do not pad when using image as it needs to comply to strict pitch alignment restrictions

Giorgio Arena

2021-03-25 14:54:50 +0000

[diff] [blame]

662

if(!rhs_info.export_to_cl_image)

663

{

664

add_padding_x({ &lhs, &rhs, &lhs_reshaped, &rhs_reshaped, &bias, &dst });

665

}

666

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

667

// Allocate tensors

668

lhs.allocator()->allocate();

669

rhs.allocator()->allocate();

670

lhs_reshaped.allocator()->allocate();

671

rhs_reshaped.allocator()->allocate();

672

bias.allocator()->allocate();

673

dst.allocator()->allocate();

674

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

675

ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());

676

ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());

677

ARM_COMPUTE_ASSERT(!lhs_reshaped.info()->is_resizable());

678

ARM_COMPUTE_ASSERT(!rhs_reshaped.info()->is_resizable());

679

ARM_COMPUTE_ASSERT(!bias.info()->is_resizable());

680

ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

681

682

// Fill tensors

683

fill(AccessorType(lhs), 0);

684

fill(AccessorType(rhs), 1);

685

fill(AccessorType(bias), 2);

686

687

// Compute GEMM

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

688

ITensorPack reshape_lhs_pack = { { ACL_SRC, &lhs }, { ACL_DST, &lhs_reshaped } };

689

reshape_lhs.run(reshape_lhs_pack);

690

ITensorPack reshape_rhs_pack = { { ACL_SRC, &rhs }, { ACL_DST, &rhs_reshaped } };

691

reshape_rhs.run(reshape_rhs_pack);

692

ITensorPack gemm_pack({ { ACL_SRC_0, &lhs_reshaped },

693

{ ACL_SRC_1, &rhs_reshaped },

694

{ ACL_SRC_2, &bias },

695

{ ACL_DST, &dst }

696

});

697

gemm.run(gemm_pack);

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

return dst;

}

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

702

SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, unsigned int m_h,

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

703

const ActivationLayerInfo &act_info)

704

{

705

TensorShape dst_shape = lhs_shape;

706

dst_shape.set(0, rhs_shape[0]);

707

dst_shape.set(1, lhs_shape[1] / m_h);

708

dst_shape.set(2, m_h);

709

dst_shape.set(3, lhs_shape[2]);

710

711

// Create reference

712

SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };

713

SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };

714

SimpleTensor<T> bias{ dst_shape, data_type, 1 };

715

716

const int n = rhs_shape[0];

717

const int m = lhs_shape[1];

718

const int batch_size = lhs_shape[2];

// Fill reference

fill(lhs, 0);

fill(rhs, 1);

fill(bias, 2);

// In case of broadcast, we need simply copy the first into the following "M" ones

726

for(int i = 1; i < m * batch_size; i++)

727

{

728

memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));

729

}

730

731

return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);

732

}

733

734

TensorType _target{};

735

SimpleTensor<T> _reference{};

736

};

737

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

738

template <typename TensorType, typename AccessorType, typename T, typename ReshapeLHSOperatorType, typename ReshapeRHSOperatorType, typename GEMMOperatorType, bool fp_mixed_precision = false>

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

739

class GEMMMatrixMultiplyReshapedValidationFixture : public framework::Fixture

740

{

741

public:

742

template <typename...>

743

void setup(unsigned int m, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0, unsigned int v0, unsigned int h0, bool interleave_lhs,

Gian Marco Iodice

2020-06-10 17:59:30 +0100

[diff] [blame]

744

bool interleave_rhs, bool export_to_cl_image, DataType data_type, float alpha, float beta, bool broadcast_bias, bool lhs_transpose, const ActivationLayerInfo &act_info)

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

745

{

746

GEMMLHSMatrixInfo lhs_info;

lhs_info.m0 = m0;

lhs_info.k0 = k0;

lhs_info.v0 = v0;

lhs_info.interleave = interleave_lhs;

Giorgio Arena

ae99b6e

2019-08-01 14:22:12 +0100

[diff] [blame]

751

lhs_info.transpose = lhs_transpose;

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

752

753

GEMMRHSMatrixInfo rhs_info;

Gian Marco Iodice

2020-06-10 17:59:30 +0100

[diff] [blame]

rhs_info.n0 = n0;

rhs_info.k0 = k0;

rhs_info.h0 = h0;

rhs_info.interleave = interleave_rhs;

758

rhs_info.transpose = !lhs_transpose;

759

rhs_info.export_to_cl_image = export_to_cl_image;

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

760

761

// Set the tensor shapes for LHS and RHS matrices

762

const TensorShape lhs_shape(k, m, batch_size);

763

const TensorShape rhs_shape(n, k, batch_size);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

764

const TensorShape bias_shape(n,

765

broadcast_bias ? 1 : m,

766

broadcast_bias ? 1 : batch_size);

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

767

Sheri Zhang

2020-11-16 21:17:28 +0000

[diff] [blame]

768

_target = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, broadcast_bias, act_info);

769

if(validate_result)

770

{

771

_reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, broadcast_bias, act_info);

772

}

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

}

protected:

template <typename U>

777

void fill(U &&tensor, int i)

778

{

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

779

static_assert(std::is_floating_point<T>::value || std::is_same<T, half>::value, "Only floating point data types supported.");

Giorgio Arena

2021-01-08 10:37:15 +0000

[diff] [blame]

780

using DistributionType = typename std::conditional<std::is_same<T, half>::value, arm_compute::utils::uniform_real_distribution_16bit<T>, std::uniform_real_distribution<T>>::type;

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

781

782

DistributionType distribution{ T(-1.0f), T(1.0f) };

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

783

library->fill(tensor, distribution, i);

Gian Marco Iodice

b87b95e

2019-01-21 17:14:31 +0000

[diff] [blame]

784

785

// Fill border with infinity in order to check the presence of NaN values (i.e. inf * 0)

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

786

DistributionType distribution_inf{ T(std::numeric_limits<float>::infinity()), T(std::numeric_limits<float>::infinity()) };

Gian Marco Iodice

b87b95e

2019-01-21 17:14:31 +0000

[diff] [blame]

787

library->fill_borders_with_garbage(tensor, distribution_inf, i);

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

788

}

789

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

790

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

791

DataType data_type, float alpha, float beta, bool broadcast_bias, const ActivationLayerInfo &act_info)

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

792

{

793

// Create tensors

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

794

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

795

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

796

TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

797

TensorType lhs_reshaped;

798

TensorType rhs_reshaped;

799

TensorType dst;

800

801

const unsigned int M = lhs_shape[1];

802

const unsigned int N = rhs_shape[0];

803

const unsigned int K = lhs_shape[0];

Gian Marco Iodice

2019-06-26 17:18:11 +0100

[diff] [blame]

804

GEMMKernelInfo kernel_info;

kernel_info.m = M;

kernel_info.n = N;

kernel_info.k = K;

kernel_info.depth_output_gemm3d = 0;

809

kernel_info.reinterpret_input_as_3d = false;

810

kernel_info.broadcast_bias = broadcast_bias;

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

811

kernel_info.activation_info = act_info;

Gian Marco Iodice

0c17aa2

2019-09-27 09:23:15 +0100

[diff] [blame]

812

kernel_info.fp_mixed_precision = fp_mixed_precision;

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

813

814

// The output tensor will be auto-initialized within the function

815

816

// Create and configure function

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

817

ReshapeLHSOperatorType reshape_lhs;

818

ReshapeRHSOperatorType reshape_rhs;

819

GEMMOperatorType gemm;

Sheri Zhang

2020-11-16 21:17:28 +0000

[diff] [blame]

820

821

validate_result = bool(reshape_rhs.validate(rhs.info(), rhs_reshaped.info(), rhs_info));

822

validate_result = validate_result || !rhs_info.export_to_cl_image;

if(!validate_result)

{

return nullptr;

}

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

828

reshape_lhs.configure(lhs.info(), lhs_reshaped.info(), lhs_info);

829

reshape_rhs.configure(rhs.info(), rhs_reshaped.info(), rhs_info);

830

gemm.configure(lhs_reshaped.info(), rhs_reshaped.info(), bias.info(), dst.info(), alpha, beta, lhs_info, rhs_info, kernel_info);

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

831

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

832

ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());

833

ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());

834

ARM_COMPUTE_ASSERT(bias.info()->is_resizable());

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

835

Georgios Pinitas

2021-04-13 13:35:58 +0100

[diff] [blame]

836

// We do not pad when using image as it needs to comply to strict pitch alignment restrictions

Giorgio Arena

2021-03-25 14:54:50 +0000

[diff] [blame]

837

if(!rhs_info.export_to_cl_image)

838

{

839

add_padding_x({ &lhs, &rhs, &lhs_reshaped, &rhs_reshaped, &bias, &dst });

840

}

841

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

842

// Allocate tensors

843

lhs.allocator()->allocate();

844

rhs.allocator()->allocate();

845

lhs_reshaped.allocator()->allocate();

846

rhs_reshaped.allocator()->allocate();

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

847

bias.allocator()->allocate();

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

848

dst.allocator()->allocate();

849

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

850

ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());

851

ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());

852

ARM_COMPUTE_ASSERT(!bias.info()->is_resizable());

853

ARM_COMPUTE_ASSERT(!lhs_reshaped.info()->is_resizable());

854

ARM_COMPUTE_ASSERT(!rhs_reshaped.info()->is_resizable());

855

ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

856

857

// Fill tensors

858

fill(AccessorType(lhs), 0);

859

fill(AccessorType(rhs), 1);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

860

fill(AccessorType(bias), 2);

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

861

862

// Compute GEMM

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

863

ITensorPack reshape_lhs_pack = { { ACL_SRC, &lhs }, { ACL_DST, &lhs_reshaped } };

864

reshape_lhs.run(reshape_lhs_pack);

865

ITensorPack reshape_rhs_pack = { { ACL_SRC, &rhs }, { ACL_DST, &rhs_reshaped } };

866

reshape_rhs.run(reshape_rhs_pack);

867

ITensorPack gemm_pack({ { ACL_SRC_0, &lhs_reshaped },

868

{ ACL_SRC_1, &rhs_reshaped },

869

{ ACL_SRC_2, &bias },

870

{ ACL_DST, &dst }

871

});

872

gemm.run(gemm_pack);

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

return dst;

}

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

877

SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, bool broadcast_bias,

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

878

const ActivationLayerInfo &act_info)

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

879

{

880

TensorShape dst_shape = lhs_shape;

881

dst_shape[0] = rhs_shape[0];

882

dst_shape[1] = lhs_shape[1];

883

884

// Create reference

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

885

SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };

886

SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

887

SimpleTensor<T> bias{ dst_shape, data_type, 1 };

888

889

const int n = rhs_shape[0];

890

const int m = lhs_shape[1];

891

const int batch_size = lhs_shape[2];

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

// Fill reference

fill(lhs, 0);

fill(rhs, 1);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

896

fill(bias, 2);

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

897

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

898

if(broadcast_bias)

899

{

900

// In case of broadcast, we need simply copy the first into the following "M" ones

901

for(int i = 1; i < m * batch_size; i++)

902

{

903

memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));

}

}

Gian Marco Iodice

2019-09-27 09:23:15 +0100

[diff] [blame]

907

if(fp_mixed_precision)

908

{

909

return reference::activation_layer(reference::gemm_mixed_precision<T>(lhs, rhs, bias, alpha, beta), act_info);

}

else

{

return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);

914

}

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

915

}

916

Sheri Zhang

2020-11-16 21:17:28 +0000

[diff] [blame]

917

bool validate_result = true;

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

918

TensorType _target{};

919

SimpleTensor<T> _reference{};

920

};

921

SiCongLi

1af5416

2021-10-06 15:25:57 +0100

[diff] [blame]

922

/** (EXPERIMENTAL_POST_OPS)*/

923

template <typename TensorType, typename AccessorType, typename T, typename ReshapeLHSOperatorType, typename ReshapeRHSOperatorType, typename GEMMOperatorType, bool fp_mixed_precision = false>

924

class GEMMMatrixMultiplyReshapedWithPostOpsValidationFixture : public framework::Fixture

925

{

926

public:

927

using PostOpArgBroadcast = std::tuple<bool, bool, bool>; // Instruct fixture if we need broadcasting in dimension 0, 1, 2 of each PostOp argument

928

public:

929

template <typename...>

930

void setup(unsigned int m, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0, unsigned int v0, unsigned int h0, bool interleave_lhs,

931

bool interleave_rhs, bool export_to_cl_image, DataType data_type, float alpha, float beta, bool broadcast_bias, bool lhs_transpose, const ActivationLayerInfo &act_info,

932

const experimental::PostOpList<PostOpArgBroadcast> &post_ops)

933

{

934

GEMMLHSMatrixInfo lhs_info;

lhs_info.m0 = m0;

lhs_info.k0 = k0;

lhs_info.v0 = v0;

lhs_info.interleave = interleave_lhs;

939

lhs_info.transpose = lhs_transpose;

940

941

GEMMRHSMatrixInfo rhs_info;

rhs_info.n0 = n0;

rhs_info.k0 = k0;

rhs_info.h0 = h0;

rhs_info.interleave = interleave_rhs;

946

rhs_info.transpose = !lhs_transpose;

947

rhs_info.export_to_cl_image = export_to_cl_image;

948

949

// Set the tensor shapes for LHS and RHS matrices

950

const TensorShape lhs_shape(k, m, batch_size);

951

const TensorShape rhs_shape(n, k, batch_size);

952

const TensorShape bias_shape(n,

953

broadcast_bias ? 1 : m,

954

broadcast_bias ? 1 : batch_size);

955

auto post_ops_with_shapes = experimental::transform_post_op_list_arguments<PostOpArgBroadcast, TensorShape>(post_ops,

956

[ = ](auto broadcast)

{

return TensorShape

{

std::get<0>(broadcast) ? 1 : n,

961

std::get<1>(broadcast) ? 1 : m,

962

std::get<2>(broadcast) ? 1 : batch_size,

};

});

_target = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, broadcast_bias, act_info, post_ops_with_shapes);

967

if(validate_result)

968

{

969

_reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, broadcast_bias, act_info, post_ops_with_shapes);

}

}

protected:

template <typename U>

975

void fill(U &&tensor, int i)

976

{

977

static_assert(std::is_floating_point<T>::value || std::is_same<T, half>::value, "Only floating point data types supported.");

978

using DistributionType = typename std::conditional<std::is_same<T, half>::value, arm_compute::utils::uniform_real_distribution_16bit<T>, std::uniform_real_distribution<T>>::type;

979

980

DistributionType distribution{ T(-1.0f), T(1.0f) };

981

library->fill(tensor, distribution, i);

982

983

// Fill border with infinity in order to check the presence of NaN values (i.e. inf * 0)

984

DistributionType distribution_inf{ T(std::numeric_limits<float>::infinity()), T(std::numeric_limits<float>::infinity()) };

985

library->fill_borders_with_garbage(tensor, distribution_inf, i);

986

}

987

988

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,

989

DataType data_type, float alpha, float beta, bool broadcast_bias, const ActivationLayerInfo &act_info, const experimental::PostOpList<TensorShape> &post_ops)

990

{

991

// Create tensors

992

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

993

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

994

TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);

995

996

// Create post op tensors and populate post op with them

997

std::vector<TensorType> post_op_tensors_holder{};

998

auto populated_post_ops = experimental::transform_post_op_list_arguments<TensorShape, ITensorInfo *>(post_ops,

999

[&post_op_tensors_holder, &data_type](auto shape)

1000

{

1001

auto t = create_tensor<TensorType>(shape, data_type, 1);

1002

post_op_tensors_holder.push_back(std::move(t));

1003

return post_op_tensors_holder.back().info();

1004

});

1005

TensorType lhs_reshaped;

1006

TensorType rhs_reshaped;

1007

TensorType dst;

1008

1009

const unsigned int M = lhs_shape[1];

1010

const unsigned int N = rhs_shape[0];

1011

const unsigned int K = lhs_shape[0];

1012

GEMMKernelInfo kernel_info;

kernel_info.m = M;

kernel_info.n = N;

kernel_info.k = K;

kernel_info.depth_output_gemm3d = 0;

1017

kernel_info.reinterpret_input_as_3d = false;

1018

kernel_info.broadcast_bias = broadcast_bias;

1019

kernel_info.activation_info = act_info;

1020

kernel_info.fp_mixed_precision = fp_mixed_precision;

1021

kernel_info.post_ops = populated_post_ops;

1022

1023

// The output tensor will be auto-initialized within the function

1024

1025

// Create and configure function

1026

ReshapeLHSOperatorType reshape_lhs;

1027

ReshapeRHSOperatorType reshape_rhs;

1028

GEMMOperatorType gemm;

1029

1030

validate_result = bool(reshape_rhs.validate(rhs.info(), rhs_reshaped.info(), rhs_info));

1031

validate_result = validate_result || !rhs_info.export_to_cl_image;

if(!validate_result)

{

return nullptr;

}

reshape_lhs.configure(lhs.info(), lhs_reshaped.info(), lhs_info);

1038

reshape_rhs.configure(rhs.info(), rhs_reshaped.info(), rhs_info);

1039

gemm.configure(lhs_reshaped.info(), rhs_reshaped.info(), bias.info(), dst.info(), alpha, beta, lhs_info, rhs_info, kernel_info);

1040

1041

ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());

1042

ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());

1043

ARM_COMPUTE_ASSERT(bias.info()->is_resizable());

1044

for(const auto &tensor : post_op_tensors_holder)

1045

{

1046

ARM_COMPUTE_ASSERT(tensor.info()->is_resizable());

1047

}

1048

1049

// We do not pad when using image as it needs to comply to strict pitch alignment restrictions

1050

if(!rhs_info.export_to_cl_image)

1051

{

1052

add_padding_x({ &lhs, &rhs, &lhs_reshaped, &rhs_reshaped, &bias, &dst });

1053

for(auto &tensor : post_op_tensors_holder)

1054

{

1055

add_padding_x({ &tensor });

}

}

// Allocate tensors

lhs.allocator()->allocate();

1061

rhs.allocator()->allocate();

1062

lhs_reshaped.allocator()->allocate();

1063

rhs_reshaped.allocator()->allocate();

1064

bias.allocator()->allocate();

1065

dst.allocator()->allocate();

1066

for(auto &tensor : post_op_tensors_holder)

1067

{

1068

tensor.allocator()->allocate();

1069

}

1070

1071

ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());

1072

ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());

1073

ARM_COMPUTE_ASSERT(!bias.info()->is_resizable());

1074

ARM_COMPUTE_ASSERT(!lhs_reshaped.info()->is_resizable());

1075

ARM_COMPUTE_ASSERT(!rhs_reshaped.info()->is_resizable());

1076

ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());

1077

for(const auto &tensor : post_op_tensors_holder)

1078

{

1079

ARM_COMPUTE_ASSERT(!tensor.info()->is_resizable());

}

// Fill tensors

fill(AccessorType(lhs), 0);

1084

fill(AccessorType(rhs), 1);

1085

fill(AccessorType(bias), 2);

1086

for(size_t i = 0; i < post_op_tensors_holder.size(); ++i)

1087

{

1088

fill(AccessorType(post_op_tensors_holder.at(i)), 3 + i);

}

// Compute GEMM

ITensorPack reshape_lhs_pack = { { ACL_SRC, &lhs }, { ACL_DST, &lhs_reshaped } };

1093

reshape_lhs.run(reshape_lhs_pack);

1094

ITensorPack reshape_rhs_pack = { { ACL_SRC, &rhs }, { ACL_DST, &rhs_reshaped } };

1095

reshape_rhs.run(reshape_rhs_pack);

1096

ITensorPack gemm_pack({ { ACL_SRC_0, &lhs_reshaped },

1097

{ ACL_SRC_1, &rhs_reshaped },

1098

{ ACL_SRC_2, &bias },

1099

{ ACL_DST, &dst }

1100

});

1101

for(size_t i = 0; i < post_op_tensors_holder.size(); ++i)

1102

{

1103

gemm_pack.add_tensor(experimental::get_post_op_arg_type(i), &post_op_tensors_holder.at(i));

}

gemm.run(gemm_pack);

return dst;

}

SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, bool broadcast_bias,

1111

const ActivationLayerInfo &act_info, const experimental::PostOpList<TensorShape> &post_ops)

1112

{

1113

TensorShape dst_shape = lhs_shape;

1114

dst_shape[0] = rhs_shape[0];

1115

dst_shape[1] = lhs_shape[1];

1116

1117

// Create reference

1118

SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };

1119

SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };

1120

SimpleTensor<T> bias{ dst_shape, data_type, 1 };

1121

// Create post op tensors and populate post op with them

1122

auto populated_post_ops = experimental::transform_post_op_list_arguments<TensorShape, SimpleTensor<T>>(post_ops, [&data_type](auto shape)

1123

{

1124

return SimpleTensor<T> { shape, data_type, 1 };

1125

});

1126

1127

const int n = rhs_shape[0];

1128

const int m = lhs_shape[1];

1129

const int batch_size = lhs_shape[2];

// Fill reference

int tensor_idx = 0;

fill(lhs, tensor_idx++);

1134

fill(rhs, tensor_idx++);

1135

fill(bias, tensor_idx++);

1136

for(auto &op : populated_post_ops.get_list())

1137

{

1138

for(auto tensor : op->arguments())

1139

{

1140

fill(*tensor, tensor_idx++);

}

}

if(broadcast_bias)

{

// In case of broadcast, we need simply copy the first into the following "M" ones

1147

for(int i = 1; i < m * batch_size; i++)

1148

{

1149

memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));

}

}

SimpleTensor<T> out;

if(fp_mixed_precision)

1155

{

1156

out = reference::gemm_mixed_precision<T>(lhs, rhs, bias, alpha, beta);

}

else

{

out = reference::gemm<T>(lhs, rhs, bias, alpha, beta);

1161

}

1162

// Ignore activation info if post ops are used instead

1163

if(populated_post_ops.size() > 0)

1164

{

1165

out = reference::post_ops<T>(out, populated_post_ops);

}

else

{

out = reference::activation_layer(out, act_info);

}

return out;

}

bool validate_result = true;

1175

TensorType _target{};

1176

SimpleTensor<T> _reference{};

1177

};

1178

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1179

template <typename TensorType, typename AccessorType, typename T, typename ReshapeLHSOperatorType, typename ReshapeRHSOperatorType, typename GEMMOperatorType, bool fp_mixed_precision = false>

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

1180

class GEMMMatrixMultiplyReshaped3DValidationFixture : public framework::Fixture

1181

{

1182

public:

1183

template <typename...>

1184

void setup(unsigned int m_w, unsigned int m_h, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0, unsigned int v0, unsigned int h0,

Gian Marco Iodice

2020-06-10 17:59:30 +0100

[diff] [blame]

1185

bool interleave_lhs, bool interleave_rhs, bool export_to_cl_image, DataType data_type, float alpha, float beta, bool lhs_transpose, const ActivationLayerInfo &act_info)

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

1186

{

1187

GEMMLHSMatrixInfo lhs_info;

lhs_info.m0 = m0;

lhs_info.k0 = k0;

lhs_info.v0 = v0;

lhs_info.interleave = interleave_lhs;

Giorgio Arena

ae99b6e

2019-08-01 14:22:12 +0100

[diff] [blame]

1192

lhs_info.transpose = lhs_transpose;

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

1193

1194

GEMMRHSMatrixInfo rhs_info;

Gian Marco Iodice

2020-06-10 17:59:30 +0100

[diff] [blame]

rhs_info.n0 = n0;

rhs_info.k0 = k0;

rhs_info.h0 = h0;

rhs_info.interleave = interleave_rhs;

1199

rhs_info.transpose = !lhs_transpose;

1200

rhs_info.export_to_cl_image = export_to_cl_image;

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

1201

1202

// In case of GEMM3D, m is the product between m_w and m_h

1203

const unsigned int m = m_w * m_h;

1204

1205

// Set the tensor shapes for LHS and RHS matrices

1206

const TensorShape lhs_shape(k, m, batch_size);

1207

const TensorShape rhs_shape(n, k, batch_size);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1208

const TensorShape bias_shape(n, 1, 1);

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

1209

Sheri Zhang

2020-11-16 21:17:28 +0000

[diff] [blame]

1210

_target = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, m_h, act_info);

1211

if(validate_result)

1212

{

1213

_reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, m_h, act_info);

1214

}

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

}

protected:

template <typename U>

1219

void fill(U &&tensor, int i)

1220

{

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

1221

static_assert(std::is_floating_point<T>::value || std::is_same<T, half>::value, "Only floating point data types supported.");

Giorgio Arena

2021-01-08 10:37:15 +0000

[diff] [blame]

1222

using DistributionType = typename std::conditional<std::is_same<T, half>::value, arm_compute::utils::uniform_real_distribution_16bit<T>, std::uniform_real_distribution<T>>::type;

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

1223

1224

DistributionType distribution{ T(-1.0f), T(1.0f) };

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

1225

library->fill(tensor, distribution, i);

1226

}

1227

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1228

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1229

DataType data_type, float alpha, float beta, unsigned int m_h, const ActivationLayerInfo &act_info)

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

1230

{

1231

// Create tensors

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1232

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

1233

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

1234

TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

1235

TensorType lhs_reshaped;

1236

TensorType rhs_reshaped;

1237

TensorType dst;

1238

1239

const unsigned int M = lhs_shape[1];

1240

const unsigned int N = rhs_shape[0];

1241

const unsigned int K = lhs_shape[0];

Gian Marco Iodice

2019-06-26 17:18:11 +0100

[diff] [blame]

1242

GEMMKernelInfo kernel_info;

kernel_info.m = M;

kernel_info.n = N;

kernel_info.k = K;

kernel_info.depth_output_gemm3d = m_h;

1247

kernel_info.reinterpret_input_as_3d = false;

1248

kernel_info.broadcast_bias = true;

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1249

kernel_info.activation_info = act_info;

Gian Marco Iodice

0c17aa2

2019-09-27 09:23:15 +0100

[diff] [blame]

1250

kernel_info.fp_mixed_precision = fp_mixed_precision;

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

1251

1252

// The output tensor will be auto-initialized within the function

1253

1254

// Create and configure function

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1255

ReshapeLHSOperatorType reshape_lhs;

1256

ReshapeRHSOperatorType reshape_rhs;

1257

GEMMOperatorType gemm;

Sheri Zhang

2020-11-16 21:17:28 +0000

[diff] [blame]

1258

1259

validate_result = bool(reshape_rhs.validate(rhs.info(), rhs_reshaped.info(), rhs_info));

1260

validate_result = validate_result || !rhs_info.export_to_cl_image;

if(!validate_result)

{

return nullptr;

}

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1266

reshape_lhs.configure(lhs.info(), lhs_reshaped.info(), lhs_info);

1267

reshape_rhs.configure(rhs.info(), rhs_reshaped.info(), rhs_info);

1268

gemm.configure(lhs_reshaped.info(), rhs_reshaped.info(), bias.info(), dst.info(), alpha, beta, lhs_info, rhs_info, kernel_info);

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

1269

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

1270

ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());

1271

ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());

1272

ARM_COMPUTE_ASSERT(bias.info()->is_resizable());

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

1273

Georgios Pinitas

2021-04-13 13:35:58 +0100

[diff] [blame]

1274

// We do not pad when using image as it needs to comply to strict pitch alignment restrictions

Giorgio Arena

2021-03-25 14:54:50 +0000

[diff] [blame]

1275

if(!rhs_info.export_to_cl_image)

1276

{

1277

add_padding_x({ &lhs, &rhs, &lhs_reshaped, &rhs_reshaped, &bias, &dst });

1278

}

1279

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

1280

// Allocate tensors

1281

lhs.allocator()->allocate();

1282

rhs.allocator()->allocate();

1283

lhs_reshaped.allocator()->allocate();

1284

rhs_reshaped.allocator()->allocate();

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1285

bias.allocator()->allocate();

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

1286

dst.allocator()->allocate();

1287

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

1288

ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());

1289

ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());

1290

ARM_COMPUTE_ASSERT(!lhs_reshaped.info()->is_resizable());

1291

ARM_COMPUTE_ASSERT(!rhs_reshaped.info()->is_resizable());

1292

ARM_COMPUTE_ASSERT(!bias.info()->is_resizable());

1293

ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

1294

1295

// Fill tensors

1296

fill(AccessorType(lhs), 0);

1297

fill(AccessorType(rhs), 1);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1298

fill(AccessorType(bias), 2);

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

1299

1300

// Compute GEMM

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1301

ITensorPack reshape_lhs_pack = { { ACL_SRC, &lhs }, { ACL_DST, &lhs_reshaped } };

1302

reshape_lhs.run(reshape_lhs_pack);

1303

ITensorPack reshape_rhs_pack = { { ACL_SRC, &rhs }, { ACL_DST, &rhs_reshaped } };

1304

reshape_rhs.run(reshape_rhs_pack);

1305

ITensorPack gemm_pack({ { ACL_SRC_0, &lhs_reshaped },

1306

{ ACL_SRC_1, &rhs_reshaped },

1307

{ ACL_SRC_2, &bias },

1308

{ ACL_DST, &dst }

1309

});

1310

gemm.run(gemm_pack);

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

return dst;

}

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

1315

SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, unsigned int m_h,

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1316

const ActivationLayerInfo &act_info)

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

1317

{

1318

TensorShape dst_shape = lhs_shape;

1319

dst_shape.set(0, rhs_shape[0]);

1320

dst_shape.set(1, lhs_shape[1] / m_h);

1321

dst_shape.set(2, m_h);

1322

dst_shape.set(3, lhs_shape[2]);

1323

1324

// Create reference

1325

SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };

1326

SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1327

SimpleTensor<T> bias{ dst_shape, data_type, 1 };

1328

1329

const int n = rhs_shape[0];

1330

const int m = lhs_shape[1];

1331

const int batch_size = lhs_shape[2];

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

// Fill reference

fill(lhs, 0);

fill(rhs, 1);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1336

fill(bias, 2);

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

1337

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1338

// In case of broadcast, we need simply copy the first into the following "M" ones

1339

for(int i = 1; i < m * batch_size; i++)

1340

{

1341

memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));

1342

}

1343

Gian Marco Iodice

0c17aa2

2019-09-27 09:23:15 +0100

[diff] [blame]

1344

if(fp_mixed_precision)

1345

{

1346

return reference::activation_layer(reference::gemm_mixed_precision<T>(lhs, rhs, bias, alpha, beta), act_info);

}

else

{

return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);

1351

}

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

1352

}

1353

Sheri Zhang

2020-11-16 21:17:28 +0000

[diff] [blame]

1354

bool validate_result = true;

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

1355

TensorType _target{};

1356

SimpleTensor<T> _reference{};

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

1357

};

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1358

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1359

template <typename TensorType, typename AccessorType, typename T, typename ReshapeRHSOperatorType, typename GEMMOperatorType>

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1360

class GEMMMatrixMultiplyReshapedOnlyRHSValidationFixture : public framework::Fixture

1361

{

1362

public:

1363

template <typename...>

1364

void setup(unsigned int m, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0, unsigned int h0,

Gian Marco Iodice

781cba7

2020-06-19 16:56:57 +0100

[diff] [blame]

1365

bool interleave_rhs, bool transpose_rhs, bool export_to_cl_image, DataType data_type, float alpha, float beta, bool broadcast_bias, const ActivationLayerInfo &act_info)

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1366

{

1367

GEMMLHSMatrixInfo lhs_info;

lhs_info.m0 = m0;

lhs_info.k0 = k0;

GEMMRHSMatrixInfo rhs_info;

Gian Marco Iodice

781cba7

2020-06-19 16:56:57 +0100

[diff] [blame]

rhs_info.n0 = n0;

rhs_info.k0 = k0;

rhs_info.h0 = h0;

rhs_info.interleave = interleave_rhs;

1376

rhs_info.transpose = transpose_rhs;

1377

rhs_info.export_to_cl_image = export_to_cl_image;

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1378

1379

// Set the tensor shapes for LHS and RHS matrices

1380

const TensorShape lhs_shape(k, m, batch_size);

1381

const TensorShape rhs_shape(n, k, batch_size);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1382

const TensorShape bias_shape(n,

1383

broadcast_bias ? 1 : m,

1384

broadcast_bias ? 1 : batch_size);

Georgios Pinitas

2019-05-21 13:32:43 +0100

[diff] [blame]

1385

Sheri Zhang

2020-11-16 21:17:28 +0000

[diff] [blame]

1386

_target = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, broadcast_bias, act_info);

1387

if(validate_result)

1388

{

1389

_reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, broadcast_bias, act_info);

1390

}

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

}

protected:

template <typename U>

1395

void fill(U &&tensor, int i)

1396

{

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

1397

static_assert(std::is_floating_point<T>::value || std::is_same<T, half>::value, "Only floating point data types supported.");

Giorgio Arena

2021-01-08 10:37:15 +0000

[diff] [blame]

1398

using DistributionType = typename std::conditional<std::is_same<T, half>::value, arm_compute::utils::uniform_real_distribution_16bit<T>, std::uniform_real_distribution<T>>::type;

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

1399

1400

DistributionType distribution{ T(-1.0f), T(1.0f) };

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1401

library->fill(tensor, distribution, i);

1402

1403

// Fill border with infinity in order to check the presence of NaN values (i.e. inf * 0)

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

1404

DistributionType distribution_inf{ T(std::numeric_limits<float>::infinity()), T(std::numeric_limits<float>::infinity()) };

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1405

library->fill_borders_with_garbage(tensor, distribution_inf, i);

1406

}

1407

Georgios Pinitas

2019-05-21 13:32:43 +0100

[diff] [blame]

1408

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1409

DataType data_type, float alpha, float beta, bool broadcast_bias, const ActivationLayerInfo &act_info)

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1410

{

1411

// Create tensors

Georgios Pinitas

2019-05-21 13:32:43 +0100

[diff] [blame]

1412

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

1413

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

1414

TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1415

TensorType rhs_reshaped;

1416

TensorType dst;

1417

1418

const unsigned int M = lhs_shape[1];

1419

const unsigned int N = rhs_shape[0];

1420

const unsigned int K = lhs_shape[0];

Gian Marco Iodice

2019-06-26 17:18:11 +0100

[diff] [blame]

1421

GEMMKernelInfo kernel_info;

kernel_info.m = M;

kernel_info.n = N;

kernel_info.k = K;

kernel_info.depth_output_gemm3d = 0;

1426

kernel_info.reinterpret_input_as_3d = false;

1427

kernel_info.broadcast_bias = broadcast_bias;

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1428

kernel_info.activation_info = act_info;

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1429

1430

// The output tensor will be auto-initialized within the function

1431

1432

// Create and configure function

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1433

ReshapeRHSOperatorType reshape_rhs;

1434

GEMMOperatorType gemm;

Sheri Zhang

2020-11-16 21:17:28 +0000

[diff] [blame]

1435

1436

validate_result = bool(reshape_rhs.validate(rhs.info(), rhs_reshaped.info(), rhs_info));

1437

validate_result = validate_result || !rhs_info.export_to_cl_image;

if(!validate_result)

{

return nullptr;

}

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1443

reshape_rhs.configure(rhs.info(), rhs_reshaped.info(), rhs_info);

1444

gemm.configure(lhs.info(), rhs_reshaped.info(), bias.info(), dst.info(), alpha, beta, lhs_info, rhs_info, kernel_info);

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1445

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

1446

ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());

1447

ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());

1448

ARM_COMPUTE_ASSERT(bias.info()->is_resizable());

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1449

Georgios Pinitas

2021-04-13 13:35:58 +0100

[diff] [blame]

1450

// We do not pad when using image as it needs to comply to strict pitch alignment restrictions

Giorgio Arena

2021-03-25 14:54:50 +0000

[diff] [blame]

1451

if(!rhs_info.export_to_cl_image)

1452

{

1453

add_padding_x({ &lhs, &rhs, &rhs_reshaped, &bias, &dst });

1454

}

1455

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1456

// Allocate tensors

1457

lhs.allocator()->allocate();

1458

rhs.allocator()->allocate();

1459

rhs_reshaped.allocator()->allocate();

Georgios Pinitas

2019-05-21 13:32:43 +0100

[diff] [blame]

1460

bias.allocator()->allocate();

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1461

dst.allocator()->allocate();

1462

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

1463

ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());

1464

ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());

1465

ARM_COMPUTE_ASSERT(!rhs_reshaped.info()->is_resizable());

1466

ARM_COMPUTE_ASSERT(!bias.info()->is_resizable());

1467

ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1468

1469

// Fill tensors

1470

fill(AccessorType(lhs), 0);

1471

fill(AccessorType(rhs), 1);

Georgios Pinitas

2019-05-21 13:32:43 +0100

[diff] [blame]

1472

fill(AccessorType(bias), 2);

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1473

1474

// Compute GEMM

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1475

ITensorPack reshape_rhs_pack = { { ACL_SRC, &rhs }, { ACL_DST, &rhs_reshaped } };

1476

reshape_rhs.run(reshape_rhs_pack);

1477

ITensorPack gemm_pack({ { ACL_SRC_0, &lhs },

1478

{ ACL_SRC_1, &rhs_reshaped },

1479

{ ACL_SRC_2, &bias },

1480

{ ACL_DST, &dst }

1481

});

1482

gemm.run(gemm_pack);

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

return dst;

}

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

1487

SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, bool broadcast_bias,

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1488

const ActivationLayerInfo &act_info)

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1489

{

1490

TensorShape dst_shape = lhs_shape;

1491

dst_shape[0] = rhs_shape[0];

1492

dst_shape[1] = lhs_shape[1];

1493

1494

// Create reference

1495

SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };

1496

SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };

Georgios Pinitas

2019-05-21 13:32:43 +0100

[diff] [blame]

1497

SimpleTensor<T> bias{ dst_shape, data_type, 1 };

1498

1499

const int n = rhs_shape[0];

1500

const int m = lhs_shape[1];

1501

const int batch_size = lhs_shape[2];

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

// Fill reference

fill(lhs, 0);

fill(rhs, 1);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1506

fill(bias, 2);

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1507

Georgios Pinitas

2019-05-21 13:32:43 +0100

[diff] [blame]

1508

if(broadcast_bias)

1509

{

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1510

// In case of broadcast, we need simply copy the first into the following "M" ones

1511

for(int i = 1; i < m * batch_size; i++)

Georgios Pinitas

2019-05-21 13:32:43 +0100

[diff] [blame]

1512

{

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1513

memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));

Georgios Pinitas

2019-05-21 13:32:43 +0100

[diff] [blame]

1514

}

1515

}

Georgios Pinitas

2019-05-21 13:32:43 +0100

[diff] [blame]

1516

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1517

return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1518

}

1519

Sheri Zhang

2020-11-16 21:17:28 +0000

[diff] [blame]

1520

bool validate_result = true;

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1521

TensorType _target{};

1522

SimpleTensor<T> _reference{};

1523

};

1524

SiCongLi

afa1972

2021-10-24 19:12:33 +0100

[diff] [blame]

1525

/** (EXPERIMENTAL_POST_OPS)*/

1526

template <typename TensorType, typename AccessorType, typename T, typename ReshapeRHSOperatorType, typename GEMMOperatorType>

1527

class GEMMMatrixMultiplyReshapedOnlyRHSWithPostOpsValidationFixture : public framework::Fixture

1528

{

1529

public:

1530

using PostOpArgBroadcast = std::tuple<bool, bool, bool>; // Instruct fixture if we need broadcasting in dimension 0, 1, 2 of each PostOp argument

1531

template <typename...>

1532

void setup(unsigned int m, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0, unsigned int h0,

1533

bool interleave_rhs, bool transpose_rhs, bool export_to_cl_image, DataType data_type, float alpha, float beta, bool broadcast_bias, const ActivationLayerInfo &act_info,

1534

const experimental::PostOpList<PostOpArgBroadcast> &post_ops)

1535

{

1536

GEMMLHSMatrixInfo lhs_info;

lhs_info.m0 = m0;

lhs_info.k0 = k0;

GEMMRHSMatrixInfo rhs_info;

rhs_info.n0 = n0;

rhs_info.k0 = k0;

rhs_info.h0 = h0;

rhs_info.interleave = interleave_rhs;

1545

rhs_info.transpose = transpose_rhs;

1546

rhs_info.export_to_cl_image = export_to_cl_image;

1547

1548

// Set the tensor shapes for LHS and RHS matrices

1549

const TensorShape lhs_shape(k, m, batch_size);

1550

const TensorShape rhs_shape(n, k, batch_size);

1551

const TensorShape bias_shape(n,

1552

broadcast_bias ? 1 : m,

1553

broadcast_bias ? 1 : batch_size);

Gian Marco Iodice

10e88a7

2021-11-29 12:49:19 +0000

[diff] [blame^]

1554

SiCongLi

afa1972

2021-10-24 19:12:33 +0100

[diff] [blame]

1555

auto post_ops_with_shapes = experimental::transform_post_op_list_arguments<PostOpArgBroadcast, TensorShape>(post_ops,

1556

[ = ](auto broadcast)

{

return TensorShape

{

std::get<0>(broadcast) ? 1 : n,

1561

std::get<1>(broadcast) ? 1 : m,

1562

std::get<2>(broadcast) ? 1 : batch_size,

};

});

_target = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, broadcast_bias, act_info, post_ops_with_shapes);

1567

if(validate_result)

1568

{

1569

_reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, broadcast_bias, act_info, post_ops_with_shapes);

}

}

protected:

template <typename U>

1575

void fill(U &&tensor, int i)

1576

{

1577

static_assert(std::is_floating_point<T>::value || std::is_same<T, half>::value, "Only floating point data types supported.");

1578

using DistributionType = typename std::conditional<std::is_same<T, half>::value, arm_compute::utils::uniform_real_distribution_16bit<T>, std::uniform_real_distribution<T>>::type;

1579

1580

DistributionType distribution{ T(-1.0f), T(1.0f) };

1581

library->fill(tensor, distribution, i);

1582

1583

// Fill border with infinity in order to check the presence of NaN values (i.e. inf * 0)

1584

DistributionType distribution_inf{ T(std::numeric_limits<float>::infinity()), T(std::numeric_limits<float>::infinity()) };

1585

library->fill_borders_with_garbage(tensor, distribution_inf, i);

1586

}

1587

1588

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,

1589

DataType data_type, float alpha, float beta, bool broadcast_bias, const ActivationLayerInfo &act_info, const experimental::PostOpList<TensorShape> &post_ops)

1590

{

1591

// Create tensors

1592

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

1593

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

1594

TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);

1595

TensorType rhs_reshaped;

1596

TensorType dst;

1597

// Create post op tensors and populate post op with them

1598

std::vector<TensorType> post_op_tensors_holder{};

1599

auto populated_post_ops = experimental::transform_post_op_list_arguments<TensorShape, ITensorInfo *>(post_ops,

1600

[&post_op_tensors_holder, &data_type](auto shape)

1601

{

1602

auto t = create_tensor<TensorType>(shape, data_type, 1);

1603

post_op_tensors_holder.push_back(std::move(t));

1604

return post_op_tensors_holder.back().info();

1605

});

1606

1607

const unsigned int M = lhs_shape[1];

1608

const unsigned int N = rhs_shape[0];

1609

const unsigned int K = lhs_shape[0];

1610

GEMMKernelInfo kernel_info;

kernel_info.m = M;

kernel_info.n = N;

kernel_info.k = K;

kernel_info.depth_output_gemm3d = 0;

1615

kernel_info.reinterpret_input_as_3d = false;

1616

kernel_info.broadcast_bias = broadcast_bias;

1617

kernel_info.activation_info = act_info;

1618

kernel_info.post_ops = populated_post_ops;

1619

1620

// The output tensor will be auto-initialized within the function

1621

1622

// Create and configure function

1623

ReshapeRHSOperatorType reshape_rhs;

1624

GEMMOperatorType gemm;

1625

1626

validate_result = bool(reshape_rhs.validate(rhs.info(), rhs_reshaped.info(), rhs_info));

1627

validate_result = validate_result || !rhs_info.export_to_cl_image;

if(!validate_result)

{

return nullptr;

}

reshape_rhs.configure(rhs.info(), rhs_reshaped.info(), rhs_info);

1634

gemm.configure(lhs.info(), rhs_reshaped.info(), bias.info(), dst.info(), alpha, beta, lhs_info, rhs_info, kernel_info);

1635

1636

ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());

1637

ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());

1638

ARM_COMPUTE_ASSERT(bias.info()->is_resizable());

1639

for(const auto &tensor : post_op_tensors_holder)

1640

{

1641

ARM_COMPUTE_ASSERT(tensor.info()->is_resizable());

1642

}

1643

1644

// We do not pad when using image as it needs to comply to strict pitch alignment restrictions

1645

if(!rhs_info.export_to_cl_image)

1646

{

1647

add_padding_x({ &lhs, &rhs, &rhs_reshaped, &bias, &dst });

1648

for(auto &tensor : post_op_tensors_holder)

1649

{

1650

add_padding_x({ &tensor });

}

}

// Allocate tensors

lhs.allocator()->allocate();

1656

rhs.allocator()->allocate();

1657

rhs_reshaped.allocator()->allocate();

1658

bias.allocator()->allocate();

1659

dst.allocator()->allocate();

1660

for(auto &tensor : post_op_tensors_holder)

1661

{

1662

tensor.allocator()->allocate();

1663

}

1664

1665

ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());

1666

ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());

1667

ARM_COMPUTE_ASSERT(!rhs_reshaped.info()->is_resizable());

1668

ARM_COMPUTE_ASSERT(!bias.info()->is_resizable());

1669

ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());

1670

for(const auto &tensor : post_op_tensors_holder)

1671

{

1672

ARM_COMPUTE_ASSERT(!tensor.info()->is_resizable());

}

// Fill tensors

fill(AccessorType(lhs), 0);

1677

fill(AccessorType(rhs), 1);

1678

fill(AccessorType(bias), 2);

1679

for(size_t i = 0; i < post_op_tensors_holder.size(); ++i)

1680

{

1681

fill(AccessorType(post_op_tensors_holder.at(i)), 3 + i);

}

// Compute GEMM

ITensorPack reshape_rhs_pack = { { ACL_SRC, &rhs }, { ACL_DST, &rhs_reshaped } };

1686

reshape_rhs.run(reshape_rhs_pack);

1687

ITensorPack gemm_pack({ { ACL_SRC_0, &lhs },

1688

{ ACL_SRC_1, &rhs_reshaped },

1689

{ ACL_SRC_2, &bias },

1690

{ ACL_DST, &dst }

1691

});

1692

for(size_t i = 0; i < post_op_tensors_holder.size(); ++i)

1693

{

1694

gemm_pack.add_tensor(experimental::get_post_op_arg_type(i), &post_op_tensors_holder.at(i));

}

gemm.run(gemm_pack);

return dst;

}

SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, bool broadcast_bias,

1702

const ActivationLayerInfo &act_info, const experimental::PostOpList<TensorShape> &post_ops)

1703

{

1704

TensorShape dst_shape = lhs_shape;

1705

dst_shape[0] = rhs_shape[0];

1706

dst_shape[1] = lhs_shape[1];

1707

1708

// Create reference

1709

SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };

1710

SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };

1711

SimpleTensor<T> bias{ dst_shape, data_type, 1 };

1712

// Create post op tensors and populate post op with them

1713

auto populated_post_ops = experimental::transform_post_op_list_arguments<TensorShape, SimpleTensor<T>>(post_ops, [&data_type](auto shape)

1714

{

1715

return SimpleTensor<T> { shape, data_type, 1 };

1716

});

1717

1718

const int n = rhs_shape[0];

1719

const int m = lhs_shape[1];

1720

const int batch_size = lhs_shape[2];

// Fill reference

int tensor_idx = 0;

fill(lhs, tensor_idx++);

1725

fill(rhs, tensor_idx++);

1726

fill(bias, tensor_idx++);

1727

for(auto &op : populated_post_ops.get_list())

1728

{

1729

for(auto tensor : op->arguments())

1730

{

1731

fill(*tensor, tensor_idx++);

}

}

if(broadcast_bias)

{

// In case of broadcast, we need simply copy the first into the following "M" ones

1738

for(int i = 1; i < m * batch_size; i++)

1739

{

1740

memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));

}

}

SimpleTensor<T> out;

out = reference::gemm<T>(lhs, rhs, bias, alpha, beta);

1746

// Ignore activation info if post ops are used instead

1747

if(populated_post_ops.size() > 0)

1748

{

1749

out = reference::post_ops<T>(out, populated_post_ops);

}

else

{

out = reference::activation_layer(out, act_info);

}

return out;

}

bool validate_result = true;

1759

TensorType _target{};

1760

SimpleTensor<T> _reference{};

1761

};

1762

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1763

template <typename TensorType, typename AccessorType, typename T, typename ReshapeRHSOperatorType, typename GEMMOperatorType>

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1764

class GEMMMatrixMultiplyReshapedOnlyRHS3DValidationFixture : public framework::Fixture

1765

{

1766

public:

1767

template <typename...>

1768

void setup(unsigned int m_w, unsigned int m_h, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0, unsigned int h0,

Gian Marco Iodice

2020-10-22 16:37:12 +0100

[diff] [blame]

1769

bool interleave_rhs, bool transpose_rhs, bool export_to_cl_image, bool has_pad_y, DataType data_type, float alpha, float beta, const ActivationLayerInfo &act_info)

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1770

{

1771

GEMMLHSMatrixInfo lhs_info;

lhs_info.m0 = m0;

lhs_info.k0 = k0;

GEMMRHSMatrixInfo rhs_info;

Gian Marco Iodice

781cba7

2020-06-19 16:56:57 +0100

[diff] [blame]

rhs_info.n0 = n0;

rhs_info.k0 = k0;

rhs_info.h0 = h0;

rhs_info.interleave = interleave_rhs;

1780

rhs_info.transpose = transpose_rhs;

1781

rhs_info.export_to_cl_image = export_to_cl_image;

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1782

1783

// In case of GEMM3D, m is the product between m_w and m_h

1784

const unsigned int m = m_w * m_h;

1785

1786

// Set the tensor shapes for LHS and RHS matrices

1787

const TensorShape lhs_shape(k, m, batch_size);

1788

const TensorShape rhs_shape(n, k, batch_size);

1789

const TensorShape bias_shape(n, 1, 1);

1790

Sheri Zhang

2020-11-16 21:17:28 +0000

[diff] [blame]

1791

_target = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, m_h, act_info, has_pad_y);

1792

if(validate_result)

1793

{

1794

_reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, m_h, act_info);

1795

}

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

}

protected:

template <typename U>

1800

void fill(U &&tensor, int i)

1801

{

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

1802

static_assert(std::is_floating_point<T>::value || std::is_same<T, half>::value, "Only floating point data types supported.");

Giorgio Arena

2021-01-08 10:37:15 +0000

[diff] [blame]

1803

using DistributionType = typename std::conditional<std::is_same<T, half>::value, arm_compute::utils::uniform_real_distribution_16bit<T>, std::uniform_real_distribution<T>>::type;

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

1804

1805

DistributionType distribution{ T(-1.0f), T(1.0f) };

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1806

library->fill(tensor, distribution, i);

1807

}

1808

1809

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,

1810

DataType data_type, float alpha, float beta,

Gian Marco Iodice

2020-10-22 16:37:12 +0100

[diff] [blame]

1811

unsigned int m_h, const ActivationLayerInfo &act_info, bool has_pad_y)

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1812

{

1813

// Create tensors

1814

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

1815

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

1816

TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);

1817

TensorType rhs_reshaped;

1818

TensorType dst;

1819

1820

const unsigned int M = lhs_shape[1];

1821

const unsigned int N = rhs_shape[0];

1822

const unsigned int K = lhs_shape[0];

Gian Marco Iodice

2019-06-26 17:18:11 +0100

[diff] [blame]

1823

GEMMKernelInfo kernel_info;

kernel_info.m = M;

kernel_info.n = N;

kernel_info.k = K;

kernel_info.depth_output_gemm3d = m_h;

1828

kernel_info.reinterpret_input_as_3d = false;

1829

kernel_info.broadcast_bias = true;

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1830

kernel_info.activation_info = act_info;

Gian Marco Iodice

2020-10-22 16:37:12 +0100

[diff] [blame]

1831

kernel_info.has_pad_y = has_pad_y;

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1832

1833

// The output tensor will be auto-initialized within the function

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1834

// Create and configure function

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1835

ReshapeRHSOperatorType reshape_rhs;

1836

GEMMOperatorType gemm;

Sheri Zhang

2020-11-16 21:17:28 +0000

[diff] [blame]

1837

1838

validate_result = bool(reshape_rhs.validate(rhs.info(), rhs_reshaped.info(), rhs_info));

1839

validate_result = validate_result || !rhs_info.export_to_cl_image;

if(!validate_result)

{

return nullptr;

}

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1845

reshape_rhs.configure(rhs.info(), rhs_reshaped.info(), rhs_info);

1846

gemm.configure(lhs.info(), rhs_reshaped.info(), bias.info(), dst.info(), alpha, beta, lhs_info, rhs_info, kernel_info);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1847

Gian Marco Iodice

2020-10-22 16:37:12 +0100

[diff] [blame]

1848

if(has_pad_y)

1849

{

1850

// Add dummy padding into lhs to validate has_pad_y path

1851

lhs.info()->extend_padding(PaddingSize(2, 0, 2, 0));

1852

dst.info()->extend_padding(PaddingSize(2, 0, 1, 0));

1853

}

1854

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

1855

ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());

1856

ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());

1857

ARM_COMPUTE_ASSERT(bias.info()->is_resizable());

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1858

Georgios Pinitas

2021-04-13 13:35:58 +0100

[diff] [blame]

1859

// We do not pad when using image as it needs to comply to strict pitch alignment restrictions

Giorgio Arena

2021-03-25 14:54:50 +0000

[diff] [blame]

1860

if(!rhs_info.export_to_cl_image)

1861

{

1862

add_padding_x({ &lhs, &rhs, &rhs_reshaped, &bias, &dst });

1863

}

1864

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1865

// Allocate tensors

1866

lhs.allocator()->allocate();

1867

rhs.allocator()->allocate();

1868

rhs_reshaped.allocator()->allocate();

1869

bias.allocator()->allocate();

1870

dst.allocator()->allocate();

1871

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

1872

ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());

1873

ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());

1874

ARM_COMPUTE_ASSERT(!rhs_reshaped.info()->is_resizable());

1875

ARM_COMPUTE_ASSERT(!bias.info()->is_resizable());

1876

ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1877

1878

// Fill tensors

1879

fill(AccessorType(lhs), 0);

1880

fill(AccessorType(rhs), 1);

1881

fill(AccessorType(bias), 2);

1882

1883

// Compute GEMM

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1884

ITensorPack reshape_rhs_pack = { { ACL_SRC, &rhs }, { ACL_DST, &rhs_reshaped } };

1885

reshape_rhs.run(reshape_rhs_pack);

1886

ITensorPack gemm_pack({ { ACL_SRC_0, &lhs },

1887

{ ACL_SRC_1, &rhs_reshaped },

1888

{ ACL_SRC_2, &bias },

1889

{ ACL_DST, &dst }

1890

});

1891

gemm.run(gemm_pack);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

return dst;

}

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

1896

SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, unsigned int m_h,

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1897

const ActivationLayerInfo &act_info)

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1898

{

1899

TensorShape dst_shape = lhs_shape;

1900

dst_shape.set(0, rhs_shape[0]);

1901

dst_shape.set(1, lhs_shape[1] / m_h);

1902

dst_shape.set(2, m_h);

1903

dst_shape.set(3, lhs_shape[2]);

1904

1905

// Create reference

1906

SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };

1907

SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };

1908

SimpleTensor<T> bias{ dst_shape, data_type, 1 };

1909

1910

const int n = rhs_shape[0];

1911

const int m = lhs_shape[1];

1912

const int batch_size = lhs_shape[2];

// Fill reference

fill(lhs, 0);

fill(rhs, 1);

fill(bias, 2);

// In case of broadcast, we need simply copy the first into the following "M" ones

1920

for(int i = 1; i < m * batch_size; i++)

1921

{

1922

memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));

1923

}

1924

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1925

return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1926

}

1927

Sheri Zhang

2020-11-16 21:17:28 +0000

[diff] [blame]

1928

bool validate_result = true;

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1929

TensorType _target{};

1930

SimpleTensor<T> _reference{};

1931

};

1932

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1933

template <typename TensorType, typename AccessorType, typename T, typename GEMMOperatorType>

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1934

class GEMMMatrixMultiplyNativeValidationFixture : public framework::Fixture

1935

{

1936

public:

1937

template <typename...>

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1938

void setup(unsigned int m, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0, DataType data_type, float alpha, float beta, bool broadcast_bias,

1939

const ActivationLayerInfo &act_info)

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1940

{

1941

GEMMLHSMatrixInfo lhs_info;

lhs_info.m0 = m0;

lhs_info.k0 = k0;

GEMMRHSMatrixInfo rhs_info;

rhs_info.n0 = n0;

rhs_info.k0 = k0;

// Set the tensor shapes for LHS and RHS matrices

1950

const TensorShape lhs_shape(k, m, batch_size);

1951

const TensorShape rhs_shape(n, k, batch_size);

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

1952

const TensorShape bias_shape(n,

1953

broadcast_bias ? 1 : m,

1954

broadcast_bias ? 1 : batch_size);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1955

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1956

_target = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, broadcast_bias, act_info);

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

1957

_reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, broadcast_bias, act_info);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

}

protected:

template <typename U>

1962

void fill(U &&tensor, int i)

1963

{

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

1964

static_assert(std::is_floating_point<T>::value || std::is_same<T, half>::value, "Only floating point data types supported.");

Giorgio Arena

2021-01-08 10:37:15 +0000

[diff] [blame]

1965

using DistributionType = typename std::conditional<std::is_same<T, half>::value, arm_compute::utils::uniform_real_distribution_16bit<T>, std::uniform_real_distribution<T>>::type;

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

1966

1967

DistributionType distribution{ T(-1.0f), T(1.0f) };

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1968

library->fill(tensor, distribution, i);

1969

1970

// Fill border with infinity in order to check the presence of NaN values (i.e. inf * 0)

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

1971

DistributionType distribution_inf{ T(std::numeric_limits<float>::infinity()), T(std::numeric_limits<float>::infinity()) };

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1972

library->fill_borders_with_garbage(tensor, distribution_inf, i);

1973

}

1974

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

1975

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1976

DataType data_type, float alpha, float beta, bool broadcast_bias, const ActivationLayerInfo &act_info)

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1977

{

1978

// Create tensors

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

1979

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

1980

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

1981

TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1982

TensorType dst;

1983

1984

const unsigned int M = lhs_shape[1];

1985

const unsigned int N = rhs_shape[0];

1986

const unsigned int K = lhs_shape[0];

Gian Marco Iodice

2019-06-26 17:18:11 +0100

[diff] [blame]

1987

GEMMKernelInfo kernel_info;

kernel_info.m = M;

kernel_info.n = N;

kernel_info.k = K;

kernel_info.depth_output_gemm3d = 0;

1992

kernel_info.reinterpret_input_as_3d = false;

1993

kernel_info.broadcast_bias = broadcast_bias;

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1994

kernel_info.activation_info = act_info;

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1995

1996

// Create and configure function

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1997

GEMMOperatorType gemm;

1998

gemm.configure(lhs.info(), rhs.info(), bias.info(), dst.info(), alpha, beta, lhs_info, rhs_info, kernel_info);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1999

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

2000

ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());

2001

ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());

2002

ARM_COMPUTE_ASSERT(bias.info()->is_resizable());

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

2003

Giorgio Arena

2021-03-25 14:54:50 +0000

[diff] [blame]

2004

add_padding_x({ &lhs, &rhs, &bias, &dst });

2005

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

2006

// Allocate tensors

2007

lhs.allocator()->allocate();

2008

rhs.allocator()->allocate();

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

2009

bias.allocator()->allocate();

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

2010

dst.allocator()->allocate();

2011

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

2012

ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());

2013

ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());

2014

ARM_COMPUTE_ASSERT(!bias.info()->is_resizable());

2015

ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

2016

2017

// Fill tensors

2018

fill(AccessorType(lhs), 0);

2019

fill(AccessorType(rhs), 1);

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

2020

fill(AccessorType(bias), 2);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

2021

2022

// Compute GEMM

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

2023

ITensorPack gemm_pack({ { ACL_SRC_0, &lhs },

2024

{ ACL_SRC_1, &rhs },

2025

{ ACL_SRC_2, &bias },

2026

{ ACL_DST, &dst }

2027

});

2028

gemm.run(gemm_pack);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

return dst;

}

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

2033

SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, bool broadcast_bias,

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

2034

const ActivationLayerInfo &act_info)

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

2035

{

2036

TensorShape dst_shape = lhs_shape;

2037

dst_shape[0] = rhs_shape[0];

2038

dst_shape[1] = lhs_shape[1];

2039

2040

// Create reference

2041

SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };

2042

SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

2043

SimpleTensor<T> bias{ dst_shape, data_type, 1 };

2044

2045

const int n = rhs_shape[0];

2046

const int m = lhs_shape[1];

2047

const int batch_size = lhs_shape[2];

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

// Fill reference

fill(lhs, 0);

fill(rhs, 1);

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

2052

fill(bias, 2);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

2053

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

2054

if(broadcast_bias)

2055

{

2056

// In case of broadcast, we need simply copy the first into the following "M" ones

2057

for(int i = 1; i < m * batch_size; i++)

2058

{

2059

memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));

}

}

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

2063

return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

2064

}

2065

2066

TensorType _target{};

2067

SimpleTensor<T> _reference{};

2068

};

2069

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

2070

template <typename TensorType, typename AccessorType, typename T, typename GEMMOperatorType>

SiCongLi

afa1972

2021-10-24 19:12:33 +0100

[diff] [blame]

2071

class GEMMMatrixMultiplyNativeWithPostOpsValidationFixture : public framework::Fixture

2072

{

2073

public:

2074

using PostOpArgBroadcast = std::tuple<bool, bool, bool>; // Instruct fixture if we need broadcasting in dimension 0, 1, 2 of each PostOp argument

2075

public:

2076

template <typename...>

2077

void setup(unsigned int m, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0, DataType data_type, float alpha, float beta, bool broadcast_bias,

2078

const ActivationLayerInfo &act_info, const experimental::PostOpList<PostOpArgBroadcast> &post_ops)

2079

{

2080

GEMMLHSMatrixInfo lhs_info;

lhs_info.m0 = m0;

lhs_info.k0 = k0;

GEMMRHSMatrixInfo rhs_info;

rhs_info.n0 = n0;

rhs_info.k0 = k0;

// Set the tensor shapes for LHS and RHS matrices

2089

const TensorShape lhs_shape(k, m, batch_size);

2090

const TensorShape rhs_shape(n, k, batch_size);

2091

const TensorShape bias_shape(n,

2092

broadcast_bias ? 1 : m,

2093

broadcast_bias ? 1 : batch_size);

2094

const auto post_ops_with_shapes = experimental::transform_post_op_list_arguments<PostOpArgBroadcast, TensorShape>(post_ops,

2095

[ = ](auto broadcast)

{

return TensorShape

{

std::get<0>(broadcast) ? 1 : n,

2100

std::get<1>(broadcast) ? 1 : m,

2101

std::get<2>(broadcast) ? 1 : batch_size,

};

});

_target = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, broadcast_bias, act_info, post_ops_with_shapes);

2106

_reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, broadcast_bias, act_info, post_ops_with_shapes);

}

protected:

template <typename U>

2111

void fill(U &&tensor, int i)

2112

{

2113

static_assert(std::is_floating_point<T>::value || std::is_same<T, half>::value, "Only floating point data types supported.");

2114

using DistributionType = typename std::conditional<std::is_same<T, half>::value, arm_compute::utils::uniform_real_distribution_16bit<T>, std::uniform_real_distribution<T>>::type;

2115

2116

DistributionType distribution{ T(-1.0f), T(1.0f) };

2117

library->fill(tensor, distribution, i);

2118

2119

// Fill border with infinity in order to check the presence of NaN values (i.e. inf * 0)

2120

DistributionType distribution_inf{ T(std::numeric_limits<float>::infinity()), T(std::numeric_limits<float>::infinity()) };

2121

library->fill_borders_with_garbage(tensor, distribution_inf, i);

2122

}

2123

2124

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,

2125

DataType data_type, float alpha, float beta, bool broadcast_bias, const ActivationLayerInfo &act_info, const experimental::PostOpList<TensorShape> &post_ops)

2126

{

2127

// Create tensors

2128

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

2129

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

2130

TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);

2131

TensorType dst;

2132

// Create post op tensors and populate post op with them

2133

std::vector<TensorType> post_op_tensors_holder{};

2134

auto populated_post_ops = experimental::transform_post_op_list_arguments<TensorShape, ITensorInfo *>(post_ops,

2135

[&post_op_tensors_holder, &data_type](auto shape)

2136

{

2137

auto t = create_tensor<TensorType>(shape, data_type, 1);

2138

post_op_tensors_holder.push_back(std::move(t));

2139

return post_op_tensors_holder.back().info();

2140

});

2141

2142

const unsigned int M = lhs_shape[1];

2143

const unsigned int N = rhs_shape[0];

2144

const unsigned int K = lhs_shape[0];

2145

GEMMKernelInfo kernel_info;

kernel_info.m = M;

kernel_info.n = N;

kernel_info.k = K;

kernel_info.depth_output_gemm3d = 0;

2150

kernel_info.reinterpret_input_as_3d = false;

2151

kernel_info.broadcast_bias = broadcast_bias;

2152

kernel_info.activation_info = act_info;

2153

kernel_info.post_ops = populated_post_ops;

2154

2155

// Create and configure function

2156

GEMMOperatorType gemm;

2157

gemm.configure(lhs.info(), rhs.info(), bias.info(), dst.info(), alpha, beta, lhs_info, rhs_info, kernel_info);

2158

2159

ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());

2160

ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());

2161

ARM_COMPUTE_ASSERT(bias.info()->is_resizable());

2162

for(const auto &tensor : post_op_tensors_holder)

2163

{

2164

ARM_COMPUTE_ASSERT(tensor.info()->is_resizable());

2165

}

2166

2167

add_padding_x({ &lhs, &rhs, &bias, &dst });

2168

for(auto &tensor : post_op_tensors_holder)

2169

{

2170

add_padding_x({ &tensor });

}

// Allocate tensors

lhs.allocator()->allocate();

2175

rhs.allocator()->allocate();

2176

bias.allocator()->allocate();

2177

dst.allocator()->allocate();

2178

for(auto &tensor : post_op_tensors_holder)

2179

{

2180

tensor.allocator()->allocate();

2181

}

2182

2183

ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());

2184

ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());

2185

ARM_COMPUTE_ASSERT(!bias.info()->is_resizable());

2186

ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());

2187

for(const auto &tensor : post_op_tensors_holder)

2188

{

2189

ARM_COMPUTE_ASSERT(!tensor.info()->is_resizable());

}

// Fill tensors

fill(AccessorType(lhs), 0);

2194

fill(AccessorType(rhs), 1);

2195

fill(AccessorType(bias), 2);

2196

for(size_t i = 0; i < post_op_tensors_holder.size(); ++i)

2197

{

2198

fill(AccessorType(post_op_tensors_holder.at(i)), 3 + i);

}

// Compute GEMM

ITensorPack gemm_pack({ { ACL_SRC_0, &lhs },

2203

{ ACL_SRC_1, &rhs },

2204

{ ACL_SRC_2, &bias },

2205

{ ACL_DST, &dst }

2206

});

2207

for(size_t i = 0; i < post_op_tensors_holder.size(); ++i)

2208

{

2209

gemm_pack.add_tensor(experimental::get_post_op_arg_type(i), &post_op_tensors_holder.at(i));

}

gemm.run(gemm_pack);

return dst;

}

SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, bool broadcast_bias,

2217

const ActivationLayerInfo &act_info, const experimental::PostOpList<TensorShape> &post_ops)

2218

{

2219

TensorShape dst_shape = lhs_shape;

2220

dst_shape[0] = rhs_shape[0];

2221

dst_shape[1] = lhs_shape[1];

2222

2223

// Create reference

2224

SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };

2225

SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };

2226

SimpleTensor<T> bias{ dst_shape, data_type, 1 };

2227

// Create post op tensors and populate post op with them

2228

auto populated_post_ops = experimental::transform_post_op_list_arguments<TensorShape, SimpleTensor<T>>(post_ops, [&data_type](auto shape)

2229

{

2230

return SimpleTensor<T> { shape, data_type, 1 };

2231

});

2232

2233

const int n = rhs_shape[0];

2234

const int m = lhs_shape[1];

2235

const int batch_size = lhs_shape[2];

// Fill reference

int tensor_idx = 0;

fill(lhs, tensor_idx++);

2240

fill(rhs, tensor_idx++);

2241

fill(bias, tensor_idx++);

2242

for(auto &op : populated_post_ops.get_list())

2243

{

2244

for(auto tensor : op->arguments())

2245

{

2246

fill(*tensor, tensor_idx++);

}

}

if(broadcast_bias)

{

// In case of broadcast, we need simply copy the first into the following "M" ones

2253

for(int i = 1; i < m * batch_size; i++)

2254

{

2255

memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));

}

}

SimpleTensor<T> out;

out = reference::gemm<T>(lhs, rhs, bias, alpha, beta);

2261

// Ignore activation info if post ops are used instead

2262

if(populated_post_ops.size() > 0)

2263

{

2264

out = reference::post_ops<T>(out, populated_post_ops);

}

else

{

out = reference::activation_layer(out, act_info);

}

return out;

}

TensorType _target{};

2274

SimpleTensor<T> _reference{};

2275

};

2276

2277

template <typename TensorType, typename AccessorType, typename T, typename GEMMOperatorType>

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

2278

class GEMMMatrixMultiplyNative3DValidationFixture : public framework::Fixture

2279

{

2280

public:

2281

template <typename...>

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

2282

void setup(unsigned int m_w, unsigned int m_h, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0, DataType data_type, float alpha, float beta,

2283

const ActivationLayerInfo &act_info)

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

2284

{

2285

GEMMLHSMatrixInfo lhs_info;

lhs_info.m0 = m0;

lhs_info.k0 = k0;

GEMMRHSMatrixInfo rhs_info;

rhs_info.n0 = n0;

rhs_info.k0 = k0;

// In case of GEMM3D, m is the product between m_w and m_h

2294

const unsigned int m = m_w * m_h;

2295

2296

// Set the tensor shapes for LHS and RHS matrices

2297

const TensorShape lhs_shape(k, m, batch_size);

2298

const TensorShape rhs_shape(n, k, batch_size);

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

2299

const TensorShape bias_shape(n, 1, 1);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

2300

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

2301

_target = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, m_h, act_info);

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

2302

_reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, m_h, act_info);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

}

protected:

template <typename U>

2307

void fill(U &&tensor, int i)

2308

{

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

2309

static_assert(std::is_floating_point<T>::value || std::is_same<T, half>::value, "Only floating point data types supported.");

Giorgio Arena

2021-01-08 10:37:15 +0000

[diff] [blame]

2310

using DistributionType = typename std::conditional<std::is_same<T, half>::value, arm_compute::utils::uniform_real_distribution_16bit<T>, std::uniform_real_distribution<T>>::type;

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

2311

2312

DistributionType distribution{ T(-1.0f), T(1.0f) };

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

2313

library->fill(tensor, distribution, i);

2314

}

2315

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

2316

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

2317

DataType data_type, float alpha, float beta, unsigned int m_h, const ActivationLayerInfo &act_info)

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

2318

{

2319

// Create tensors

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

2320

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

2321

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

2322

TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

2323

TensorType dst;

2324

2325

const unsigned int M = lhs_shape[1];

2326

const unsigned int N = rhs_shape[0];

2327

const unsigned int K = lhs_shape[0];

Gian Marco Iodice

2019-06-26 17:18:11 +0100

[diff] [blame]

2328

GEMMKernelInfo kernel_info;

kernel_info.m = M;

kernel_info.n = N;

kernel_info.k = K;

kernel_info.depth_output_gemm3d = m_h;

2333

kernel_info.reinterpret_input_as_3d = false;

2334

kernel_info.broadcast_bias = true;

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

2335

kernel_info.activation_info = act_info;

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

2336

2337

// The output tensor will be auto-initialized within the function

2338

2339

// Create and configure function

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

2340

GEMMOperatorType gemm;

2341

gemm.configure(lhs.info(), rhs.info(), bias.info(), dst.info(), alpha, beta, lhs_info, rhs_info, kernel_info);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

2342

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

2343

ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());

2344

ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());

2345

ARM_COMPUTE_ASSERT(bias.info()->is_resizable());

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

2346

Giorgio Arena

2021-03-25 14:54:50 +0000

[diff] [blame]

2347

add_padding_x({ &lhs, &rhs, &bias, &dst });

2348

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

2349

// Allocate tensors

2350

lhs.allocator()->allocate();

2351

rhs.allocator()->allocate();

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

2352

bias.allocator()->allocate();

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

2353

dst.allocator()->allocate();

2354

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

2355

ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());

2356

ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());

2357

ARM_COMPUTE_ASSERT(!bias.info()->is_resizable());

2358

ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

2359

2360

// Fill tensors

2361

fill(AccessorType(lhs), 0);

2362

fill(AccessorType(rhs), 1);

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

2363

fill(AccessorType(bias), 2);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

2364

2365

// Compute GEMM

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

2366

ITensorPack gemm_pack({ { ACL_SRC_0, &lhs },

2367

{ ACL_SRC_1, &rhs },

2368

{ ACL_SRC_2, &bias },

2369

{ ACL_DST, &dst }

2370

});

2371

gemm.run(gemm_pack);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

return dst;

}

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

2376

SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, unsigned int m_h,

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

2377

const ActivationLayerInfo &act_info)

giuros01