Blame - tests/validation/fixtures/GEMMFixture.h - ml/ComputeLibrary

2018-07-26 11:44:03 +0100

[diff] [blame]

48

class GEMMValidationFixture : public framework::Fixture

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

49

{

50

public:

51

template <typename...>

Pablo Tello

2018-10-30 11:18:37 +0000

[diff] [blame]

52

void setup(TensorShape shape_a, TensorShape shape_b, TensorShape shape_c, TensorShape output_shape, float alpha, float beta, bool pretranspose, DataType data_type)

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

53

{

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

54

ARM_COMPUTE_UNUSED(pretranspose);

55

_target = compute_target(shape_a, shape_b, shape_c, output_shape, alpha, beta, data_type);

56

_reference = compute_reference(shape_a, shape_b, output_shape, alpha, beta, data_type);

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

}

protected:

template <typename U>

Pablo Tello

2018-10-30 11:18:37 +0000

[diff] [blame]

61

void fill(U &&tensor, int i, float lo = -1.f, float hi = 1.f)

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

62

{

63

switch(tensor.data_type())

64

{

65

case DataType::F16:

Giorgio Arena

6aeb217

2020-12-15 15:45:43 +0000

[diff] [blame]

66

{

Giorgio Arena

a8e2aeb

2021-01-06 11:34:57 +0000

[diff] [blame]

67

arm_compute::utils::uniform_real_distribution_16bit<half> distribution{ float(lo), float(hi) };

Giorgio Arena

6aeb217

2020-12-15 15:45:43 +0000

[diff] [blame]

68

library->fill(tensor, distribution, i);

69

break;

70

}

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

71

case DataType::F32:

72

{

Giorgio Arena

6aeb217

2020-12-15 15:45:43 +0000

[diff] [blame]

73

std::uniform_real_distribution<float> distribution(lo, hi);

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

74

library->fill(tensor, distribution, i);

break;

}

default:

library->fill_tensor_uniform(tensor, i);

}

}

TensorType compute_target(const TensorShape &shape_a, const TensorShape &shape_b, const TensorShape &shape_c, const TensorShape &output_shape, float alpha, float beta,

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

83

DataType data_type)

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

84

{

85

// Create tensors

Vidhya Sudhan Loganathan

014333d

2018-07-02 09:13:49 +0100

[diff] [blame]

86

TensorType a = create_tensor<TensorType>(shape_a, data_type, 1);

87

TensorType b = create_tensor<TensorType>(shape_b, data_type, 1);

88

TensorType c = create_tensor<TensorType>(shape_c, data_type, 1);

89

TensorType dst = create_tensor<TensorType>(output_shape, data_type, 1);

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

90

91

// Create and configure function

92

FunctionType gemm;

Isabella Gottardi

8e74f44

2018-03-01 16:42:00 +0000

[diff] [blame]

93

// The GEMMinfo includes the values of the depth in case of reinterpreted 3d output.

Gian Marco Iodice

3139f03

2018-11-05 14:26:32 +0000

[diff] [blame]

94

// If the output shape has the same number of dimensions of the input the method called is a 2D matrix multiplication (depth_output_reinterpreted_as_3D = 0),

Isabella Gottardi

8e74f44

2018-03-01 16:42:00 +0000

[diff] [blame]

95

// in the other case we have to use the reinterpreted version of GEMM (depth_output_reinterpreted_as_3D = depth of the 3D output).

Gian Marco Iodice

2019-07-29 14:27:16 +0100

[diff] [blame]

96

gemm.configure(&a,

97

&b,

98

(disable_c) ? nullptr : &c,

99

&dst,

100

alpha, beta,

Georgios Pinitas

4ee8b15

2021-07-16 16:16:43 +0100

[diff] [blame]

101

GEMMInfo(false, false, false, (reinterpret_output_as_3d ? output_shape[2] : 0), reinterpret_input_as_3d, false, GEMMLowpOutputStageInfo(), false, false, (reinterpret_input_as_3d

Gian Marco Iodice

2019-07-29 14:27:16 +0100

[diff] [blame]

102

|| reinterpret_output_as_3d)));

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

103

ARM_COMPUTE_ASSERT(a.info()->is_resizable());

104

ARM_COMPUTE_ASSERT(b.info()->is_resizable());

105

ARM_COMPUTE_ASSERT(c.info()->is_resizable());

106

ARM_COMPUTE_ASSERT(dst.info()->is_resizable());

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

107

Giorgio Arena

2021-03-25 14:54:50 +0000

[diff] [blame]

108

add_padding_x({ &a, &b, &c, &dst });

109

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

110

// Allocate tensors

111

a.allocator()->allocate();

112

b.allocator()->allocate();

113

c.allocator()->allocate();

114

dst.allocator()->allocate();

115

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

116

ARM_COMPUTE_ASSERT(!a.info()->is_resizable());

117

ARM_COMPUTE_ASSERT(!b.info()->is_resizable());

118

ARM_COMPUTE_ASSERT(!c.info()->is_resizable());

119

ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

120

121

// Fill tensors

122

fill(AccessorType(a), 0);

123

fill(AccessorType(b), 1);

Pablo Tello

2018-10-30 11:18:37 +0000

[diff] [blame]

124

if(!disable_c)

125

{

126

fill(AccessorType(c), 2);

127

}

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

128

129

// Compute GEMM function

gemm.run();

return dst;

}

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

135

SimpleTensor<T> compute_reference(const TensorShape &shape_a, const TensorShape &shape_b, const TensorShape &output_shape, float alpha, float beta,

Vidhya Sudhan Loganathan

014333d

2018-07-02 09:13:49 +0100

[diff] [blame]

136

DataType data_type)

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

137

{

Gian Marco Iodice

2018-07-26 11:44:03 +0100

[diff] [blame]

138

TensorShape shape_a_to_use = shape_a;

Gian Marco Iodice

2019-07-29 14:27:16 +0100

[diff] [blame]

139

Gian Marco Iodice

2018-07-26 11:44:03 +0100

[diff] [blame]

140

if(reinterpret_input_as_3d)

141

{

142

// Collapse the second and third dimension if the input is 3D

143

shape_a_to_use.collapse(2U, 1U);

144

}

145

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

146

// Create reference

Gian Marco Iodice

2018-07-26 11:44:03 +0100

[diff] [blame]

147

SimpleTensor<T> a{ shape_a_to_use, data_type, 1 };

Vidhya Sudhan Loganathan

014333d

2018-07-02 09:13:49 +0100

[diff] [blame]

148

SimpleTensor<T> b{ shape_b, data_type, 1 };

Gian Marco Iodice

2019-07-29 14:27:16 +0100

[diff] [blame]

149

SimpleTensor<T> c{ output_shape, data_type, 1 };

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

// Fill reference

fill(a, 0);

fill(b, 1);

Gian Marco Iodice

2019-07-29 14:27:16 +0100

[diff] [blame]

154

fill(c, 2);

155

156

if(reinterpret_input_as_3d || reinterpret_output_as_3d)

Pablo Tello

2018-10-30 11:18:37 +0000

[diff] [blame]

157

{

Gian Marco Iodice

2019-07-29 14:27:16 +0100

[diff] [blame]

158

const int n = shape_b[0];

159

const int m = reinterpret_output_as_3d ? output_shape[1] * output_shape[2] : output_shape[1];

160

const int batch_size = reinterpret_output_as_3d ? output_shape[3] : output_shape[2];

161

162

// In case of broadcast, we need simply copy the first into the following "M" ones

163

for(int i = 1; i < m * batch_size; i++)

164

{

165

memcpy(c.data() + i * n, c.data(), n * sizeof(T));

166

}

Pablo Tello

2018-10-30 11:18:37 +0000

[diff] [blame]

167

}

Gian Marco Iodice

2019-07-29 14:27:16 +0100

[diff] [blame]

168

169

// Setting beta to 0 will effectively disable C for the

170

// computation of the reference: alpha * A * B + 0 * C

171

return reference::gemm<T>(a, b, c, alpha, disable_c ? 0.f : beta);

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

172

}

173

174

TensorType _target{};

175

SimpleTensor<T> _reference{};

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

176

};

177

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

178

template <typename TensorType, typename AccessorType, typename T, typename GEMMOperatorType>

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

179

class GEMMMatrixMultiplyValidationFixture : public framework::Fixture

180

{

181

public:

182

template <typename...>

183

void setup(unsigned int m, unsigned int n, unsigned int k, unsigned int batch_size, float alpha, float beta, bool broadcast_bias, bool fp16_mixed_precision, const ActivationLayerInfo &act_info,

184

DataType data_type, GPUTarget gpu_arch)

185

{

186

// Set the tensor shapes for LHS and RHS matrices

187

const TensorShape lhs_shape(k, m, batch_size);

188

const TensorShape rhs_shape(n, k, batch_size);

189

const TensorShape bias_shape(n,

190

broadcast_bias ? 1 : m,

191

broadcast_bias ? 1 : batch_size);

192

193

_target = compute_target(lhs_shape, rhs_shape, bias_shape, data_type, alpha, beta, broadcast_bias, fp16_mixed_precision, act_info, gpu_arch);

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

194

_reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, broadcast_bias, act_info);

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

}

protected:

template <typename U>

199

void fill(U &&tensor, int i)

200

{

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

201

static_assert(std::is_floating_point<T>::value || std::is_same<T, half>::value, "Only floating point data types supported.");

Giorgio Arena

2021-01-08 10:37:15 +0000

[diff] [blame]

202

using DistributionType = typename std::conditional<std::is_same<T, half>::value, arm_compute::utils::uniform_real_distribution_16bit<T>, std::uniform_real_distribution<T>>::type;

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

203

204

DistributionType distribution{ T(-1.0f), T(1.0f) };

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

205

library->fill(tensor, distribution, i);

206

207

// Fill border with infinity in order to check the presence of NaN values (i.e. inf * 0)

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

208

DistributionType distribution_inf{ T(std::numeric_limits<float>::infinity()), T(std::numeric_limits<float>::infinity()) };

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

209

library->fill_borders_with_garbage(tensor, distribution_inf, i);

210

}

211

212

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, DataType data_type, float alpha, float beta, bool broadcast_bias,

213

bool fp16_mixed_precision, const ActivationLayerInfo &act_info, GPUTarget gpu_arch)

214

{

215

// Create tensors

216

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

217

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

218

TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);

219

TensorType dst;

220

221

const unsigned int m = lhs_shape[1];

222

const unsigned int n = rhs_shape[0];

223

const unsigned int k = lhs_shape[0];

224

GEMMReshapeInfo reshape_info(m, n, k, 1, 1, 0, false, broadcast_bias);

225

226

// The output tensor will be auto-initialized within the function

227

228

// Create and configure function

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

229

GEMMOperatorType gemm;

230

gemm.configure(gpu_arch, lhs.info(), rhs.info(), bias.info(), dst.info(), alpha, beta, false, reshape_info, fp16_mixed_precision, act_info);

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

231

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

232

ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());

233

ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());

234

ARM_COMPUTE_ASSERT(bias.info()->is_resizable());

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

235

Giorgio Arena

2021-03-25 14:54:50 +0000

[diff] [blame]

236

add_padding_x({ &lhs, &rhs, &bias, &dst });

237

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

238

// Allocate tensors

239

lhs.allocator()->allocate();

240

rhs.allocator()->allocate();

241

bias.allocator()->allocate();

242

dst.allocator()->allocate();

243

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

244

ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());

245

ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());

246

ARM_COMPUTE_ASSERT(!bias.info()->is_resizable());

247

ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

248

249

// Fill tensors

250

fill(AccessorType(lhs), 0);

251

fill(AccessorType(rhs), 1);

252

fill(AccessorType(bias), 2);

253

254

// Compute GEMM

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

255

ITensorPack gemm_pack({ { ACL_SRC_0, &lhs },

256

{ ACL_SRC_1, &rhs },

257

{ ACL_SRC_2, &bias },

258

{ ACL_DST, &dst }

259

});

260

gemm.run(gemm_pack);

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

return dst;

}

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

265

SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, bool broadcast_bias,

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

266

const ActivationLayerInfo &act_info)

267

{

268

TensorShape dst_shape = lhs_shape;

269

dst_shape[0] = rhs_shape[0];

270

dst_shape[1] = lhs_shape[1];

271

272

// Create reference

273

SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };

274

SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };

275

SimpleTensor<T> bias{ dst_shape, data_type, 1 };

276

277

const int n = rhs_shape[0];

278

const int m = lhs_shape[1];

279

const int batch_size = lhs_shape[2];

// Fill reference

fill(lhs, 0);

fill(rhs, 1);

fill(bias, 2);

if(broadcast_bias)

{

// In case of broadcast, we need simply copy the first into the following "M" ones

289

for(int i = 1; i < m * batch_size; i++)

290

{

291

memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));

}

}

return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);

296

}

297

298

TensorType _target{};

299

SimpleTensor<T> _reference{};

300

};

301

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

302

template <typename TensorType, typename AccessorType, typename T, typename GEMMOperatorType>

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

303

class GEMMMatrixMultiply3DValidationFixture : public framework::Fixture

304

{

305

public:

306

template <typename...>

307

void setup(unsigned int m_w, unsigned int m_h, unsigned int n, unsigned int k, unsigned int batch_size, float alpha, float beta, bool broadcast_bias, bool fp16_mixed_precision,

308

const ActivationLayerInfo &act_info, DataType data_type, GPUTarget gpu_arch)

309

{

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

310

ARM_COMPUTE_UNUSED(broadcast_bias);

311

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

312

// In case of GEMM3D, m is the product between m_w and m_h

313

const unsigned int m = m_w * m_h;

314

315

// Set the tensor shapes for LHS and RHS matrices

316

const TensorShape lhs_shape(k, m, batch_size);

317

const TensorShape rhs_shape(n, k, batch_size);

318

const TensorShape bias_shape(n, 1, 1);

319

320

_target = compute_target(lhs_shape, rhs_shape, bias_shape, data_type, alpha, beta, m_h, fp16_mixed_precision, act_info, gpu_arch);

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

321

_reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, m_h, act_info);

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

}

protected:

template <typename U>

326

void fill(U &&tensor, int i)

327

{

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

328

static_assert(std::is_floating_point<T>::value || std::is_same<T, half>::value, "Only floating point data types supported.");

Giorgio Arena

2021-01-08 10:37:15 +0000

[diff] [blame]

329

using DistributionType = typename std::conditional<std::is_same<T, half>::value, arm_compute::utils::uniform_real_distribution_16bit<T>, std::uniform_real_distribution<T>>::type;

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

330

331

DistributionType distribution{ T(-1.0f), T(1.0f) };

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

332

library->fill(tensor, distribution, i);

333

}

334

335

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, DataType data_type, float alpha, float beta, unsigned int m_h,

336

bool fp16_mixed_precision, const ActivationLayerInfo &act_info, GPUTarget gpu_arch)

337

{

338

// Create tensors

339

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

340

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

341

TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);

342

TensorType dst;

343

344

const unsigned int m = lhs_shape[1];

345

const unsigned int n = rhs_shape[0];

346

const unsigned int k = lhs_shape[0];

347

GEMMReshapeInfo reshape_info(m, n, k, 1, 1, m_h, false, true);

348

349

// The output tensor will be auto-initialized within the function

350

351

// Create and configure function

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

352

GEMMOperatorType gemm;

353

gemm.configure(gpu_arch, lhs.info(), rhs.info(), bias.info(), dst.info(), alpha, beta, false, reshape_info, fp16_mixed_precision, act_info);

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

354

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

355

ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());

356

ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());

357

ARM_COMPUTE_ASSERT(bias.info()->is_resizable());

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

358

Giorgio Arena

2021-03-25 14:54:50 +0000

[diff] [blame]

359

add_padding_x({ &lhs, &rhs, &bias, &dst });

360

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

361

// Allocate tensors

362

lhs.allocator()->allocate();

363

rhs.allocator()->allocate();

364

bias.allocator()->allocate();

365

dst.allocator()->allocate();

366

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

367

ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());

368

ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());

369

ARM_COMPUTE_ASSERT(!bias.info()->is_resizable());

370

ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

371

372

// Fill tensors

373

fill(AccessorType(lhs), 0);

374

fill(AccessorType(rhs), 1);

375

fill(AccessorType(bias), 2);

376

377

// Compute GEMM

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

378

ITensorPack gemm_pack({ { ACL_SRC_0, &lhs },

379

{ ACL_SRC_1, &rhs },

380

{ ACL_SRC_2, &bias },

381

{ ACL_DST, &dst }

382

});

383

gemm.run(gemm_pack);

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

return dst;

}

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

388

SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, unsigned int m_h,

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

389

const ActivationLayerInfo &act_info)

390

{

391

TensorShape dst_shape = lhs_shape;

392

dst_shape.set(0, rhs_shape[0]);

393

dst_shape.set(1, lhs_shape[1] / m_h);

394

dst_shape.set(2, m_h);

395

dst_shape.set(3, lhs_shape[2]);

396

397

// Create reference

398

SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };

399

SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };

400

SimpleTensor<T> bias{ dst_shape, data_type, 1 };

401

402

const int n = rhs_shape[0];

403

const int m = lhs_shape[1];

404

const int batch_size = lhs_shape[2];

// Fill reference

fill(lhs, 0);

fill(rhs, 1);

fill(bias, 2);

// In case of broadcast, we need simply copy the first into the following "M" ones

412

for(int i = 1; i < m * batch_size; i++)

413

{

414

memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));

415

}

416

417

return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);

418

}

419

420

TensorType _target{};

421

SimpleTensor<T> _reference{};

422

};

423

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

424

template <typename TensorType, typename AccessorType, typename T, typename ReshapeLHSOperatorType, typename ReshapeRHSOperatorType, typename GEMMOperatorType>

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

425

class GEMMMatrixMultiplyInterleavedTransposedValidationFixture : public framework::Fixture

426

{

427

public:

428

template <typename...>

429

void setup(unsigned int m, unsigned int n, unsigned int k, unsigned int batch_size, float alpha, float beta, unsigned int v0, unsigned int h0, bool broadcast_bias, bool fp16_mixed_precision,

430

const ActivationLayerInfo &act_info, DataType data_type, GPUTarget gpu_arch)

431

{

432

GEMMLHSMatrixInfo lhs_info;

lhs_info.m0 = 4;

lhs_info.k0 = 4;

lhs_info.v0 = v0;

lhs_info.interleave = true;

437

lhs_info.transpose = true;

438

439

GEMMRHSMatrixInfo rhs_info;

440

rhs_info.n0 = 16 / sizeof(T);

441

rhs_info.k0 = 1;

442

rhs_info.h0 = h0;

443

rhs_info.interleave = false;

444

rhs_info.transpose = false;

445

446

// Set the tensor shapes for LHS and RHS matrices

447

const TensorShape lhs_shape(k, m, batch_size);

448

const TensorShape rhs_shape(n, k, batch_size);

449

const TensorShape bias_shape(n,

450

broadcast_bias ? 1 : m,

451

broadcast_bias ? 1 : batch_size);

452

453

_target = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, broadcast_bias, fp16_mixed_precision, act_info, gpu_arch);

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

454

_reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, broadcast_bias, act_info);

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

}

protected:

template <typename U>

459

void fill(U &&tensor, int i)

460

{

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

461

static_assert(std::is_floating_point<T>::value || std::is_same<T, half>::value, "Only floating point data types supported.");

Giorgio Arena

2021-01-08 10:37:15 +0000

[diff] [blame]

462

using DistributionType = typename std::conditional<std::is_same<T, half>::value, arm_compute::utils::uniform_real_distribution_16bit<T>, std::uniform_real_distribution<T>>::type;

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

463

464

DistributionType distribution{ T(-1.0f), T(1.0f) };

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

465

library->fill(tensor, distribution, i);

466

467

// Fill border with infinity in order to check the presence of NaN values (i.e. inf * 0)

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

468

DistributionType distribution_inf{ T(std::numeric_limits<float>::infinity()), T(std::numeric_limits<float>::infinity()) };

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

469

library->fill_borders_with_garbage(tensor, distribution_inf, i);

470

}

471

472

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,

473

DataType data_type, float alpha, float beta, bool broadcast_bias, bool fp16_mixed_precision, const ActivationLayerInfo &act_info, GPUTarget gpu_arch)

474

{

475

// Create tensors

476

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

477

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

478

TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);

479

TensorType lhs_reshaped;

480

TensorType rhs_reshaped;

481

TensorType dst;

482

483

const unsigned int m = lhs_shape[1];

484

const unsigned int n = rhs_shape[0];

485

const unsigned int k = lhs_shape[0];

486

GEMMReshapeInfo reshape_info(m, n, k, rhs_info.h0, lhs_info.v0, 0, false, broadcast_bias);

487

488

// The output tensor will be auto-initialized within the function

489

490

// Create and configure function

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

491

ReshapeLHSOperatorType reshape_lhs;

492

ReshapeRHSOperatorType reshape_rhs;

493

GEMMOperatorType gemm;

494

reshape_lhs.configure(lhs.info(), lhs_reshaped.info(), lhs_info);

495

reshape_rhs.configure(rhs.info(), rhs_reshaped.info(), rhs_info);

496

gemm.configure(gpu_arch, lhs_reshaped.info(), rhs_reshaped.info(), bias.info(), dst.info(), alpha, beta, true, reshape_info, fp16_mixed_precision, act_info);

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

497

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

498

ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());

499

ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());

500

ARM_COMPUTE_ASSERT(bias.info()->is_resizable());

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

501

Georgios Pinitas

2021-04-13 13:35:58 +0100

[diff] [blame]

502

// We do not pad when using image as it needs to comply to strict pitch alignment restrictions

Giorgio Arena

2021-03-25 14:54:50 +0000

[diff] [blame]

503

if(!rhs_info.export_to_cl_image)

504

{

505

add_padding_x({ &lhs, &rhs, &lhs_reshaped, &rhs_reshaped, &bias, &dst });

506

}

507

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

508

// Allocate tensors

509

lhs.allocator()->allocate();

510

rhs.allocator()->allocate();

511

lhs_reshaped.allocator()->allocate();

512

rhs_reshaped.allocator()->allocate();

513

bias.allocator()->allocate();

514

dst.allocator()->allocate();

515

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

516

ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());

517

ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());

518

ARM_COMPUTE_ASSERT(!bias.info()->is_resizable());

519

ARM_COMPUTE_ASSERT(!lhs_reshaped.info()->is_resizable());

520

ARM_COMPUTE_ASSERT(!rhs_reshaped.info()->is_resizable());

521

ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

522

523

// Fill tensors

524

fill(AccessorType(lhs), 0);

525

fill(AccessorType(rhs), 1);

526

fill(AccessorType(bias), 2);

527

528

// Compute GEMM

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

529

ITensorPack reshape_lhs_pack = { { ACL_SRC, &lhs }, { ACL_DST, &lhs_reshaped } };

530

reshape_lhs.run(reshape_lhs_pack);

531

ITensorPack reshape_rhs_pack = { { ACL_SRC, &rhs }, { ACL_DST, &rhs_reshaped } };

532

reshape_rhs.run(reshape_rhs_pack);

533

ITensorPack gemm_pack({ { ACL_SRC_0, &lhs_reshaped },

534

{ ACL_SRC_1, &rhs_reshaped },

535

{ ACL_SRC_2, &bias },

536

{ ACL_DST, &dst }

537

});

538

gemm.run(gemm_pack);

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

return dst;

}

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

543

SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, bool broadcast_bias,

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

544

const ActivationLayerInfo &act_info)

545

{

546

TensorShape dst_shape = lhs_shape;

547

dst_shape[0] = rhs_shape[0];

548

dst_shape[1] = lhs_shape[1];

549

550

// Create reference

551

SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };

552

SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };

553

SimpleTensor<T> bias{ dst_shape, data_type, 1 };

554

555

const int n = rhs_shape[0];

556

const int m = lhs_shape[1];

557

const int batch_size = lhs_shape[2];

// Fill reference

fill(lhs, 0);

fill(rhs, 1);

fill(bias, 2);

if(broadcast_bias)

{

// In case of broadcast, we need simply copy the first into the following "M" ones

567

for(int i = 1; i < m * batch_size; i++)

568

{

569

memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));

}

}

return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);

574

}

575

576

TensorType _target{};

577

SimpleTensor<T> _reference{};

578

};

579

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

580

template <typename TensorType, typename AccessorType, typename T, typename ReshapeLHSOperatorType, typename ReshapeRHSOperatorType, typename GEMMOperatorType>

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

581

class GEMMMatrixMultiplyInterleavedTransposed3DValidationFixture : public framework::Fixture

582

{

583

public:

584

template <typename...>

585

void setup(unsigned int m_w, unsigned int m_h, unsigned int n, unsigned int k, unsigned int batch_size, float alpha, float beta, unsigned int v0, unsigned int h0, bool broadcast_bias,

586

bool fp16_mixed_precision, const ActivationLayerInfo &act_info, DataType data_type, GPUTarget gpu_arch)

587

{

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

588

ARM_COMPUTE_UNUSED(broadcast_bias);

589

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

590

GEMMLHSMatrixInfo lhs_info;

lhs_info.m0 = 4;

lhs_info.k0 = 4;

lhs_info.v0 = v0;

lhs_info.interleave = true;

595

lhs_info.transpose = true;

596

597

GEMMRHSMatrixInfo rhs_info;

598

rhs_info.n0 = 16 / sizeof(T);

599

rhs_info.k0 = 1;

600

rhs_info.h0 = h0;

601

rhs_info.interleave = false;

602

rhs_info.transpose = false;

603

604

// In case of GEMM3D, m is the product between m_w and m_h

605

const unsigned int m = m_w * m_h;

606

607

// Set the tensor shapes for LHS and RHS matrices

608

const TensorShape lhs_shape(k, m, batch_size);

609

const TensorShape rhs_shape(n, k, batch_size);

610

const TensorShape bias_shape(n, 1, 1);

611

612

_target = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, m_h, fp16_mixed_precision, act_info, gpu_arch);

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

613

_reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, m_h, act_info);

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

}

protected:

template <typename U>

618

void fill(U &&tensor, int i)

619

{

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

620

static_assert(std::is_floating_point<T>::value || std::is_same<T, half>::value, "Only floating point data types supported.");

Giorgio Arena

2021-01-08 10:37:15 +0000

[diff] [blame]

621

using DistributionType = typename std::conditional<std::is_same<T, half>::value, arm_compute::utils::uniform_real_distribution_16bit<T>, std::uniform_real_distribution<T>>::type;

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

622

623

DistributionType distribution{ T(-1.0f), T(1.0f) };

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

624

library->fill(tensor, distribution, i);

625

}

626

627

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,

628

DataType data_type, float alpha, float beta, unsigned int m_h, bool fp16_mixed_precision, const ActivationLayerInfo &act_info, GPUTarget gpu_arch)

629

{

630

// Create tensors

631

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

632

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

633

TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);

634

TensorType lhs_reshaped;

635

TensorType rhs_reshaped;

636

TensorType dst;

637

638

const unsigned int m = lhs_shape[1];

639

const unsigned int n = rhs_shape[0];

640

const unsigned int k = lhs_shape[0];

641

GEMMReshapeInfo reshape_info(m, n, k, rhs_info.h0, lhs_info.v0, m_h, false, true);

642

643

// The output tensor will be auto-initialized within the function

644

645

// Create and configure function

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

646

ReshapeLHSOperatorType reshape_lhs;

647

ReshapeRHSOperatorType reshape_rhs;

648

GEMMOperatorType gemm;

649

reshape_lhs.configure(lhs.info(), lhs_reshaped.info(), lhs_info);

650

reshape_rhs.configure(rhs.info(), rhs_reshaped.info(), rhs_info);

651

gemm.configure(gpu_arch, lhs_reshaped.info(), rhs_reshaped.info(), bias.info(), dst.info(), alpha, beta, true, reshape_info, fp16_mixed_precision, act_info);

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

652

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

653

ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());

654

ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());

655

ARM_COMPUTE_ASSERT(bias.info()->is_resizable());

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

656

Georgios Pinitas

2021-04-13 13:35:58 +0100

[diff] [blame]

657

// We do not pad when using image as it needs to comply to strict pitch alignment restrictions

Giorgio Arena

2021-03-25 14:54:50 +0000

[diff] [blame]

658

if(!rhs_info.export_to_cl_image)

659

{

660

add_padding_x({ &lhs, &rhs, &lhs_reshaped, &rhs_reshaped, &bias, &dst });

661

}

662

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

663

// Allocate tensors

664

lhs.allocator()->allocate();

665

rhs.allocator()->allocate();

666

lhs_reshaped.allocator()->allocate();

667

rhs_reshaped.allocator()->allocate();

668

bias.allocator()->allocate();

669

dst.allocator()->allocate();

670

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

671

ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());

672

ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());

673

ARM_COMPUTE_ASSERT(!lhs_reshaped.info()->is_resizable());

674

ARM_COMPUTE_ASSERT(!rhs_reshaped.info()->is_resizable());

675

ARM_COMPUTE_ASSERT(!bias.info()->is_resizable());

676

ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

677

678

// Fill tensors

679

fill(AccessorType(lhs), 0);

680

fill(AccessorType(rhs), 1);

681

fill(AccessorType(bias), 2);

682

683

// Compute GEMM

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

684

ITensorPack reshape_lhs_pack = { { ACL_SRC, &lhs }, { ACL_DST, &lhs_reshaped } };

685

reshape_lhs.run(reshape_lhs_pack);

686

ITensorPack reshape_rhs_pack = { { ACL_SRC, &rhs }, { ACL_DST, &rhs_reshaped } };

687

reshape_rhs.run(reshape_rhs_pack);

688

ITensorPack gemm_pack({ { ACL_SRC_0, &lhs_reshaped },

689

{ ACL_SRC_1, &rhs_reshaped },

690

{ ACL_SRC_2, &bias },

691

{ ACL_DST, &dst }

692

});

693

gemm.run(gemm_pack);

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

return dst;

}

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

698

SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, unsigned int m_h,

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

699

const ActivationLayerInfo &act_info)

700

{

701

TensorShape dst_shape = lhs_shape;

702

dst_shape.set(0, rhs_shape[0]);

703

dst_shape.set(1, lhs_shape[1] / m_h);

704

dst_shape.set(2, m_h);

705

dst_shape.set(3, lhs_shape[2]);

706

707

// Create reference

708

SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };

709

SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };

710

SimpleTensor<T> bias{ dst_shape, data_type, 1 };

711

712

const int n = rhs_shape[0];

713

const int m = lhs_shape[1];

714

const int batch_size = lhs_shape[2];

// Fill reference

fill(lhs, 0);

fill(rhs, 1);

fill(bias, 2);

// In case of broadcast, we need simply copy the first into the following "M" ones

722

for(int i = 1; i < m * batch_size; i++)

723

{

724

memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));

725

}

726

727

return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);

728

}

729

730

TensorType _target{};

731

SimpleTensor<T> _reference{};

732

};

733

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

734

template <typename TensorType, typename AccessorType, typename T, typename ReshapeLHSOperatorType, typename ReshapeRHSOperatorType, typename GEMMOperatorType, bool fp_mixed_precision = false>

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

735

class GEMMMatrixMultiplyReshapedValidationFixture : public framework::Fixture

736

{

737

public:

738

template <typename...>

739

void setup(unsigned int m, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0, unsigned int v0, unsigned int h0, bool interleave_lhs,

Gian Marco Iodice

2020-06-10 17:59:30 +0100

[diff] [blame]

740

bool interleave_rhs, bool export_to_cl_image, DataType data_type, float alpha, float beta, bool broadcast_bias, bool lhs_transpose, const ActivationLayerInfo &act_info)

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

741

{

742

GEMMLHSMatrixInfo lhs_info;

lhs_info.m0 = m0;

lhs_info.k0 = k0;

lhs_info.v0 = v0;

lhs_info.interleave = interleave_lhs;

Giorgio Arena

ae99b6e

2019-08-01 14:22:12 +0100

[diff] [blame]

747

lhs_info.transpose = lhs_transpose;

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

748

749

GEMMRHSMatrixInfo rhs_info;

Gian Marco Iodice

2020-06-10 17:59:30 +0100

[diff] [blame]

rhs_info.n0 = n0;

rhs_info.k0 = k0;

rhs_info.h0 = h0;

rhs_info.interleave = interleave_rhs;

754

rhs_info.transpose = !lhs_transpose;

755

rhs_info.export_to_cl_image = export_to_cl_image;

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

756

757

// Set the tensor shapes for LHS and RHS matrices

758

const TensorShape lhs_shape(k, m, batch_size);

759

const TensorShape rhs_shape(n, k, batch_size);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

760

const TensorShape bias_shape(n,

761

broadcast_bias ? 1 : m,

762

broadcast_bias ? 1 : batch_size);

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

763

Sheri Zhang

2020-11-16 21:17:28 +0000

[diff] [blame]

764

_target = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, broadcast_bias, act_info);

765

if(validate_result)

766

{

767

_reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, broadcast_bias, act_info);

768

}

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

}

protected:

template <typename U>

773

void fill(U &&tensor, int i)

774

{

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

775

static_assert(std::is_floating_point<T>::value || std::is_same<T, half>::value, "Only floating point data types supported.");

Giorgio Arena

2021-01-08 10:37:15 +0000

[diff] [blame]

776

using DistributionType = typename std::conditional<std::is_same<T, half>::value, arm_compute::utils::uniform_real_distribution_16bit<T>, std::uniform_real_distribution<T>>::type;

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

777

778

DistributionType distribution{ T(-1.0f), T(1.0f) };

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

779

library->fill(tensor, distribution, i);

Gian Marco Iodice

b87b95e

2019-01-21 17:14:31 +0000

[diff] [blame]

780

781

// Fill border with infinity in order to check the presence of NaN values (i.e. inf * 0)

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

782

DistributionType distribution_inf{ T(std::numeric_limits<float>::infinity()), T(std::numeric_limits<float>::infinity()) };

Gian Marco Iodice

b87b95e

2019-01-21 17:14:31 +0000

[diff] [blame]

783

library->fill_borders_with_garbage(tensor, distribution_inf, i);

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

784

}

785

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

786

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

787

DataType data_type, float alpha, float beta, bool broadcast_bias, const ActivationLayerInfo &act_info)

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

788

{

789

// Create tensors

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

790

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

791

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

792

TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

793

TensorType lhs_reshaped;

794

TensorType rhs_reshaped;

795

TensorType dst;

796

797

const unsigned int M = lhs_shape[1];

798

const unsigned int N = rhs_shape[0];

799

const unsigned int K = lhs_shape[0];

Gian Marco Iodice

2019-06-26 17:18:11 +0100

[diff] [blame]

800

GEMMKernelInfo kernel_info;

kernel_info.m = M;

kernel_info.n = N;

kernel_info.k = K;

kernel_info.depth_output_gemm3d = 0;

805

kernel_info.reinterpret_input_as_3d = false;

806

kernel_info.broadcast_bias = broadcast_bias;

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

807

kernel_info.activation_info = act_info;

Gian Marco Iodice

0c17aa2

2019-09-27 09:23:15 +0100

[diff] [blame]

808

kernel_info.fp_mixed_precision = fp_mixed_precision;

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

809

810

// The output tensor will be auto-initialized within the function

811

812

// Create and configure function

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

813

ReshapeLHSOperatorType reshape_lhs;

814

ReshapeRHSOperatorType reshape_rhs;

815

GEMMOperatorType gemm;

Sheri Zhang

2020-11-16 21:17:28 +0000

[diff] [blame]

816

817

validate_result = bool(reshape_rhs.validate(rhs.info(), rhs_reshaped.info(), rhs_info));

818

validate_result = validate_result || !rhs_info.export_to_cl_image;

if(!validate_result)

{

return nullptr;

}

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

824

reshape_lhs.configure(lhs.info(), lhs_reshaped.info(), lhs_info);

825

reshape_rhs.configure(rhs.info(), rhs_reshaped.info(), rhs_info);

826

gemm.configure(lhs_reshaped.info(), rhs_reshaped.info(), bias.info(), dst.info(), alpha, beta, lhs_info, rhs_info, kernel_info);

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

827

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

828

ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());

829

ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());

830

ARM_COMPUTE_ASSERT(bias.info()->is_resizable());

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

831

Georgios Pinitas

2021-04-13 13:35:58 +0100

[diff] [blame]

832

// We do not pad when using image as it needs to comply to strict pitch alignment restrictions

Giorgio Arena

2021-03-25 14:54:50 +0000

[diff] [blame]

833

if(!rhs_info.export_to_cl_image)

834

{

835

add_padding_x({ &lhs, &rhs, &lhs_reshaped, &rhs_reshaped, &bias, &dst });

836

}

837

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

838

// Allocate tensors

839

lhs.allocator()->allocate();

840

rhs.allocator()->allocate();

841

lhs_reshaped.allocator()->allocate();

842

rhs_reshaped.allocator()->allocate();

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

843

bias.allocator()->allocate();

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

844

dst.allocator()->allocate();

845

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

846

ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());

847

ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());

848

ARM_COMPUTE_ASSERT(!bias.info()->is_resizable());

849

ARM_COMPUTE_ASSERT(!lhs_reshaped.info()->is_resizable());

850

ARM_COMPUTE_ASSERT(!rhs_reshaped.info()->is_resizable());

851

ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

852

853

// Fill tensors

854

fill(AccessorType(lhs), 0);

855

fill(AccessorType(rhs), 1);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

856

fill(AccessorType(bias), 2);

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

857

858

// Compute GEMM

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

859

ITensorPack reshape_lhs_pack = { { ACL_SRC, &lhs }, { ACL_DST, &lhs_reshaped } };

860

reshape_lhs.run(reshape_lhs_pack);

861

ITensorPack reshape_rhs_pack = { { ACL_SRC, &rhs }, { ACL_DST, &rhs_reshaped } };

862

reshape_rhs.run(reshape_rhs_pack);

863

ITensorPack gemm_pack({ { ACL_SRC_0, &lhs_reshaped },

864

{ ACL_SRC_1, &rhs_reshaped },

865

{ ACL_SRC_2, &bias },

866

{ ACL_DST, &dst }

867

});

868

gemm.run(gemm_pack);

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

return dst;

}

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

873

SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, bool broadcast_bias,

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

874

const ActivationLayerInfo &act_info)

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

875

{

876

TensorShape dst_shape = lhs_shape;

877

dst_shape[0] = rhs_shape[0];

878

dst_shape[1] = lhs_shape[1];

879

880

// Create reference

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

881

SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };

882

SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

883

SimpleTensor<T> bias{ dst_shape, data_type, 1 };

884

885

const int n = rhs_shape[0];

886

const int m = lhs_shape[1];

887

const int batch_size = lhs_shape[2];

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

// Fill reference

fill(lhs, 0);

fill(rhs, 1);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

892

fill(bias, 2);

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

893

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

894

if(broadcast_bias)

895

{

896

// In case of broadcast, we need simply copy the first into the following "M" ones

897

for(int i = 1; i < m * batch_size; i++)

898

{

899

memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));

}

}

Gian Marco Iodice

2019-09-27 09:23:15 +0100

[diff] [blame]

903

if(fp_mixed_precision)

904

{

905

return reference::activation_layer(reference::gemm_mixed_precision<T>(lhs, rhs, bias, alpha, beta), act_info);

}

else

{

return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);

910

}

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

911

}

912

Sheri Zhang

2020-11-16 21:17:28 +0000

[diff] [blame]

913

bool validate_result = true;

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

914

TensorType _target{};

915

SimpleTensor<T> _reference{};

916

};

917

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

918

template <typename TensorType, typename AccessorType, typename T, typename ReshapeLHSOperatorType, typename ReshapeRHSOperatorType, typename GEMMOperatorType, bool fp_mixed_precision = false>

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

919

class GEMMMatrixMultiplyReshaped3DValidationFixture : public framework::Fixture

920

{

921

public:

922

template <typename...>

923

void setup(unsigned int m_w, unsigned int m_h, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0, unsigned int v0, unsigned int h0,

Gian Marco Iodice

2020-06-10 17:59:30 +0100

[diff] [blame]

924

bool interleave_lhs, bool interleave_rhs, bool export_to_cl_image, DataType data_type, float alpha, float beta, bool lhs_transpose, const ActivationLayerInfo &act_info)

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

925

{

926

GEMMLHSMatrixInfo lhs_info;

lhs_info.m0 = m0;

lhs_info.k0 = k0;

lhs_info.v0 = v0;

lhs_info.interleave = interleave_lhs;

Giorgio Arena

ae99b6e

2019-08-01 14:22:12 +0100

[diff] [blame]

931

lhs_info.transpose = lhs_transpose;

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

932

933

GEMMRHSMatrixInfo rhs_info;

Gian Marco Iodice

2020-06-10 17:59:30 +0100

[diff] [blame]

rhs_info.n0 = n0;

rhs_info.k0 = k0;

rhs_info.h0 = h0;

rhs_info.interleave = interleave_rhs;

938

rhs_info.transpose = !lhs_transpose;

939

rhs_info.export_to_cl_image = export_to_cl_image;

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

940

941

// In case of GEMM3D, m is the product between m_w and m_h

942

const unsigned int m = m_w * m_h;

943

944

// Set the tensor shapes for LHS and RHS matrices

945

const TensorShape lhs_shape(k, m, batch_size);

946

const TensorShape rhs_shape(n, k, batch_size);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

947

const TensorShape bias_shape(n, 1, 1);

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

948

Sheri Zhang

2020-11-16 21:17:28 +0000

[diff] [blame]

949

_target = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, m_h, act_info);

950

if(validate_result)

951

{

952

_reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, m_h, act_info);

953

}

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

}

protected:

template <typename U>

958

void fill(U &&tensor, int i)

959

{

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

960

static_assert(std::is_floating_point<T>::value || std::is_same<T, half>::value, "Only floating point data types supported.");

Giorgio Arena

2021-01-08 10:37:15 +0000

[diff] [blame]

961

using DistributionType = typename std::conditional<std::is_same<T, half>::value, arm_compute::utils::uniform_real_distribution_16bit<T>, std::uniform_real_distribution<T>>::type;

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

962

963

DistributionType distribution{ T(-1.0f), T(1.0f) };

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

964

library->fill(tensor, distribution, i);

965

}

966

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

967

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

968

DataType data_type, float alpha, float beta, unsigned int m_h, const ActivationLayerInfo &act_info)

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

969

{

970

// Create tensors

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

971

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

972

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

973

TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

974

TensorType lhs_reshaped;

975

TensorType rhs_reshaped;

976

TensorType dst;

977

978

const unsigned int M = lhs_shape[1];

979

const unsigned int N = rhs_shape[0];

980

const unsigned int K = lhs_shape[0];

Gian Marco Iodice

2019-06-26 17:18:11 +0100

[diff] [blame]

981

GEMMKernelInfo kernel_info;

kernel_info.m = M;

kernel_info.n = N;

kernel_info.k = K;

kernel_info.depth_output_gemm3d = m_h;

986

kernel_info.reinterpret_input_as_3d = false;

987

kernel_info.broadcast_bias = true;

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

988

kernel_info.activation_info = act_info;

Gian Marco Iodice

0c17aa2

2019-09-27 09:23:15 +0100

[diff] [blame]

989

kernel_info.fp_mixed_precision = fp_mixed_precision;

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

990

991

// The output tensor will be auto-initialized within the function

992

993

// Create and configure function

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

994

ReshapeLHSOperatorType reshape_lhs;

995

ReshapeRHSOperatorType reshape_rhs;

996

GEMMOperatorType gemm;

Sheri Zhang

2020-11-16 21:17:28 +0000

[diff] [blame]

997

998

validate_result = bool(reshape_rhs.validate(rhs.info(), rhs_reshaped.info(), rhs_info));

999

validate_result = validate_result || !rhs_info.export_to_cl_image;

if(!validate_result)

{

return nullptr;

}

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1005

reshape_lhs.configure(lhs.info(), lhs_reshaped.info(), lhs_info);

1006

reshape_rhs.configure(rhs.info(), rhs_reshaped.info(), rhs_info);

1007

gemm.configure(lhs_reshaped.info(), rhs_reshaped.info(), bias.info(), dst.info(), alpha, beta, lhs_info, rhs_info, kernel_info);

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

1008

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

1009

ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());

1010

ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());

1011

ARM_COMPUTE_ASSERT(bias.info()->is_resizable());

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

1012

Georgios Pinitas

2021-04-13 13:35:58 +0100

[diff] [blame]

1013

// We do not pad when using image as it needs to comply to strict pitch alignment restrictions

Giorgio Arena

2021-03-25 14:54:50 +0000

[diff] [blame]

1014

if(!rhs_info.export_to_cl_image)

1015

{

1016

add_padding_x({ &lhs, &rhs, &lhs_reshaped, &rhs_reshaped, &bias, &dst });

1017

}

1018

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

1019

// Allocate tensors

1020

lhs.allocator()->allocate();

1021

rhs.allocator()->allocate();

1022

lhs_reshaped.allocator()->allocate();

1023

rhs_reshaped.allocator()->allocate();

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1024

bias.allocator()->allocate();

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

1025

dst.allocator()->allocate();

1026

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

1027

ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());

1028

ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());

1029

ARM_COMPUTE_ASSERT(!lhs_reshaped.info()->is_resizable());

1030

ARM_COMPUTE_ASSERT(!rhs_reshaped.info()->is_resizable());

1031

ARM_COMPUTE_ASSERT(!bias.info()->is_resizable());

1032

ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

1033

1034

// Fill tensors

1035

fill(AccessorType(lhs), 0);

1036

fill(AccessorType(rhs), 1);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1037

fill(AccessorType(bias), 2);

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

1038

1039

// Compute GEMM

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1040

ITensorPack reshape_lhs_pack = { { ACL_SRC, &lhs }, { ACL_DST, &lhs_reshaped } };

1041

reshape_lhs.run(reshape_lhs_pack);

1042

ITensorPack reshape_rhs_pack = { { ACL_SRC, &rhs }, { ACL_DST, &rhs_reshaped } };

1043

reshape_rhs.run(reshape_rhs_pack);

1044

ITensorPack gemm_pack({ { ACL_SRC_0, &lhs_reshaped },

1045

{ ACL_SRC_1, &rhs_reshaped },

1046

{ ACL_SRC_2, &bias },

1047

{ ACL_DST, &dst }

1048

});

1049

gemm.run(gemm_pack);

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

return dst;

}

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

1054

SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, unsigned int m_h,

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1055

const ActivationLayerInfo &act_info)

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

1056

{

1057

TensorShape dst_shape = lhs_shape;

1058

dst_shape.set(0, rhs_shape[0]);

1059

dst_shape.set(1, lhs_shape[1] / m_h);

1060

dst_shape.set(2, m_h);

1061

dst_shape.set(3, lhs_shape[2]);

1062

1063

// Create reference

1064

SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };

1065

SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1066

SimpleTensor<T> bias{ dst_shape, data_type, 1 };

1067

1068

const int n = rhs_shape[0];

1069

const int m = lhs_shape[1];

1070

const int batch_size = lhs_shape[2];

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

// Fill reference

fill(lhs, 0);

fill(rhs, 1);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1075

fill(bias, 2);

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

1076

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1077

// In case of broadcast, we need simply copy the first into the following "M" ones

1078

for(int i = 1; i < m * batch_size; i++)

1079

{

1080

memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));

1081

}

1082

Gian Marco Iodice

0c17aa2

2019-09-27 09:23:15 +0100

[diff] [blame]

1083

if(fp_mixed_precision)

1084

{

1085

return reference::activation_layer(reference::gemm_mixed_precision<T>(lhs, rhs, bias, alpha, beta), act_info);

}

else

{

return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);

1090

}

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

1091

}

1092

Sheri Zhang

2020-11-16 21:17:28 +0000

[diff] [blame]

1093

bool validate_result = true;

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

1094

TensorType _target{};

1095

SimpleTensor<T> _reference{};

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

1096

};

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1097

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1098

template <typename TensorType, typename AccessorType, typename T, typename ReshapeRHSOperatorType, typename GEMMOperatorType>

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1099

class GEMMMatrixMultiplyReshapedOnlyRHSValidationFixture : public framework::Fixture

1100

{

1101

public:

1102

template <typename...>

1103

void setup(unsigned int m, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0, unsigned int h0,

Gian Marco Iodice

781cba7

2020-06-19 16:56:57 +0100

[diff] [blame]

1104

bool interleave_rhs, bool transpose_rhs, bool export_to_cl_image, DataType data_type, float alpha, float beta, bool broadcast_bias, const ActivationLayerInfo &act_info)

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1105

{

1106

GEMMLHSMatrixInfo lhs_info;

lhs_info.m0 = m0;

lhs_info.k0 = k0;

GEMMRHSMatrixInfo rhs_info;

Gian Marco Iodice

781cba7

2020-06-19 16:56:57 +0100

[diff] [blame]

rhs_info.n0 = n0;

rhs_info.k0 = k0;

rhs_info.h0 = h0;

rhs_info.interleave = interleave_rhs;

1115

rhs_info.transpose = transpose_rhs;

1116

rhs_info.export_to_cl_image = export_to_cl_image;

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1117

1118

// Set the tensor shapes for LHS and RHS matrices

1119

const TensorShape lhs_shape(k, m, batch_size);

1120

const TensorShape rhs_shape(n, k, batch_size);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1121

const TensorShape bias_shape(n,

1122

broadcast_bias ? 1 : m,

1123

broadcast_bias ? 1 : batch_size);

Georgios Pinitas

2019-05-21 13:32:43 +0100

[diff] [blame]

1124

Sheri Zhang

2020-11-16 21:17:28 +0000

[diff] [blame]

1125

_target = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, broadcast_bias, act_info);

1126

if(validate_result)

1127

{

1128

_reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, broadcast_bias, act_info);

1129

}

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

}

protected:

template <typename U>

1134

void fill(U &&tensor, int i)

1135

{

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

1136

static_assert(std::is_floating_point<T>::value || std::is_same<T, half>::value, "Only floating point data types supported.");

Giorgio Arena

2021-01-08 10:37:15 +0000

[diff] [blame]

1137

using DistributionType = typename std::conditional<std::is_same<T, half>::value, arm_compute::utils::uniform_real_distribution_16bit<T>, std::uniform_real_distribution<T>>::type;

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

1138

1139

DistributionType distribution{ T(-1.0f), T(1.0f) };

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1140

library->fill(tensor, distribution, i);

1141

1142

// Fill border with infinity in order to check the presence of NaN values (i.e. inf * 0)

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

1143

DistributionType distribution_inf{ T(std::numeric_limits<float>::infinity()), T(std::numeric_limits<float>::infinity()) };

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1144

library->fill_borders_with_garbage(tensor, distribution_inf, i);

1145

}

1146

Georgios Pinitas

2019-05-21 13:32:43 +0100

[diff] [blame]

1147

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1148

DataType data_type, float alpha, float beta, bool broadcast_bias, const ActivationLayerInfo &act_info)

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1149

{

1150

// Create tensors

Georgios Pinitas

2019-05-21 13:32:43 +0100

[diff] [blame]

1151

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

1152

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

1153

TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1154

TensorType rhs_reshaped;

1155

TensorType dst;

1156

1157

const unsigned int M = lhs_shape[1];

1158

const unsigned int N = rhs_shape[0];

1159

const unsigned int K = lhs_shape[0];

Gian Marco Iodice

2019-06-26 17:18:11 +0100

[diff] [blame]

1160

GEMMKernelInfo kernel_info;

kernel_info.m = M;

kernel_info.n = N;

kernel_info.k = K;

kernel_info.depth_output_gemm3d = 0;

1165

kernel_info.reinterpret_input_as_3d = false;

1166

kernel_info.broadcast_bias = broadcast_bias;

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1167

kernel_info.activation_info = act_info;

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1168

1169

// The output tensor will be auto-initialized within the function

1170

1171

// Create and configure function

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1172

ReshapeRHSOperatorType reshape_rhs;

1173

GEMMOperatorType gemm;

Sheri Zhang

2020-11-16 21:17:28 +0000

[diff] [blame]

1174

1175

validate_result = bool(reshape_rhs.validate(rhs.info(), rhs_reshaped.info(), rhs_info));

1176

validate_result = validate_result || !rhs_info.export_to_cl_image;

if(!validate_result)

{

return nullptr;

}

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1182

reshape_rhs.configure(rhs.info(), rhs_reshaped.info(), rhs_info);

1183

gemm.configure(lhs.info(), rhs_reshaped.info(), bias.info(), dst.info(), alpha, beta, lhs_info, rhs_info, kernel_info);

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1184

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

1185

ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());

1186

ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());

1187

ARM_COMPUTE_ASSERT(bias.info()->is_resizable());

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1188

Georgios Pinitas

2021-04-13 13:35:58 +0100

[diff] [blame]

1189

// We do not pad when using image as it needs to comply to strict pitch alignment restrictions

Giorgio Arena

2021-03-25 14:54:50 +0000

[diff] [blame]

1190

if(!rhs_info.export_to_cl_image)

1191

{

1192

add_padding_x({ &lhs, &rhs, &rhs_reshaped, &bias, &dst });

1193

}

1194

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1195

// Allocate tensors

1196

lhs.allocator()->allocate();

1197

rhs.allocator()->allocate();

1198

rhs_reshaped.allocator()->allocate();

Georgios Pinitas

2019-05-21 13:32:43 +0100

[diff] [blame]

1199

bias.allocator()->allocate();

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1200

dst.allocator()->allocate();

1201

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

1202

ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());

1203

ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());

1204

ARM_COMPUTE_ASSERT(!rhs_reshaped.info()->is_resizable());

1205

ARM_COMPUTE_ASSERT(!bias.info()->is_resizable());

1206

ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1207

1208

// Fill tensors

1209

fill(AccessorType(lhs), 0);

1210

fill(AccessorType(rhs), 1);

Georgios Pinitas

2019-05-21 13:32:43 +0100

[diff] [blame]

1211

fill(AccessorType(bias), 2);

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1212

1213

// Compute GEMM

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1214

ITensorPack reshape_rhs_pack = { { ACL_SRC, &rhs }, { ACL_DST, &rhs_reshaped } };

1215

reshape_rhs.run(reshape_rhs_pack);

1216

ITensorPack gemm_pack({ { ACL_SRC_0, &lhs },

1217

{ ACL_SRC_1, &rhs_reshaped },

1218

{ ACL_SRC_2, &bias },

1219

{ ACL_DST, &dst }

1220

});

1221

gemm.run(gemm_pack);

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

return dst;

}

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

1226

SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, bool broadcast_bias,

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1227

const ActivationLayerInfo &act_info)

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1228

{

1229

TensorShape dst_shape = lhs_shape;

1230

dst_shape[0] = rhs_shape[0];

1231

dst_shape[1] = lhs_shape[1];

1232

1233

// Create reference

1234

SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };

1235

SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };

Georgios Pinitas

2019-05-21 13:32:43 +0100

[diff] [blame]

1236

SimpleTensor<T> bias{ dst_shape, data_type, 1 };

1237

1238

const int n = rhs_shape[0];

1239

const int m = lhs_shape[1];

1240

const int batch_size = lhs_shape[2];

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

// Fill reference

fill(lhs, 0);

fill(rhs, 1);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1245

fill(bias, 2);

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1246

Georgios Pinitas

2019-05-21 13:32:43 +0100

[diff] [blame]

1247

if(broadcast_bias)

1248

{

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1249

// In case of broadcast, we need simply copy the first into the following "M" ones

1250

for(int i = 1; i < m * batch_size; i++)

Georgios Pinitas

2019-05-21 13:32:43 +0100

[diff] [blame]

1251

{

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1252

memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));

Georgios Pinitas

2019-05-21 13:32:43 +0100

[diff] [blame]

1253

}

1254

}

Georgios Pinitas

2019-05-21 13:32:43 +0100

[diff] [blame]

1255

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1256

return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1257

}

1258

Sheri Zhang

2020-11-16 21:17:28 +0000

[diff] [blame]

1259

bool validate_result = true;

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1260

TensorType _target{};

1261

SimpleTensor<T> _reference{};

1262

};

1263

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1264

template <typename TensorType, typename AccessorType, typename T, typename ReshapeRHSOperatorType, typename GEMMOperatorType>

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1265

class GEMMMatrixMultiplyReshapedOnlyRHS3DValidationFixture : public framework::Fixture

1266

{

1267

public:

1268

template <typename...>

1269

void setup(unsigned int m_w, unsigned int m_h, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0, unsigned int h0,

Gian Marco Iodice

2020-10-22 16:37:12 +0100

[diff] [blame]

1270

bool interleave_rhs, bool transpose_rhs, bool export_to_cl_image, bool has_pad_y, DataType data_type, float alpha, float beta, const ActivationLayerInfo &act_info)

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1271

{

1272

GEMMLHSMatrixInfo lhs_info;

lhs_info.m0 = m0;

lhs_info.k0 = k0;

GEMMRHSMatrixInfo rhs_info;

Gian Marco Iodice

781cba7

2020-06-19 16:56:57 +0100

[diff] [blame]

rhs_info.n0 = n0;

rhs_info.k0 = k0;

rhs_info.h0 = h0;

rhs_info.interleave = interleave_rhs;

1281

rhs_info.transpose = transpose_rhs;

1282

rhs_info.export_to_cl_image = export_to_cl_image;

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1283

1284

// In case of GEMM3D, m is the product between m_w and m_h

1285

const unsigned int m = m_w * m_h;

1286

1287

// Set the tensor shapes for LHS and RHS matrices

1288

const TensorShape lhs_shape(k, m, batch_size);

1289

const TensorShape rhs_shape(n, k, batch_size);

1290

const TensorShape bias_shape(n, 1, 1);

1291

Sheri Zhang

2020-11-16 21:17:28 +0000

[diff] [blame]

1292

_target = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, m_h, act_info, has_pad_y);

1293

if(validate_result)

1294

{

1295

_reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, m_h, act_info);

1296

}

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

}

protected:

template <typename U>

1301

void fill(U &&tensor, int i)

1302

{

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

1303

static_assert(std::is_floating_point<T>::value || std::is_same<T, half>::value, "Only floating point data types supported.");

Giorgio Arena

2021-01-08 10:37:15 +0000

[diff] [blame]

1304

using DistributionType = typename std::conditional<std::is_same<T, half>::value, arm_compute::utils::uniform_real_distribution_16bit<T>, std::uniform_real_distribution<T>>::type;

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

1305

1306

DistributionType distribution{ T(-1.0f), T(1.0f) };

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1307

library->fill(tensor, distribution, i);

1308

}

1309

1310

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,

1311

DataType data_type, float alpha, float beta,

Gian Marco Iodice

2020-10-22 16:37:12 +0100

[diff] [blame]

1312

unsigned int m_h, const ActivationLayerInfo &act_info, bool has_pad_y)

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1313

{

1314

// Create tensors

1315

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

1316

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

1317

TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);

1318

TensorType rhs_reshaped;

1319

TensorType dst;

1320

1321

const unsigned int M = lhs_shape[1];

1322

const unsigned int N = rhs_shape[0];

1323

const unsigned int K = lhs_shape[0];

Gian Marco Iodice

2019-06-26 17:18:11 +0100

[diff] [blame]

1324

GEMMKernelInfo kernel_info;

kernel_info.m = M;

kernel_info.n = N;

kernel_info.k = K;

kernel_info.depth_output_gemm3d = m_h;

1329

kernel_info.reinterpret_input_as_3d = false;

1330

kernel_info.broadcast_bias = true;

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1331

kernel_info.activation_info = act_info;

Gian Marco Iodice

2020-10-22 16:37:12 +0100

[diff] [blame]

1332

kernel_info.has_pad_y = has_pad_y;

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1333

1334

// The output tensor will be auto-initialized within the function

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1335

// Create and configure function

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1336

ReshapeRHSOperatorType reshape_rhs;

1337

GEMMOperatorType gemm;

Sheri Zhang

2020-11-16 21:17:28 +0000

[diff] [blame]

1338

1339

validate_result = bool(reshape_rhs.validate(rhs.info(), rhs_reshaped.info(), rhs_info));

1340

validate_result = validate_result || !rhs_info.export_to_cl_image;

if(!validate_result)

{

return nullptr;

}

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1346

reshape_rhs.configure(rhs.info(), rhs_reshaped.info(), rhs_info);

1347

gemm.configure(lhs.info(), rhs_reshaped.info(), bias.info(), dst.info(), alpha, beta, lhs_info, rhs_info, kernel_info);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1348

Gian Marco Iodice

2020-10-22 16:37:12 +0100

[diff] [blame]

1349

if(has_pad_y)

1350

{

1351

// Add dummy padding into lhs to validate has_pad_y path

1352

lhs.info()->extend_padding(PaddingSize(2, 0, 2, 0));

1353

dst.info()->extend_padding(PaddingSize(2, 0, 1, 0));

1354

}

1355

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

1356

ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());

1357

ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());

1358

ARM_COMPUTE_ASSERT(bias.info()->is_resizable());

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1359

Georgios Pinitas

2021-04-13 13:35:58 +0100

[diff] [blame]

1360

// We do not pad when using image as it needs to comply to strict pitch alignment restrictions

Giorgio Arena

2021-03-25 14:54:50 +0000

[diff] [blame]

1361

if(!rhs_info.export_to_cl_image)

1362

{

1363

add_padding_x({ &lhs, &rhs, &rhs_reshaped, &bias, &dst });

1364

}

1365

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1366

// Allocate tensors

1367

lhs.allocator()->allocate();

1368

rhs.allocator()->allocate();

1369

rhs_reshaped.allocator()->allocate();

1370

bias.allocator()->allocate();

1371

dst.allocator()->allocate();

1372

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

1373

ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());

1374

ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());

1375

ARM_COMPUTE_ASSERT(!rhs_reshaped.info()->is_resizable());

1376

ARM_COMPUTE_ASSERT(!bias.info()->is_resizable());

1377

ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1378

1379

// Fill tensors

1380

fill(AccessorType(lhs), 0);

1381

fill(AccessorType(rhs), 1);

1382

fill(AccessorType(bias), 2);

1383

1384

// Compute GEMM

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1385

ITensorPack reshape_rhs_pack = { { ACL_SRC, &rhs }, { ACL_DST, &rhs_reshaped } };

1386

reshape_rhs.run(reshape_rhs_pack);

1387

ITensorPack gemm_pack({ { ACL_SRC_0, &lhs },

1388

{ ACL_SRC_1, &rhs_reshaped },

1389

{ ACL_SRC_2, &bias },

1390

{ ACL_DST, &dst }

1391

});

1392

gemm.run(gemm_pack);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

return dst;

}

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

1397

SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, unsigned int m_h,

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1398

const ActivationLayerInfo &act_info)

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1399

{

1400

TensorShape dst_shape = lhs_shape;

1401

dst_shape.set(0, rhs_shape[0]);

1402

dst_shape.set(1, lhs_shape[1] / m_h);

1403

dst_shape.set(2, m_h);

1404

dst_shape.set(3, lhs_shape[2]);

1405

1406

// Create reference

1407

SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };

1408

SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };

1409

SimpleTensor<T> bias{ dst_shape, data_type, 1 };

1410

1411

const int n = rhs_shape[0];

1412

const int m = lhs_shape[1];

1413

const int batch_size = lhs_shape[2];

// Fill reference

fill(lhs, 0);

fill(rhs, 1);

fill(bias, 2);

// In case of broadcast, we need simply copy the first into the following "M" ones

1421

for(int i = 1; i < m * batch_size; i++)

1422

{

1423

memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));

1424

}

1425

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1426

return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1427

}

1428

Sheri Zhang

2020-11-16 21:17:28 +0000

[diff] [blame]

1429

bool validate_result = true;

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1430

TensorType _target{};

1431

SimpleTensor<T> _reference{};

1432

};

1433

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1434

template <typename TensorType, typename AccessorType, typename T, typename GEMMOperatorType>

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1435

class GEMMMatrixMultiplyNativeValidationFixture : public framework::Fixture

1436

{

1437

public:

1438

template <typename...>

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1439

void setup(unsigned int m, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0, DataType data_type, float alpha, float beta, bool broadcast_bias,

1440

const ActivationLayerInfo &act_info)

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1441

{

1442

GEMMLHSMatrixInfo lhs_info;

lhs_info.m0 = m0;

lhs_info.k0 = k0;

GEMMRHSMatrixInfo rhs_info;

rhs_info.n0 = n0;

rhs_info.k0 = k0;

// Set the tensor shapes for LHS and RHS matrices

1451

const TensorShape lhs_shape(k, m, batch_size);

1452

const TensorShape rhs_shape(n, k, batch_size);

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

1453

const TensorShape bias_shape(n,

1454

broadcast_bias ? 1 : m,

1455

broadcast_bias ? 1 : batch_size);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1456

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1457

_target = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, broadcast_bias, act_info);

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

1458

_reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, broadcast_bias, act_info);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

}

protected:

template <typename U>

1463

void fill(U &&tensor, int i)

1464

{

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

1465

static_assert(std::is_floating_point<T>::value || std::is_same<T, half>::value, "Only floating point data types supported.");

Giorgio Arena

2021-01-08 10:37:15 +0000

[diff] [blame]

1466

using DistributionType = typename std::conditional<std::is_same<T, half>::value, arm_compute::utils::uniform_real_distribution_16bit<T>, std::uniform_real_distribution<T>>::type;

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

1467

1468

DistributionType distribution{ T(-1.0f), T(1.0f) };

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1469

library->fill(tensor, distribution, i);

1470

1471

// Fill border with infinity in order to check the presence of NaN values (i.e. inf * 0)

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

1472

DistributionType distribution_inf{ T(std::numeric_limits<float>::infinity()), T(std::numeric_limits<float>::infinity()) };

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1473

library->fill_borders_with_garbage(tensor, distribution_inf, i);

1474

}

1475

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

1476

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1477

DataType data_type, float alpha, float beta, bool broadcast_bias, const ActivationLayerInfo &act_info)

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1478

{

1479

// Create tensors

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

1480

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

1481

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

1482

TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1483

TensorType dst;

1484

1485

const unsigned int M = lhs_shape[1];

1486

const unsigned int N = rhs_shape[0];

1487

const unsigned int K = lhs_shape[0];

Gian Marco Iodice

2019-06-26 17:18:11 +0100

[diff] [blame]

1488

GEMMKernelInfo kernel_info;

kernel_info.m = M;

kernel_info.n = N;

kernel_info.k = K;

kernel_info.depth_output_gemm3d = 0;

1493

kernel_info.reinterpret_input_as_3d = false;

1494

kernel_info.broadcast_bias = broadcast_bias;

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1495

kernel_info.activation_info = act_info;

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1496

1497

// Create and configure function

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1498

GEMMOperatorType gemm;

1499

gemm.configure(lhs.info(), rhs.info(), bias.info(), dst.info(), alpha, beta, lhs_info, rhs_info, kernel_info);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1500

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

1501

ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());

1502

ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());

1503

ARM_COMPUTE_ASSERT(bias.info()->is_resizable());

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1504

Giorgio Arena

2021-03-25 14:54:50 +0000

[diff] [blame]

1505

add_padding_x({ &lhs, &rhs, &bias, &dst });

1506

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1507

// Allocate tensors

1508

lhs.allocator()->allocate();

1509

rhs.allocator()->allocate();

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

1510

bias.allocator()->allocate();

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1511

dst.allocator()->allocate();

1512

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

1513

ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());

1514

ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());

1515

ARM_COMPUTE_ASSERT(!bias.info()->is_resizable());

1516

ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1517

1518

// Fill tensors

1519

fill(AccessorType(lhs), 0);

1520

fill(AccessorType(rhs), 1);

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

1521

fill(AccessorType(bias), 2);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1522

1523

// Compute GEMM

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1524

ITensorPack gemm_pack({ { ACL_SRC_0, &lhs },

1525

{ ACL_SRC_1, &rhs },

1526

{ ACL_SRC_2, &bias },

1527

{ ACL_DST, &dst }

1528

});

1529

gemm.run(gemm_pack);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

return dst;

}

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

1534

SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, bool broadcast_bias,

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1535

const ActivationLayerInfo &act_info)

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1536

{

1537

TensorShape dst_shape = lhs_shape;

1538

dst_shape[0] = rhs_shape[0];

1539

dst_shape[1] = lhs_shape[1];

1540

1541

// Create reference

1542

SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };

1543

SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

1544

SimpleTensor<T> bias{ dst_shape, data_type, 1 };

1545

1546

const int n = rhs_shape[0];

1547

const int m = lhs_shape[1];

1548

const int batch_size = lhs_shape[2];

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

// Fill reference

fill(lhs, 0);

fill(rhs, 1);

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

1553

fill(bias, 2);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1554

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

1555

if(broadcast_bias)

1556

{

1557

// In case of broadcast, we need simply copy the first into the following "M" ones

1558

for(int i = 1; i < m * batch_size; i++)

1559

{

1560

memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));

}

}

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1564

return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1565

}

1566

1567

TensorType _target{};

1568

SimpleTensor<T> _reference{};

1569

};

1570

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1571

template <typename TensorType, typename AccessorType, typename T, typename GEMMOperatorType>

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1572

class GEMMMatrixMultiplyNative3DValidationFixture : public framework::Fixture

1573

{

1574

public:

1575

template <typename...>

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1576

void setup(unsigned int m_w, unsigned int m_h, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0, DataType data_type, float alpha, float beta,

1577

const ActivationLayerInfo &act_info)

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1578

{

1579

GEMMLHSMatrixInfo lhs_info;

lhs_info.m0 = m0;

lhs_info.k0 = k0;

GEMMRHSMatrixInfo rhs_info;

rhs_info.n0 = n0;

rhs_info.k0 = k0;

// In case of GEMM3D, m is the product between m_w and m_h

1588

const unsigned int m = m_w * m_h;

1589

1590

// Set the tensor shapes for LHS and RHS matrices

1591

const TensorShape lhs_shape(k, m, batch_size);

1592

const TensorShape rhs_shape(n, k, batch_size);

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

1593

const TensorShape bias_shape(n, 1, 1);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1594

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1595

_target = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, m_h, act_info);

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

1596

_reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, m_h, act_info);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

}

protected:

template <typename U>

1601

void fill(U &&tensor, int i)

1602

{

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

1603

static_assert(std::is_floating_point<T>::value || std::is_same<T, half>::value, "Only floating point data types supported.");

Giorgio Arena

2021-01-08 10:37:15 +0000

[diff] [blame]

1604

using DistributionType = typename std::conditional<std::is_same<T, half>::value, arm_compute::utils::uniform_real_distribution_16bit<T>, std::uniform_real_distribution<T>>::type;

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

1605

1606

DistributionType distribution{ T(-1.0f), T(1.0f) };

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1607

library->fill(tensor, distribution, i);

1608

}

1609

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

1610

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1611

DataType data_type, float alpha, float beta, unsigned int m_h, const ActivationLayerInfo &act_info)

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1612

{

1613

// Create tensors

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

1614

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

1615

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

1616

TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1617

TensorType dst;

1618

1619

const unsigned int M = lhs_shape[1];

1620

const unsigned int N = rhs_shape[0];

1621

const unsigned int K = lhs_shape[0];

Gian Marco Iodice

2019-06-26 17:18:11 +0100

[diff] [blame]

1622

GEMMKernelInfo kernel_info;

kernel_info.m = M;

kernel_info.n = N;

kernel_info.k = K;

kernel_info.depth_output_gemm3d = m_h;

1627

kernel_info.reinterpret_input_as_3d = false;

1628

kernel_info.broadcast_bias = true;

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1629

kernel_info.activation_info = act_info;

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1630

1631

// The output tensor will be auto-initialized within the function

1632

1633

// Create and configure function

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1634

GEMMOperatorType gemm;

1635

gemm.configure(lhs.info(), rhs.info(), bias.info(), dst.info(), alpha, beta, lhs_info, rhs_info, kernel_info);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1636

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

1637

ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());

1638

ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());

1639

ARM_COMPUTE_ASSERT(bias.info()->is_resizable());

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1640

Giorgio Arena

2021-03-25 14:54:50 +0000

[diff] [blame]

1641

add_padding_x({ &lhs, &rhs, &bias, &dst });

1642

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1643

// Allocate tensors

1644

lhs.allocator()->allocate();

1645

rhs.allocator()->allocate();

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

1646

bias.allocator()->allocate();

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1647

dst.allocator()->allocate();

1648

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

1649

ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());

1650

ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());

1651

ARM_COMPUTE_ASSERT(!bias.info()->is_resizable());

1652

ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1653

1654

// Fill tensors

1655

fill(AccessorType(lhs), 0);

1656

fill(AccessorType(rhs), 1);

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

1657

fill(AccessorType(bias), 2);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1658

1659

// Compute GEMM

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1660

ITensorPack gemm_pack({ { ACL_SRC_0, &lhs },

1661

{ ACL_SRC_1, &rhs },

1662

{ ACL_SRC_2, &bias },

1663

{ ACL_DST, &dst }

1664

});

1665

gemm.run(gemm_pack);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

return dst;

}

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

1670

SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, unsigned int m_h,

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1671

const ActivationLayerInfo &act_info)

giuros01