Blame - tests/validation/fixtures/GEMMFixture.h - ml/ComputeLibrary

2018-07-26 11:44:03 +0100

[diff] [blame]

52

class GEMMValidationFixture : public framework::Fixture

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

53

{

54

public:

55

template <typename...>

Pablo Tello

2018-10-30 11:18:37 +0000

[diff] [blame]

56

void setup(TensorShape shape_a, TensorShape shape_b, TensorShape shape_c, TensorShape output_shape, float alpha, float beta, bool pretranspose, DataType data_type)

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

57

{

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

58

ARM_COMPUTE_UNUSED(pretranspose);

59

_target = compute_target(shape_a, shape_b, shape_c, output_shape, alpha, beta, data_type);

60

_reference = compute_reference(shape_a, shape_b, output_shape, alpha, beta, data_type);

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

}

protected:

template <typename U>

Pablo Tello

2018-10-30 11:18:37 +0000

[diff] [blame]

65

void fill(U &&tensor, int i, float lo = -1.f, float hi = 1.f)

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

66

{

67

switch(tensor.data_type())

68

{

69

case DataType::F16:

Giorgio Arena

6aeb217

2020-12-15 15:45:43 +0000

[diff] [blame]

70

{

Giorgio Arena

a8e2aeb

2021-01-06 11:34:57 +0000

[diff] [blame]

71

arm_compute::utils::uniform_real_distribution_16bit<half> distribution{ float(lo), float(hi) };

Giorgio Arena

6aeb217

2020-12-15 15:45:43 +0000

[diff] [blame]

72

library->fill(tensor, distribution, i);

73

break;

74

}

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

75

case DataType::F32:

76

{

Giorgio Arena

6aeb217

2020-12-15 15:45:43 +0000

[diff] [blame]

77

std::uniform_real_distribution<float> distribution(lo, hi);

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

78

library->fill(tensor, distribution, i);

break;

}

default:

library->fill_tensor_uniform(tensor, i);

}

}

TensorType compute_target(const TensorShape &shape_a, const TensorShape &shape_b, const TensorShape &shape_c, const TensorShape &output_shape, float alpha, float beta,

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

87

DataType data_type)

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

88

{

89

// Create tensors

Vidhya Sudhan Loganathan

014333d

2018-07-02 09:13:49 +0100

[diff] [blame]

90

TensorType a = create_tensor<TensorType>(shape_a, data_type, 1);

91

TensorType b = create_tensor<TensorType>(shape_b, data_type, 1);

92

TensorType c = create_tensor<TensorType>(shape_c, data_type, 1);

93

TensorType dst = create_tensor<TensorType>(output_shape, data_type, 1);

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

94

95

// Create and configure function

96

FunctionType gemm;

Isabella Gottardi

8e74f44

2018-03-01 16:42:00 +0000

[diff] [blame]

97

// The GEMMinfo includes the values of the depth in case of reinterpreted 3d output.

Gian Marco Iodice

3139f03

2018-11-05 14:26:32 +0000

[diff] [blame]

98

// If the output shape has the same number of dimensions of the input the method called is a 2D matrix multiplication (depth_output_reinterpreted_as_3D = 0),

Isabella Gottardi

8e74f44

2018-03-01 16:42:00 +0000

[diff] [blame]

99

// in the other case we have to use the reinterpreted version of GEMM (depth_output_reinterpreted_as_3D = depth of the 3D output).

Gian Marco Iodice

2019-07-29 14:27:16 +0100

[diff] [blame]

100

gemm.configure(&a,

101

&b,

102

(disable_c) ? nullptr : &c,

103

&dst,

104

alpha, beta,

Georgios Pinitas

4ee8b15

2021-07-16 16:16:43 +0100

[diff] [blame]

105

GEMMInfo(false, false, false, (reinterpret_output_as_3d ? output_shape[2] : 0), reinterpret_input_as_3d, false, GEMMLowpOutputStageInfo(), false, false, (reinterpret_input_as_3d

Gian Marco Iodice

2019-07-29 14:27:16 +0100

[diff] [blame]

106

|| reinterpret_output_as_3d)));

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

107

ARM_COMPUTE_ASSERT(a.info()->is_resizable());

108

ARM_COMPUTE_ASSERT(b.info()->is_resizable());

109

ARM_COMPUTE_ASSERT(c.info()->is_resizable());

110

ARM_COMPUTE_ASSERT(dst.info()->is_resizable());

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

111

Giorgio Arena

2021-03-25 14:54:50 +0000

[diff] [blame]

112

add_padding_x({ &a, &b, &c, &dst });

113

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

114

// Allocate tensors

115

a.allocator()->allocate();

116

b.allocator()->allocate();

117

c.allocator()->allocate();

118

dst.allocator()->allocate();

119

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

120

ARM_COMPUTE_ASSERT(!a.info()->is_resizable());

121

ARM_COMPUTE_ASSERT(!b.info()->is_resizable());

122

ARM_COMPUTE_ASSERT(!c.info()->is_resizable());

123

ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

124

125

// Fill tensors

126

fill(AccessorType(a), 0);

127

fill(AccessorType(b), 1);

Pablo Tello

2018-10-30 11:18:37 +0000

[diff] [blame]

128

if(!disable_c)

129

{

130

fill(AccessorType(c), 2);

131

}

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

132

Mohammed Suhail Munshi

13a2d00

2022-09-05 11:57:34 +0100

[diff] [blame^]

133

// Run with variable inputs.

if(run_twice)

{

gemm.run();

fill(AccessorType(a), 3); // Fill tensors with new seed after run

138

fill(AccessorType(b), 4);

139

if(!disable_c)

140

{

141

fill(AccessorType(c), 5);

}

}

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

145

// Compute GEMM function

gemm.run();

return dst;

}

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

151

SimpleTensor<T> compute_reference(const TensorShape &shape_a, const TensorShape &shape_b, const TensorShape &output_shape, float alpha, float beta,

Vidhya Sudhan Loganathan

014333d

2018-07-02 09:13:49 +0100

[diff] [blame]

152

DataType data_type)

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

153

{

Gian Marco Iodice

2018-07-26 11:44:03 +0100

[diff] [blame]

154

TensorShape shape_a_to_use = shape_a;

Gian Marco Iodice

2019-07-29 14:27:16 +0100

[diff] [blame]

155

Gian Marco Iodice

2018-07-26 11:44:03 +0100

[diff] [blame]

156

if(reinterpret_input_as_3d)

157

{

158

// Collapse the second and third dimension if the input is 3D

159

shape_a_to_use.collapse(2U, 1U);

160

}

161

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

162

// Create reference

Gian Marco Iodice

2018-07-26 11:44:03 +0100

[diff] [blame]

163

SimpleTensor<T> a{ shape_a_to_use, data_type, 1 };

Vidhya Sudhan Loganathan

014333d

2018-07-02 09:13:49 +0100

[diff] [blame]

164

SimpleTensor<T> b{ shape_b, data_type, 1 };

Gian Marco Iodice

2019-07-29 14:27:16 +0100

[diff] [blame]

165

SimpleTensor<T> c{ output_shape, data_type, 1 };

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

// Fill reference

fill(a, 0);

fill(b, 1);

Gian Marco Iodice

2019-07-29 14:27:16 +0100

[diff] [blame]

170

fill(c, 2);

171

172

if(reinterpret_input_as_3d || reinterpret_output_as_3d)

Pablo Tello

2018-10-30 11:18:37 +0000

[diff] [blame]

173

{

Gian Marco Iodice

2019-07-29 14:27:16 +0100

[diff] [blame]

174

const int n = shape_b[0];

175

const int m = reinterpret_output_as_3d ? output_shape[1] * output_shape[2] : output_shape[1];

176

const int batch_size = reinterpret_output_as_3d ? output_shape[3] : output_shape[2];

177

Gunes Bayir

2021-12-10 16:17:56 +0000

[diff] [blame]

178

// In case of broadcast, we need to simply copy the first into the following "M" ones

Gian Marco Iodice

2019-07-29 14:27:16 +0100

[diff] [blame]

179

for(int i = 1; i < m * batch_size; i++)

180

{

181

memcpy(c.data() + i * n, c.data(), n * sizeof(T));

182

}

Pablo Tello

2018-10-30 11:18:37 +0000

[diff] [blame]

183

}

Gunes Bayir

2021-12-10 16:17:56 +0000

[diff] [blame]

184

Adnan AlSinan

3bb72b6

2022-05-06 12:10:11 +0100

[diff] [blame]

185

/* Note: Assuming the usual batch matmul dimensions A = (B x M x K), B = (B x K x N), if pretranspose_A is set to true, then A is assumed to be (B x K x M),

186

therefore, A must be pre-transposed before passing it to the fixture. And, we transpose A again in the fixture to make it (B x M x K)

187

in order to be able to call reference implementation that works with (B x M x K) input.

188

Similarly, if pretranspose_B is set to true, then B is assumed to be (B x N x K), B must be pre-transposed before passing it to the fixture. */

Gunes Bayir

2021-12-10 16:17:56 +0000

[diff] [blame]

189

Mohammed Suhail Munshi

bc5c407

2022-04-27 13:49:51 +0100

[diff] [blame]

190

// Define transposed shapes

191

TensorShape a_transposed_shape(a.shape().y(), a.shape().x());

192

TensorShape b_transposed_shape(b.shape().y(), b.shape().x());

193

194

// Define transposed tensors

195

SimpleTensor<T> a_transposed{ a_transposed_shape, data_type };

196

SimpleTensor<T> b_transposed{ b_transposed_shape, data_type };

197

198

// pretranspose a if necessary

199

if(pretranspose_a)

200

{

201

transpose_matrix<T>(a, a_transposed);

202

}

203

204

// pretranspose b if necessary

205

if(pretranspose_b)

206

{

207

transpose_matrix<T>(b, b_transposed);

208

}

209

Mohammed Suhail Munshi

13a2d00

2022-09-05 11:57:34 +0100

[diff] [blame^]

210

// Run with variable inputs.

211

if(run_twice)

212

{

213

reference::gemm<T>((pretranspose_a) ? a_transposed : a, (pretranspose_b) ? b_transposed : b, c, alpha, disable_c ? 0.f : beta);

214

fill((pretranspose_a) ? a_transposed : a, 3);

215

fill((pretranspose_b) ? b_transposed : b, 4);

fill(c , 5);

}

Gian Marco Iodice

2019-07-29 14:27:16 +0100

[diff] [blame]

219

// Setting beta to 0 will effectively disable C for the

220

// computation of the reference: alpha * A * B + 0 * C

Mohammed Suhail Munshi

bc5c407

2022-04-27 13:49:51 +0100

[diff] [blame]

221

// Use transposed tensors if boolean enabled else use original tensors

Mohammed Suhail Munshi

13a2d00

2022-09-05 11:57:34 +0100

[diff] [blame^]

222

auto r = reference::gemm<T>((pretranspose_a) ? a_transposed : a, (pretranspose_b) ? b_transposed : b, c, alpha, disable_c ? 0.f : beta);

223

return r;

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

224

}

225

226

TensorType _target{};

227

SimpleTensor<T> _reference{};

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

228

};

229

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

230

template <typename TensorType, typename AccessorType, typename T, typename GEMMOperatorType>

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

231

class GEMMMatrixMultiplyValidationFixture : public framework::Fixture

232

{

233

public:

234

template <typename...>

235

void setup(unsigned int m, unsigned int n, unsigned int k, unsigned int batch_size, float alpha, float beta, bool broadcast_bias, bool fp16_mixed_precision, const ActivationLayerInfo &act_info,

236

DataType data_type, GPUTarget gpu_arch)

237

{

238

// Set the tensor shapes for LHS and RHS matrices

239

const TensorShape lhs_shape(k, m, batch_size);

240

const TensorShape rhs_shape(n, k, batch_size);

241

const TensorShape bias_shape(n,

242

broadcast_bias ? 1 : m,

243

broadcast_bias ? 1 : batch_size);

244

245

_target = compute_target(lhs_shape, rhs_shape, bias_shape, data_type, alpha, beta, broadcast_bias, fp16_mixed_precision, act_info, gpu_arch);

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

246

_reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, broadcast_bias, act_info);

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

}

protected:

template <typename U>

251

void fill(U &&tensor, int i)

252

{

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

253

static_assert(std::is_floating_point<T>::value || std::is_same<T, half>::value, "Only floating point data types supported.");

Giorgio Arena

2021-01-08 10:37:15 +0000

[diff] [blame]

254

using DistributionType = typename std::conditional<std::is_same<T, half>::value, arm_compute::utils::uniform_real_distribution_16bit<T>, std::uniform_real_distribution<T>>::type;

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

255

256

DistributionType distribution{ T(-1.0f), T(1.0f) };

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

257

library->fill(tensor, distribution, i);

258

259

// Fill border with infinity in order to check the presence of NaN values (i.e. inf * 0)

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

260

DistributionType distribution_inf{ T(std::numeric_limits<float>::infinity()), T(std::numeric_limits<float>::infinity()) };

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

261

library->fill_borders_with_garbage(tensor, distribution_inf, i);

262

}

263

264

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, DataType data_type, float alpha, float beta, bool broadcast_bias,

265

bool fp16_mixed_precision, const ActivationLayerInfo &act_info, GPUTarget gpu_arch)

266

{

267

// Create tensors

268

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

269

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

270

TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);

271

TensorType dst;

272

273

const unsigned int m = lhs_shape[1];

274

const unsigned int n = rhs_shape[0];

275

const unsigned int k = lhs_shape[0];

276

GEMMReshapeInfo reshape_info(m, n, k, 1, 1, 0, false, broadcast_bias);

277

278

// The output tensor will be auto-initialized within the function

279

280

// Create and configure function

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

281

GEMMOperatorType gemm;

282

gemm.configure(gpu_arch, lhs.info(), rhs.info(), bias.info(), dst.info(), alpha, beta, false, reshape_info, fp16_mixed_precision, act_info);

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

283

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

284

ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());

285

ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());

286

ARM_COMPUTE_ASSERT(bias.info()->is_resizable());

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

287

Giorgio Arena

2021-03-25 14:54:50 +0000

[diff] [blame]

288

add_padding_x({ &lhs, &rhs, &bias, &dst });

289

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

290

// Allocate tensors

291

lhs.allocator()->allocate();

292

rhs.allocator()->allocate();

293

bias.allocator()->allocate();

294

dst.allocator()->allocate();

295

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

296

ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());

297

ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());

298

ARM_COMPUTE_ASSERT(!bias.info()->is_resizable());

299

ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

300

301

// Fill tensors

302

fill(AccessorType(lhs), 0);

303

fill(AccessorType(rhs), 1);

304

fill(AccessorType(bias), 2);

305

306

// Compute GEMM

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

307

ITensorPack gemm_pack({ { ACL_SRC_0, &lhs },

308

{ ACL_SRC_1, &rhs },

309

{ ACL_SRC_2, &bias },

310

{ ACL_DST, &dst }

311

});

312

gemm.run(gemm_pack);

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

return dst;

}

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

317

SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, bool broadcast_bias,

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

318

const ActivationLayerInfo &act_info)

319

{

320

TensorShape dst_shape = lhs_shape;

321

dst_shape[0] = rhs_shape[0];

322

dst_shape[1] = lhs_shape[1];

323

324

// Create reference

325

SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };

326

SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };

327

SimpleTensor<T> bias{ dst_shape, data_type, 1 };

328

329

const int n = rhs_shape[0];

330

const int m = lhs_shape[1];

331

const int batch_size = lhs_shape[2];

// Fill reference

fill(lhs, 0);

fill(rhs, 1);

fill(bias, 2);

if(broadcast_bias)

{

Gunes Bayir

2021-12-10 16:17:56 +0000

[diff] [blame]

340

// In case of broadcast, we need to simply copy the first into the following "M" ones

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

341

for(int i = 1; i < m * batch_size; i++)

342

{

343

memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));

}

}

return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);

348

}

349

350

TensorType _target{};

351

SimpleTensor<T> _reference{};

352

};

353

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

354

template <typename TensorType, typename AccessorType, typename T, typename GEMMOperatorType>

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

355

class GEMMMatrixMultiply3DValidationFixture : public framework::Fixture

356

{

357

public:

358

template <typename...>

359

void setup(unsigned int m_w, unsigned int m_h, unsigned int n, unsigned int k, unsigned int batch_size, float alpha, float beta, bool broadcast_bias, bool fp16_mixed_precision,

360

const ActivationLayerInfo &act_info, DataType data_type, GPUTarget gpu_arch)

361

{

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

362

ARM_COMPUTE_UNUSED(broadcast_bias);

363

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

364

// In case of GEMM3D, m is the product between m_w and m_h

365

const unsigned int m = m_w * m_h;

366

367

// Set the tensor shapes for LHS and RHS matrices

368

const TensorShape lhs_shape(k, m, batch_size);

369

const TensorShape rhs_shape(n, k, batch_size);

370

const TensorShape bias_shape(n, 1, 1);

371

372

_target = compute_target(lhs_shape, rhs_shape, bias_shape, data_type, alpha, beta, m_h, fp16_mixed_precision, act_info, gpu_arch);

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

373

_reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, m_h, act_info);

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

}

protected:

template <typename U>

378

void fill(U &&tensor, int i)

379

{

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

380

static_assert(std::is_floating_point<T>::value || std::is_same<T, half>::value, "Only floating point data types supported.");

Giorgio Arena

2021-01-08 10:37:15 +0000

[diff] [blame]

381

using DistributionType = typename std::conditional<std::is_same<T, half>::value, arm_compute::utils::uniform_real_distribution_16bit<T>, std::uniform_real_distribution<T>>::type;

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

382

383

DistributionType distribution{ T(-1.0f), T(1.0f) };

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

384

library->fill(tensor, distribution, i);

385

}

386

387

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, DataType data_type, float alpha, float beta, unsigned int m_h,

388

bool fp16_mixed_precision, const ActivationLayerInfo &act_info, GPUTarget gpu_arch)

389

{

390

// Create tensors

391

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

392

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

393

TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);

394

TensorType dst;

395

396

const unsigned int m = lhs_shape[1];

397

const unsigned int n = rhs_shape[0];

398

const unsigned int k = lhs_shape[0];

399

GEMMReshapeInfo reshape_info(m, n, k, 1, 1, m_h, false, true);

400

401

// The output tensor will be auto-initialized within the function

402

403

// Create and configure function

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

404

GEMMOperatorType gemm;

405

gemm.configure(gpu_arch, lhs.info(), rhs.info(), bias.info(), dst.info(), alpha, beta, false, reshape_info, fp16_mixed_precision, act_info);

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

406

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

407

ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());

408

ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());

409

ARM_COMPUTE_ASSERT(bias.info()->is_resizable());

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

410

Giorgio Arena

2021-03-25 14:54:50 +0000

[diff] [blame]

411

add_padding_x({ &lhs, &rhs, &bias, &dst });

412

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

413

// Allocate tensors

414

lhs.allocator()->allocate();

415

rhs.allocator()->allocate();

416

bias.allocator()->allocate();

417

dst.allocator()->allocate();

418

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

419

ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());

420

ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());

421

ARM_COMPUTE_ASSERT(!bias.info()->is_resizable());

422

ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

423

424

// Fill tensors

425

fill(AccessorType(lhs), 0);

426

fill(AccessorType(rhs), 1);

427

fill(AccessorType(bias), 2);

428

429

// Compute GEMM

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

430

ITensorPack gemm_pack({ { ACL_SRC_0, &lhs },

431

{ ACL_SRC_1, &rhs },

432

{ ACL_SRC_2, &bias },

433

{ ACL_DST, &dst }

434

});

435

gemm.run(gemm_pack);

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

return dst;

}

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

440

SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, unsigned int m_h,

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

441

const ActivationLayerInfo &act_info)

442

{

443

TensorShape dst_shape = lhs_shape;

444

dst_shape.set(0, rhs_shape[0]);

445

dst_shape.set(1, lhs_shape[1] / m_h);

446

dst_shape.set(2, m_h);

447

dst_shape.set(3, lhs_shape[2]);

448

449

// Create reference

450

SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };

451

SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };

452

SimpleTensor<T> bias{ dst_shape, data_type, 1 };

453

454

const int n = rhs_shape[0];

455

const int m = lhs_shape[1];

456

const int batch_size = lhs_shape[2];

// Fill reference

fill(lhs, 0);

fill(rhs, 1);

fill(bias, 2);

Gunes Bayir

2021-12-10 16:17:56 +0000

[diff] [blame]

463

// In case of broadcast, we need to simply copy the first into the following "M" ones

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

464

for(int i = 1; i < m * batch_size; i++)

465

{

466

memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));

467

}

468

469

return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);

470

}

471

472

TensorType _target{};

473

SimpleTensor<T> _reference{};

474

};

475

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

476

template <typename TensorType, typename AccessorType, typename T, typename ReshapeLHSOperatorType, typename ReshapeRHSOperatorType, typename GEMMOperatorType>

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

477

class GEMMMatrixMultiplyInterleavedTransposedValidationFixture : public framework::Fixture

478

{

479

public:

480

template <typename...>

481

void setup(unsigned int m, unsigned int n, unsigned int k, unsigned int batch_size, float alpha, float beta, unsigned int v0, unsigned int h0, bool broadcast_bias, bool fp16_mixed_precision,

482

const ActivationLayerInfo &act_info, DataType data_type, GPUTarget gpu_arch)

483

{

484

GEMMLHSMatrixInfo lhs_info;

lhs_info.m0 = 4;

lhs_info.k0 = 4;

lhs_info.v0 = v0;

lhs_info.interleave = true;

489

lhs_info.transpose = true;

490

491

GEMMRHSMatrixInfo rhs_info;

492

rhs_info.n0 = 16 / sizeof(T);

493

rhs_info.k0 = 1;

494

rhs_info.h0 = h0;

495

rhs_info.interleave = false;

496

rhs_info.transpose = false;

497

498

// Set the tensor shapes for LHS and RHS matrices

499

const TensorShape lhs_shape(k, m, batch_size);

500

const TensorShape rhs_shape(n, k, batch_size);

501

const TensorShape bias_shape(n,

502

broadcast_bias ? 1 : m,

503

broadcast_bias ? 1 : batch_size);

504

505

_target = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, broadcast_bias, fp16_mixed_precision, act_info, gpu_arch);

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

506

_reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, broadcast_bias, act_info);

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

}

protected:

template <typename U>

511

void fill(U &&tensor, int i)

512

{

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

513

static_assert(std::is_floating_point<T>::value || std::is_same<T, half>::value, "Only floating point data types supported.");

Giorgio Arena

2021-01-08 10:37:15 +0000

[diff] [blame]

514

using DistributionType = typename std::conditional<std::is_same<T, half>::value, arm_compute::utils::uniform_real_distribution_16bit<T>, std::uniform_real_distribution<T>>::type;

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

515

516

DistributionType distribution{ T(-1.0f), T(1.0f) };

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

517

library->fill(tensor, distribution, i);

518

519

// Fill border with infinity in order to check the presence of NaN values (i.e. inf * 0)

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

520

DistributionType distribution_inf{ T(std::numeric_limits<float>::infinity()), T(std::numeric_limits<float>::infinity()) };

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

521

library->fill_borders_with_garbage(tensor, distribution_inf, i);

522

}

523

524

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,

525

DataType data_type, float alpha, float beta, bool broadcast_bias, bool fp16_mixed_precision, const ActivationLayerInfo &act_info, GPUTarget gpu_arch)

526

{

527

// Create tensors

528

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

529

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

530

TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);

531

TensorType lhs_reshaped;

532

TensorType rhs_reshaped;

533

TensorType dst;

534

535

const unsigned int m = lhs_shape[1];

536

const unsigned int n = rhs_shape[0];

537

const unsigned int k = lhs_shape[0];

538

GEMMReshapeInfo reshape_info(m, n, k, rhs_info.h0, lhs_info.v0, 0, false, broadcast_bias);

539

540

// The output tensor will be auto-initialized within the function

541

542

// Create and configure function

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

543

ReshapeLHSOperatorType reshape_lhs;

544

ReshapeRHSOperatorType reshape_rhs;

545

GEMMOperatorType gemm;

546

reshape_lhs.configure(lhs.info(), lhs_reshaped.info(), lhs_info);

547

reshape_rhs.configure(rhs.info(), rhs_reshaped.info(), rhs_info);

548

gemm.configure(gpu_arch, lhs_reshaped.info(), rhs_reshaped.info(), bias.info(), dst.info(), alpha, beta, true, reshape_info, fp16_mixed_precision, act_info);

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

549

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

550

ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());

551

ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());

552

ARM_COMPUTE_ASSERT(bias.info()->is_resizable());

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

553

Georgios Pinitas

2021-04-13 13:35:58 +0100

[diff] [blame]

554

// We do not pad when using image as it needs to comply to strict pitch alignment restrictions

Giorgio Arena

2021-03-25 14:54:50 +0000

[diff] [blame]

555

if(!rhs_info.export_to_cl_image)

556

{

557

add_padding_x({ &lhs, &rhs, &lhs_reshaped, &rhs_reshaped, &bias, &dst });

558

}

559

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

560

// Allocate tensors

561

lhs.allocator()->allocate();

562

rhs.allocator()->allocate();

563

lhs_reshaped.allocator()->allocate();

564

rhs_reshaped.allocator()->allocate();

565

bias.allocator()->allocate();

566

dst.allocator()->allocate();

567

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

568

ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());

569

ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());

570

ARM_COMPUTE_ASSERT(!bias.info()->is_resizable());

571

ARM_COMPUTE_ASSERT(!lhs_reshaped.info()->is_resizable());

572

ARM_COMPUTE_ASSERT(!rhs_reshaped.info()->is_resizable());

573

ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

574

575

// Fill tensors

576

fill(AccessorType(lhs), 0);

577

fill(AccessorType(rhs), 1);

578

fill(AccessorType(bias), 2);

579

580

// Compute GEMM

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

581

ITensorPack reshape_lhs_pack = { { ACL_SRC, &lhs }, { ACL_DST, &lhs_reshaped } };

582

reshape_lhs.run(reshape_lhs_pack);

583

ITensorPack reshape_rhs_pack = { { ACL_SRC, &rhs }, { ACL_DST, &rhs_reshaped } };

584

reshape_rhs.run(reshape_rhs_pack);

585

ITensorPack gemm_pack({ { ACL_SRC_0, &lhs_reshaped },

586

{ ACL_SRC_1, &rhs_reshaped },

587

{ ACL_SRC_2, &bias },

588

{ ACL_DST, &dst }

589

});

590

gemm.run(gemm_pack);

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

return dst;

}

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

595

SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, bool broadcast_bias,

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

596

const ActivationLayerInfo &act_info)

597

{

598

TensorShape dst_shape = lhs_shape;

599

dst_shape[0] = rhs_shape[0];

600

dst_shape[1] = lhs_shape[1];

601

602

// Create reference

603

SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };

604

SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };

605

SimpleTensor<T> bias{ dst_shape, data_type, 1 };

606

607

const int n = rhs_shape[0];

608

const int m = lhs_shape[1];

609

const int batch_size = lhs_shape[2];

// Fill reference

fill(lhs, 0);

fill(rhs, 1);

fill(bias, 2);

if(broadcast_bias)

{

Gunes Bayir

2021-12-10 16:17:56 +0000

[diff] [blame]

618

// In case of broadcast, we need to simply copy the first into the following "M" ones

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

619

for(int i = 1; i < m * batch_size; i++)

620

{

621

memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));

}

}

return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);

626

}

627

628

TensorType _target{};

629

SimpleTensor<T> _reference{};

630

};

631

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

632

template <typename TensorType, typename AccessorType, typename T, typename ReshapeLHSOperatorType, typename ReshapeRHSOperatorType, typename GEMMOperatorType>

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

633

class GEMMMatrixMultiplyInterleavedTransposed3DValidationFixture : public framework::Fixture

634

{

635

public:

636

template <typename...>

637

void setup(unsigned int m_w, unsigned int m_h, unsigned int n, unsigned int k, unsigned int batch_size, float alpha, float beta, unsigned int v0, unsigned int h0, bool broadcast_bias,

638

bool fp16_mixed_precision, const ActivationLayerInfo &act_info, DataType data_type, GPUTarget gpu_arch)

639

{

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

640

ARM_COMPUTE_UNUSED(broadcast_bias);

641

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

642

GEMMLHSMatrixInfo lhs_info;

lhs_info.m0 = 4;

lhs_info.k0 = 4;

lhs_info.v0 = v0;

lhs_info.interleave = true;

647

lhs_info.transpose = true;

648

649

GEMMRHSMatrixInfo rhs_info;

650

rhs_info.n0 = 16 / sizeof(T);

651

rhs_info.k0 = 1;

652

rhs_info.h0 = h0;

653

rhs_info.interleave = false;

654

rhs_info.transpose = false;

655

656

// In case of GEMM3D, m is the product between m_w and m_h

657

const unsigned int m = m_w * m_h;

658

659

// Set the tensor shapes for LHS and RHS matrices

660

const TensorShape lhs_shape(k, m, batch_size);

661

const TensorShape rhs_shape(n, k, batch_size);

662

const TensorShape bias_shape(n, 1, 1);

663

664

_target = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, m_h, fp16_mixed_precision, act_info, gpu_arch);

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

665

_reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, m_h, act_info);

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

}

protected:

template <typename U>

670

void fill(U &&tensor, int i)

671

{

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

672

static_assert(std::is_floating_point<T>::value || std::is_same<T, half>::value, "Only floating point data types supported.");

Giorgio Arena

2021-01-08 10:37:15 +0000

[diff] [blame]

673

using DistributionType = typename std::conditional<std::is_same<T, half>::value, arm_compute::utils::uniform_real_distribution_16bit<T>, std::uniform_real_distribution<T>>::type;

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

674

675

DistributionType distribution{ T(-1.0f), T(1.0f) };

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

676

library->fill(tensor, distribution, i);

677

}

678

679

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,

680

DataType data_type, float alpha, float beta, unsigned int m_h, bool fp16_mixed_precision, const ActivationLayerInfo &act_info, GPUTarget gpu_arch)

681

{

682

// Create tensors

683

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

684

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

685

TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);

686

TensorType lhs_reshaped;

687

TensorType rhs_reshaped;

688

TensorType dst;

689

690

const unsigned int m = lhs_shape[1];

691

const unsigned int n = rhs_shape[0];

692

const unsigned int k = lhs_shape[0];

693

GEMMReshapeInfo reshape_info(m, n, k, rhs_info.h0, lhs_info.v0, m_h, false, true);

694

695

// The output tensor will be auto-initialized within the function

696

697

// Create and configure function

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

698

ReshapeLHSOperatorType reshape_lhs;

699

ReshapeRHSOperatorType reshape_rhs;

700

GEMMOperatorType gemm;

701

reshape_lhs.configure(lhs.info(), lhs_reshaped.info(), lhs_info);

702

reshape_rhs.configure(rhs.info(), rhs_reshaped.info(), rhs_info);

703

gemm.configure(gpu_arch, lhs_reshaped.info(), rhs_reshaped.info(), bias.info(), dst.info(), alpha, beta, true, reshape_info, fp16_mixed_precision, act_info);

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

704

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

705

ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());

706

ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());

707

ARM_COMPUTE_ASSERT(bias.info()->is_resizable());

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

708

Georgios Pinitas

2021-04-13 13:35:58 +0100

[diff] [blame]

709

// We do not pad when using image as it needs to comply to strict pitch alignment restrictions

Giorgio Arena

2021-03-25 14:54:50 +0000

[diff] [blame]

710

if(!rhs_info.export_to_cl_image)

711

{

712

add_padding_x({ &lhs, &rhs, &lhs_reshaped, &rhs_reshaped, &bias, &dst });

713

}

714

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

715

// Allocate tensors

716

lhs.allocator()->allocate();

717

rhs.allocator()->allocate();

718

lhs_reshaped.allocator()->allocate();

719

rhs_reshaped.allocator()->allocate();

720

bias.allocator()->allocate();

721

dst.allocator()->allocate();

722

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

723

ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());

724

ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());

725

ARM_COMPUTE_ASSERT(!lhs_reshaped.info()->is_resizable());

726

ARM_COMPUTE_ASSERT(!rhs_reshaped.info()->is_resizable());

727

ARM_COMPUTE_ASSERT(!bias.info()->is_resizable());

728

ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

729

730

// Fill tensors

731

fill(AccessorType(lhs), 0);

732

fill(AccessorType(rhs), 1);

733

fill(AccessorType(bias), 2);

734

735

// Compute GEMM

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

736

ITensorPack reshape_lhs_pack = { { ACL_SRC, &lhs }, { ACL_DST, &lhs_reshaped } };

737

reshape_lhs.run(reshape_lhs_pack);

738

ITensorPack reshape_rhs_pack = { { ACL_SRC, &rhs }, { ACL_DST, &rhs_reshaped } };

739

reshape_rhs.run(reshape_rhs_pack);

740

ITensorPack gemm_pack({ { ACL_SRC_0, &lhs_reshaped },

741

{ ACL_SRC_1, &rhs_reshaped },

742

{ ACL_SRC_2, &bias },

743

{ ACL_DST, &dst }

744

});

745

gemm.run(gemm_pack);

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

return dst;

}

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

750

SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, unsigned int m_h,

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

751

const ActivationLayerInfo &act_info)

752

{

753

TensorShape dst_shape = lhs_shape;

754

dst_shape.set(0, rhs_shape[0]);

755

dst_shape.set(1, lhs_shape[1] / m_h);

756

dst_shape.set(2, m_h);

757

dst_shape.set(3, lhs_shape[2]);

758

759

// Create reference

760

SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };

761

SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };

762

SimpleTensor<T> bias{ dst_shape, data_type, 1 };

763

764

const int n = rhs_shape[0];

765

const int m = lhs_shape[1];

766

const int batch_size = lhs_shape[2];

// Fill reference

fill(lhs, 0);

fill(rhs, 1);

fill(bias, 2);

Gunes Bayir

2021-12-10 16:17:56 +0000

[diff] [blame]

773

// In case of broadcast, we need to simply copy the first into the following "M" ones

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

774

for(int i = 1; i < m * batch_size; i++)

775

{

776

memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));

777

}

778

779

return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);

780

}

781

782

TensorType _target{};

783

SimpleTensor<T> _reference{};

784

};

785

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

786

template <typename TensorType, typename AccessorType, typename T, typename ReshapeLHSOperatorType, typename ReshapeRHSOperatorType, typename GEMMOperatorType, bool fp_mixed_precision = false>

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

787

class GEMMMatrixMultiplyReshapedValidationFixture : public framework::Fixture

788

{

789

public:

790

template <typename...>

791

void setup(unsigned int m, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0, unsigned int v0, unsigned int h0, bool interleave_lhs,

Gian Marco Iodice

2020-06-10 17:59:30 +0100

[diff] [blame]

792

bool interleave_rhs, bool export_to_cl_image, DataType data_type, float alpha, float beta, bool broadcast_bias, bool lhs_transpose, const ActivationLayerInfo &act_info)

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

793

{

794

GEMMLHSMatrixInfo lhs_info;

lhs_info.m0 = m0;

lhs_info.k0 = k0;

lhs_info.v0 = v0;

lhs_info.interleave = interleave_lhs;

Giorgio Arena

ae99b6e

2019-08-01 14:22:12 +0100

[diff] [blame]

799

lhs_info.transpose = lhs_transpose;

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

800

801

GEMMRHSMatrixInfo rhs_info;

Gian Marco Iodice

2020-06-10 17:59:30 +0100

[diff] [blame]

rhs_info.n0 = n0;

rhs_info.k0 = k0;

rhs_info.h0 = h0;

rhs_info.interleave = interleave_rhs;

806

rhs_info.transpose = !lhs_transpose;

807

rhs_info.export_to_cl_image = export_to_cl_image;

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

808

809

// Set the tensor shapes for LHS and RHS matrices

810

const TensorShape lhs_shape(k, m, batch_size);

811

const TensorShape rhs_shape(n, k, batch_size);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

812

const TensorShape bias_shape(n,

813

broadcast_bias ? 1 : m,

814

broadcast_bias ? 1 : batch_size);

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

815

Sheri Zhang

2020-11-16 21:17:28 +0000

[diff] [blame]

816

_target = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, broadcast_bias, act_info);

817

if(validate_result)

818

{

819

_reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, broadcast_bias, act_info);

820

}

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

}

protected:

template <typename U>

825

void fill(U &&tensor, int i)

826

{

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

827

static_assert(std::is_floating_point<T>::value || std::is_same<T, half>::value, "Only floating point data types supported.");

Giorgio Arena

2021-01-08 10:37:15 +0000

[diff] [blame]

828

using DistributionType = typename std::conditional<std::is_same<T, half>::value, arm_compute::utils::uniform_real_distribution_16bit<T>, std::uniform_real_distribution<T>>::type;

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

829

830

DistributionType distribution{ T(-1.0f), T(1.0f) };

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

831

library->fill(tensor, distribution, i);

Gian Marco Iodice

b87b95e

2019-01-21 17:14:31 +0000

[diff] [blame]

832

833

// Fill border with infinity in order to check the presence of NaN values (i.e. inf * 0)

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

834

DistributionType distribution_inf{ T(std::numeric_limits<float>::infinity()), T(std::numeric_limits<float>::infinity()) };

Gian Marco Iodice

b87b95e

2019-01-21 17:14:31 +0000

[diff] [blame]

835

library->fill_borders_with_garbage(tensor, distribution_inf, i);

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

836

}

837

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

838

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

839

DataType data_type, float alpha, float beta, bool broadcast_bias, const ActivationLayerInfo &act_info)

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

840

{

841

// Create tensors

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

842

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

843

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

844

TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

845

TensorType lhs_reshaped;

846

TensorType rhs_reshaped;

847

TensorType dst;

848

849

const unsigned int M = lhs_shape[1];

850

const unsigned int N = rhs_shape[0];

851

const unsigned int K = lhs_shape[0];

Gian Marco Iodice

2019-06-26 17:18:11 +0100

[diff] [blame]

852

GEMMKernelInfo kernel_info;

kernel_info.m = M;

kernel_info.n = N;

kernel_info.k = K;

kernel_info.depth_output_gemm3d = 0;

857

kernel_info.reinterpret_input_as_3d = false;

858

kernel_info.broadcast_bias = broadcast_bias;

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

859

kernel_info.activation_info = act_info;

Gian Marco Iodice

0c17aa2

2019-09-27 09:23:15 +0100

[diff] [blame]

860

kernel_info.fp_mixed_precision = fp_mixed_precision;

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

861

862

// The output tensor will be auto-initialized within the function

863

864

// Create and configure function

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

865

ReshapeLHSOperatorType reshape_lhs;

866

ReshapeRHSOperatorType reshape_rhs;

867

GEMMOperatorType gemm;

Sheri Zhang

2020-11-16 21:17:28 +0000

[diff] [blame]

868

869

validate_result = bool(reshape_rhs.validate(rhs.info(), rhs_reshaped.info(), rhs_info));

870

validate_result = validate_result || !rhs_info.export_to_cl_image;

if(!validate_result)

{

return nullptr;

}

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

876

reshape_lhs.configure(lhs.info(), lhs_reshaped.info(), lhs_info);

877

reshape_rhs.configure(rhs.info(), rhs_reshaped.info(), rhs_info);

878

gemm.configure(lhs_reshaped.info(), rhs_reshaped.info(), bias.info(), dst.info(), alpha, beta, lhs_info, rhs_info, kernel_info);

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

879

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

880

ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());

881

ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());

882

ARM_COMPUTE_ASSERT(bias.info()->is_resizable());

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

883

Georgios Pinitas

2021-04-13 13:35:58 +0100

[diff] [blame]

884

// We do not pad when using image as it needs to comply to strict pitch alignment restrictions

Giorgio Arena

2021-03-25 14:54:50 +0000

[diff] [blame]

885

if(!rhs_info.export_to_cl_image)

886

{

887

add_padding_x({ &lhs, &rhs, &lhs_reshaped, &rhs_reshaped, &bias, &dst });

888

}

889

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

890

// Allocate tensors

891

lhs.allocator()->allocate();

892

rhs.allocator()->allocate();

893

lhs_reshaped.allocator()->allocate();

894

rhs_reshaped.allocator()->allocate();

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

895

bias.allocator()->allocate();

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

896

dst.allocator()->allocate();

897

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

898

ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());

899

ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());

900

ARM_COMPUTE_ASSERT(!bias.info()->is_resizable());

901

ARM_COMPUTE_ASSERT(!lhs_reshaped.info()->is_resizable());

902

ARM_COMPUTE_ASSERT(!rhs_reshaped.info()->is_resizable());

903

ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

904

905

// Fill tensors

906

fill(AccessorType(lhs), 0);

907

fill(AccessorType(rhs), 1);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

908

fill(AccessorType(bias), 2);

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

909

910

// Compute GEMM

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

911

ITensorPack reshape_lhs_pack = { { ACL_SRC, &lhs }, { ACL_DST, &lhs_reshaped } };

912

reshape_lhs.run(reshape_lhs_pack);

913

ITensorPack reshape_rhs_pack = { { ACL_SRC, &rhs }, { ACL_DST, &rhs_reshaped } };

914

reshape_rhs.run(reshape_rhs_pack);

915

ITensorPack gemm_pack({ { ACL_SRC_0, &lhs_reshaped },

916

{ ACL_SRC_1, &rhs_reshaped },

917

{ ACL_SRC_2, &bias },

918

{ ACL_DST, &dst }

919

});

920

gemm.run(gemm_pack);

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

return dst;

}

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

925

SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, bool broadcast_bias,

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

926

const ActivationLayerInfo &act_info)

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

927

{

928

TensorShape dst_shape = lhs_shape;

929

dst_shape[0] = rhs_shape[0];

930

dst_shape[1] = lhs_shape[1];

931

932

// Create reference

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

933

SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };

934

SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

935

SimpleTensor<T> bias{ dst_shape, data_type, 1 };

936

937

const int n = rhs_shape[0];

938

const int m = lhs_shape[1];

939

const int batch_size = lhs_shape[2];

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

// Fill reference

fill(lhs, 0);

fill(rhs, 1);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

944

fill(bias, 2);

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

945

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

946

if(broadcast_bias)

947

{

Gunes Bayir

2021-12-10 16:17:56 +0000

[diff] [blame]

948

// In case of broadcast, we need to simply copy the first into the following "M" ones

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

949

for(int i = 1; i < m * batch_size; i++)

950

{

951

memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));

}

}

Gian Marco Iodice

2019-09-27 09:23:15 +0100

[diff] [blame]

955

if(fp_mixed_precision)

956

{

957

return reference::activation_layer(reference::gemm_mixed_precision<T>(lhs, rhs, bias, alpha, beta), act_info);

}

else

{

return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);

962

}

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

963

}

964

Sheri Zhang

2020-11-16 21:17:28 +0000

[diff] [blame]

965

bool validate_result = true;

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

966

TensorType _target{};

967

SimpleTensor<T> _reference{};

968

};

969

SiCongLi

1af5416

2021-10-06 15:25:57 +0100

[diff] [blame]

970

/** (EXPERIMENTAL_POST_OPS)*/

971

template <typename TensorType, typename AccessorType, typename T, typename ReshapeLHSOperatorType, typename ReshapeRHSOperatorType, typename GEMMOperatorType, bool fp_mixed_precision = false>

972

class GEMMMatrixMultiplyReshapedWithPostOpsValidationFixture : public framework::Fixture

973

{

974

public:

975

using PostOpArgBroadcast = std::tuple<bool, bool, bool>; // Instruct fixture if we need broadcasting in dimension 0, 1, 2 of each PostOp argument

976

public:

977

template <typename...>

978

void setup(unsigned int m, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0, unsigned int v0, unsigned int h0, bool interleave_lhs,

979

bool interleave_rhs, bool export_to_cl_image, DataType data_type, float alpha, float beta, bool broadcast_bias, bool lhs_transpose, const ActivationLayerInfo &act_info,

980

const experimental::PostOpList<PostOpArgBroadcast> &post_ops)

981

{

982

GEMMLHSMatrixInfo lhs_info;

lhs_info.m0 = m0;

lhs_info.k0 = k0;

lhs_info.v0 = v0;

lhs_info.interleave = interleave_lhs;

987

lhs_info.transpose = lhs_transpose;

988

989

GEMMRHSMatrixInfo rhs_info;

rhs_info.n0 = n0;

rhs_info.k0 = k0;

rhs_info.h0 = h0;

rhs_info.interleave = interleave_rhs;

994

rhs_info.transpose = !lhs_transpose;

995

rhs_info.export_to_cl_image = export_to_cl_image;

996

997

// Set the tensor shapes for LHS and RHS matrices

998

const TensorShape lhs_shape(k, m, batch_size);

999

const TensorShape rhs_shape(n, k, batch_size);

1000

const TensorShape bias_shape(n,

1001

broadcast_bias ? 1 : m,

1002

broadcast_bias ? 1 : batch_size);

1003

auto post_ops_with_shapes = experimental::transform_post_op_list_arguments<PostOpArgBroadcast, TensorShape>(post_ops,

1004

[ = ](auto broadcast)

{

return TensorShape

{

std::get<0>(broadcast) ? 1 : n,

1009

std::get<1>(broadcast) ? 1 : m,

1010

std::get<2>(broadcast) ? 1 : batch_size,

};

});

_target = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, broadcast_bias, act_info, post_ops_with_shapes);

1015

if(validate_result)

1016

{

1017

_reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, broadcast_bias, act_info, post_ops_with_shapes);

}

}

protected:

template <typename U>

1023

void fill(U &&tensor, int i)

1024

{

1025

static_assert(std::is_floating_point<T>::value || std::is_same<T, half>::value, "Only floating point data types supported.");

1026

using DistributionType = typename std::conditional<std::is_same<T, half>::value, arm_compute::utils::uniform_real_distribution_16bit<T>, std::uniform_real_distribution<T>>::type;

1027

1028

DistributionType distribution{ T(-1.0f), T(1.0f) };

1029

library->fill(tensor, distribution, i);

1030

1031

// Fill border with infinity in order to check the presence of NaN values (i.e. inf * 0)

1032

DistributionType distribution_inf{ T(std::numeric_limits<float>::infinity()), T(std::numeric_limits<float>::infinity()) };

1033

library->fill_borders_with_garbage(tensor, distribution_inf, i);

1034

}

1035

1036

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,

1037

DataType data_type, float alpha, float beta, bool broadcast_bias, const ActivationLayerInfo &act_info, const experimental::PostOpList<TensorShape> &post_ops)

1038

{

1039

// Create tensors

1040

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

1041

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

1042

TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);

1043

1044

// Create post op tensors and populate post op with them

1045

std::vector<TensorType> post_op_tensors_holder{};

1046

auto populated_post_ops = experimental::transform_post_op_list_arguments<TensorShape, ITensorInfo *>(post_ops,

1047

[&post_op_tensors_holder, &data_type](auto shape)

1048

{

1049

auto t = create_tensor<TensorType>(shape, data_type, 1);

1050

post_op_tensors_holder.push_back(std::move(t));

1051

return post_op_tensors_holder.back().info();

1052

});

1053

TensorType lhs_reshaped;

1054

TensorType rhs_reshaped;

1055

TensorType dst;

1056

1057

const unsigned int M = lhs_shape[1];

1058

const unsigned int N = rhs_shape[0];

1059

const unsigned int K = lhs_shape[0];

1060

GEMMKernelInfo kernel_info;

kernel_info.m = M;

kernel_info.n = N;

kernel_info.k = K;

kernel_info.depth_output_gemm3d = 0;

1065

kernel_info.reinterpret_input_as_3d = false;

1066

kernel_info.broadcast_bias = broadcast_bias;

1067

kernel_info.activation_info = act_info;

1068

kernel_info.fp_mixed_precision = fp_mixed_precision;

1069

kernel_info.post_ops = populated_post_ops;

1070

1071

// The output tensor will be auto-initialized within the function

1072

1073

// Create and configure function

1074

ReshapeLHSOperatorType reshape_lhs;

1075

ReshapeRHSOperatorType reshape_rhs;

1076

GEMMOperatorType gemm;

1077

1078

validate_result = bool(reshape_rhs.validate(rhs.info(), rhs_reshaped.info(), rhs_info));

1079

validate_result = validate_result || !rhs_info.export_to_cl_image;

if(!validate_result)

{

return nullptr;

}

reshape_lhs.configure(lhs.info(), lhs_reshaped.info(), lhs_info);

1086

reshape_rhs.configure(rhs.info(), rhs_reshaped.info(), rhs_info);

1087

gemm.configure(lhs_reshaped.info(), rhs_reshaped.info(), bias.info(), dst.info(), alpha, beta, lhs_info, rhs_info, kernel_info);

1088

1089

ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());

1090

ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());

1091

ARM_COMPUTE_ASSERT(bias.info()->is_resizable());

1092

for(const auto &tensor : post_op_tensors_holder)

1093

{

1094

ARM_COMPUTE_ASSERT(tensor.info()->is_resizable());

1095

}

1096

1097

// We do not pad when using image as it needs to comply to strict pitch alignment restrictions

1098

if(!rhs_info.export_to_cl_image)

1099

{

1100

add_padding_x({ &lhs, &rhs, &lhs_reshaped, &rhs_reshaped, &bias, &dst });

1101

for(auto &tensor : post_op_tensors_holder)

1102

{

1103

add_padding_x({ &tensor });

}

}

// Allocate tensors

lhs.allocator()->allocate();

1109

rhs.allocator()->allocate();

1110

lhs_reshaped.allocator()->allocate();

1111

rhs_reshaped.allocator()->allocate();

1112

bias.allocator()->allocate();

1113

dst.allocator()->allocate();

1114

for(auto &tensor : post_op_tensors_holder)

1115

{

1116

tensor.allocator()->allocate();

1117

}

1118

1119

ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());

1120

ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());

1121

ARM_COMPUTE_ASSERT(!bias.info()->is_resizable());

1122

ARM_COMPUTE_ASSERT(!lhs_reshaped.info()->is_resizable());

1123

ARM_COMPUTE_ASSERT(!rhs_reshaped.info()->is_resizable());

1124

ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());

1125

for(const auto &tensor : post_op_tensors_holder)

1126

{

1127

ARM_COMPUTE_ASSERT(!tensor.info()->is_resizable());

}

// Fill tensors

fill(AccessorType(lhs), 0);

1132

fill(AccessorType(rhs), 1);

1133

fill(AccessorType(bias), 2);

1134

for(size_t i = 0; i < post_op_tensors_holder.size(); ++i)

1135

{

1136

fill(AccessorType(post_op_tensors_holder.at(i)), 3 + i);

}

// Compute GEMM

ITensorPack reshape_lhs_pack = { { ACL_SRC, &lhs }, { ACL_DST, &lhs_reshaped } };

1141

reshape_lhs.run(reshape_lhs_pack);

1142

ITensorPack reshape_rhs_pack = { { ACL_SRC, &rhs }, { ACL_DST, &rhs_reshaped } };

1143

reshape_rhs.run(reshape_rhs_pack);

1144

ITensorPack gemm_pack({ { ACL_SRC_0, &lhs_reshaped },

1145

{ ACL_SRC_1, &rhs_reshaped },

1146

{ ACL_SRC_2, &bias },

1147

{ ACL_DST, &dst }

1148

});

1149

for(size_t i = 0; i < post_op_tensors_holder.size(); ++i)

1150

{

1151

gemm_pack.add_tensor(experimental::get_post_op_arg_type(i), &post_op_tensors_holder.at(i));

}

gemm.run(gemm_pack);

return dst;

}

SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, bool broadcast_bias,

1159

const ActivationLayerInfo &act_info, const experimental::PostOpList<TensorShape> &post_ops)

1160

{

1161

TensorShape dst_shape = lhs_shape;

1162

dst_shape[0] = rhs_shape[0];

1163

dst_shape[1] = lhs_shape[1];

1164

1165

// Create reference

1166

SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };

1167

SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };

1168

SimpleTensor<T> bias{ dst_shape, data_type, 1 };

1169

// Create post op tensors and populate post op with them

1170

auto populated_post_ops = experimental::transform_post_op_list_arguments<TensorShape, SimpleTensor<T>>(post_ops, [&data_type](auto shape)

1171

{

1172

return SimpleTensor<T> { shape, data_type, 1 };

1173

});

1174

1175

const int n = rhs_shape[0];

1176

const int m = lhs_shape[1];

1177

const int batch_size = lhs_shape[2];

// Fill reference

int tensor_idx = 0;

fill(lhs, tensor_idx++);

1182

fill(rhs, tensor_idx++);

1183

fill(bias, tensor_idx++);

1184

for(auto &op : populated_post_ops.get_list())

1185

{

1186

for(auto tensor : op->arguments())

1187

{

1188

fill(*tensor, tensor_idx++);

}

}

if(broadcast_bias)

{

Gunes Bayir

2021-12-10 16:17:56 +0000

[diff] [blame]

1194

// In case of broadcast, we need to simply copy the first into the following "M" ones

SiCongLi

1af5416

2021-10-06 15:25:57 +0100

[diff] [blame]

1195

for(int i = 1; i < m * batch_size; i++)

1196

{

1197

memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));

}

}

SimpleTensor<T> out;

if(fp_mixed_precision)

1203

{

1204

out = reference::gemm_mixed_precision<T>(lhs, rhs, bias, alpha, beta);

}

else

{

out = reference::gemm<T>(lhs, rhs, bias, alpha, beta);

1209

}

1210

// Ignore activation info if post ops are used instead

1211

if(populated_post_ops.size() > 0)

1212

{

1213

out = reference::post_ops<T>(out, populated_post_ops);

}

else

{

out = reference::activation_layer(out, act_info);

}

return out;

}

bool validate_result = true;

1223

TensorType _target{};

1224

SimpleTensor<T> _reference{};

1225

};

1226

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1227

template <typename TensorType, typename AccessorType, typename T, typename ReshapeLHSOperatorType, typename ReshapeRHSOperatorType, typename GEMMOperatorType, bool fp_mixed_precision = false>

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

1228

class GEMMMatrixMultiplyReshaped3DValidationFixture : public framework::Fixture

1229

{

1230

public:

1231

template <typename...>

1232

void setup(unsigned int m_w, unsigned int m_h, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0, unsigned int v0, unsigned int h0,

Gian Marco Iodice

2020-06-10 17:59:30 +0100

[diff] [blame]

1233

bool interleave_lhs, bool interleave_rhs, bool export_to_cl_image, DataType data_type, float alpha, float beta, bool lhs_transpose, const ActivationLayerInfo &act_info)

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

1234

{

1235

GEMMLHSMatrixInfo lhs_info;

lhs_info.m0 = m0;

lhs_info.k0 = k0;

lhs_info.v0 = v0;

lhs_info.interleave = interleave_lhs;

Giorgio Arena

ae99b6e

2019-08-01 14:22:12 +0100

[diff] [blame]

1240

lhs_info.transpose = lhs_transpose;

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

1241

1242

GEMMRHSMatrixInfo rhs_info;

Gian Marco Iodice

2020-06-10 17:59:30 +0100

[diff] [blame]

rhs_info.n0 = n0;

rhs_info.k0 = k0;

rhs_info.h0 = h0;

rhs_info.interleave = interleave_rhs;

1247

rhs_info.transpose = !lhs_transpose;

1248

rhs_info.export_to_cl_image = export_to_cl_image;

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

1249

1250

// In case of GEMM3D, m is the product between m_w and m_h

1251

const unsigned int m = m_w * m_h;

1252

1253

// Set the tensor shapes for LHS and RHS matrices

1254

const TensorShape lhs_shape(k, m, batch_size);

1255

const TensorShape rhs_shape(n, k, batch_size);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1256

const TensorShape bias_shape(n, 1, 1);

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

1257

Sheri Zhang

2020-11-16 21:17:28 +0000

[diff] [blame]

1258

_target = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, m_h, act_info);

1259

if(validate_result)

1260

{

1261

_reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, m_h, act_info);

1262

}

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

}

protected:

template <typename U>

1267

void fill(U &&tensor, int i)

1268

{

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

1269

static_assert(std::is_floating_point<T>::value || std::is_same<T, half>::value, "Only floating point data types supported.");

Giorgio Arena

2021-01-08 10:37:15 +0000

[diff] [blame]

1270

using DistributionType = typename std::conditional<std::is_same<T, half>::value, arm_compute::utils::uniform_real_distribution_16bit<T>, std::uniform_real_distribution<T>>::type;

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

1271

1272

DistributionType distribution{ T(-1.0f), T(1.0f) };

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

1273

library->fill(tensor, distribution, i);

1274

}

1275

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1276

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1277

DataType data_type, float alpha, float beta, unsigned int m_h, const ActivationLayerInfo &act_info)

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

1278

{

1279

// Create tensors

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1280

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

1281

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

1282

TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

1283

TensorType lhs_reshaped;

1284

TensorType rhs_reshaped;

1285

TensorType dst;

1286

1287

const unsigned int M = lhs_shape[1];

1288

const unsigned int N = rhs_shape[0];

1289

const unsigned int K = lhs_shape[0];

Gian Marco Iodice

2019-06-26 17:18:11 +0100

[diff] [blame]

1290

GEMMKernelInfo kernel_info;

kernel_info.m = M;

kernel_info.n = N;

kernel_info.k = K;

kernel_info.depth_output_gemm3d = m_h;

1295

kernel_info.reinterpret_input_as_3d = false;

1296

kernel_info.broadcast_bias = true;

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1297

kernel_info.activation_info = act_info;

Gian Marco Iodice

0c17aa2

2019-09-27 09:23:15 +0100

[diff] [blame]

1298

kernel_info.fp_mixed_precision = fp_mixed_precision;

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

1299

1300

// The output tensor will be auto-initialized within the function

1301

1302

// Create and configure function

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1303

ReshapeLHSOperatorType reshape_lhs;

1304

ReshapeRHSOperatorType reshape_rhs;

1305

GEMMOperatorType gemm;

Sheri Zhang

2020-11-16 21:17:28 +0000

[diff] [blame]

1306

1307

validate_result = bool(reshape_rhs.validate(rhs.info(), rhs_reshaped.info(), rhs_info));

1308

validate_result = validate_result || !rhs_info.export_to_cl_image;

if(!validate_result)

{

return nullptr;

}

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1314

reshape_lhs.configure(lhs.info(), lhs_reshaped.info(), lhs_info);

1315

reshape_rhs.configure(rhs.info(), rhs_reshaped.info(), rhs_info);

1316

gemm.configure(lhs_reshaped.info(), rhs_reshaped.info(), bias.info(), dst.info(), alpha, beta, lhs_info, rhs_info, kernel_info);

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

1317

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

1318

ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());

1319

ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());

1320

ARM_COMPUTE_ASSERT(bias.info()->is_resizable());

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

1321

Georgios Pinitas

2021-04-13 13:35:58 +0100

[diff] [blame]

1322

// We do not pad when using image as it needs to comply to strict pitch alignment restrictions

Giorgio Arena

2021-03-25 14:54:50 +0000

[diff] [blame]

1323

if(!rhs_info.export_to_cl_image)

1324

{

1325

add_padding_x({ &lhs, &rhs, &lhs_reshaped, &rhs_reshaped, &bias, &dst });

1326

}

1327

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

1328

// Allocate tensors

1329

lhs.allocator()->allocate();

1330

rhs.allocator()->allocate();

1331

lhs_reshaped.allocator()->allocate();

1332

rhs_reshaped.allocator()->allocate();

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1333

bias.allocator()->allocate();

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

1334

dst.allocator()->allocate();

1335

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

1336

ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());

1337

ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());

1338

ARM_COMPUTE_ASSERT(!lhs_reshaped.info()->is_resizable());

1339

ARM_COMPUTE_ASSERT(!rhs_reshaped.info()->is_resizable());

1340

ARM_COMPUTE_ASSERT(!bias.info()->is_resizable());

1341

ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

1342

1343

// Fill tensors

1344

fill(AccessorType(lhs), 0);

1345

fill(AccessorType(rhs), 1);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1346

fill(AccessorType(bias), 2);

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

1347

1348

// Compute GEMM

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1349

ITensorPack reshape_lhs_pack = { { ACL_SRC, &lhs }, { ACL_DST, &lhs_reshaped } };

1350

reshape_lhs.run(reshape_lhs_pack);

1351

ITensorPack reshape_rhs_pack = { { ACL_SRC, &rhs }, { ACL_DST, &rhs_reshaped } };

1352

reshape_rhs.run(reshape_rhs_pack);

1353

ITensorPack gemm_pack({ { ACL_SRC_0, &lhs_reshaped },

1354

{ ACL_SRC_1, &rhs_reshaped },

1355

{ ACL_SRC_2, &bias },

1356

{ ACL_DST, &dst }

1357

});

1358

gemm.run(gemm_pack);

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

return dst;

}

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

1363

SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, unsigned int m_h,

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1364

const ActivationLayerInfo &act_info)

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

1365

{

1366

TensorShape dst_shape = lhs_shape;

1367

dst_shape.set(0, rhs_shape[0]);

1368

dst_shape.set(1, lhs_shape[1] / m_h);

1369

dst_shape.set(2, m_h);

1370

dst_shape.set(3, lhs_shape[2]);

1371

1372

// Create reference

1373

SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };

1374

SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1375

SimpleTensor<T> bias{ dst_shape, data_type, 1 };

1376

1377

const int n = rhs_shape[0];

1378

const int m = lhs_shape[1];

1379

const int batch_size = lhs_shape[2];

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

// Fill reference

fill(lhs, 0);

fill(rhs, 1);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1384

fill(bias, 2);

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

1385

Gunes Bayir

2021-12-10 16:17:56 +0000

[diff] [blame]

1386

// In case of broadcast, we need to simply copy the first into the following "M" ones

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1387

for(int i = 1; i < m * batch_size; i++)

1388

{

1389

memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));

1390

}

1391

Gian Marco Iodice

0c17aa2

2019-09-27 09:23:15 +0100

[diff] [blame]

1392

if(fp_mixed_precision)

1393

{

1394

return reference::activation_layer(reference::gemm_mixed_precision<T>(lhs, rhs, bias, alpha, beta), act_info);

}

else

{

return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);

1399

}

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

1400

}

1401

Sheri Zhang

2020-11-16 21:17:28 +0000

[diff] [blame]

1402

bool validate_result = true;

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

1403

TensorType _target{};

1404

SimpleTensor<T> _reference{};

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

1405

};

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1406

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1407

template <typename TensorType, typename AccessorType, typename T, typename ReshapeRHSOperatorType, typename GEMMOperatorType>

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1408

class GEMMMatrixMultiplyReshapedOnlyRHSValidationFixture : public framework::Fixture

1409

{

1410

public:

1411

template <typename...>

1412

void setup(unsigned int m, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0, unsigned int h0,

Gian Marco Iodice

781cba7

2020-06-19 16:56:57 +0100

[diff] [blame]

1413

bool interleave_rhs, bool transpose_rhs, bool export_to_cl_image, DataType data_type, float alpha, float beta, bool broadcast_bias, const ActivationLayerInfo &act_info)

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1414

{

1415

GEMMLHSMatrixInfo lhs_info;

lhs_info.m0 = m0;

lhs_info.k0 = k0;

GEMMRHSMatrixInfo rhs_info;

Gian Marco Iodice

781cba7

2020-06-19 16:56:57 +0100

[diff] [blame]

rhs_info.n0 = n0;

rhs_info.k0 = k0;

rhs_info.h0 = h0;

rhs_info.interleave = interleave_rhs;

1424

rhs_info.transpose = transpose_rhs;

1425

rhs_info.export_to_cl_image = export_to_cl_image;

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1426

1427

// Set the tensor shapes for LHS and RHS matrices

1428

const TensorShape lhs_shape(k, m, batch_size);

1429

const TensorShape rhs_shape(n, k, batch_size);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1430

const TensorShape bias_shape(n,

1431

broadcast_bias ? 1 : m,

1432

broadcast_bias ? 1 : batch_size);

Georgios Pinitas

2019-05-21 13:32:43 +0100

[diff] [blame]

1433

Sheri Zhang

2020-11-16 21:17:28 +0000

[diff] [blame]

1434

_target = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, broadcast_bias, act_info);

1435

if(validate_result)

1436

{

1437

_reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, broadcast_bias, act_info);

1438

}

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

}

protected:

template <typename U>

1443

void fill(U &&tensor, int i)

1444

{

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

1445

static_assert(std::is_floating_point<T>::value || std::is_same<T, half>::value, "Only floating point data types supported.");

Giorgio Arena

2021-01-08 10:37:15 +0000

[diff] [blame]

1446

using DistributionType = typename std::conditional<std::is_same<T, half>::value, arm_compute::utils::uniform_real_distribution_16bit<T>, std::uniform_real_distribution<T>>::type;

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

1447

1448

DistributionType distribution{ T(-1.0f), T(1.0f) };

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1449

library->fill(tensor, distribution, i);

1450

1451

// Fill border with infinity in order to check the presence of NaN values (i.e. inf * 0)

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

1452

DistributionType distribution_inf{ T(std::numeric_limits<float>::infinity()), T(std::numeric_limits<float>::infinity()) };

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1453

library->fill_borders_with_garbage(tensor, distribution_inf, i);

1454

}

1455

Georgios Pinitas

2019-05-21 13:32:43 +0100

[diff] [blame]

1456

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1457

DataType data_type, float alpha, float beta, bool broadcast_bias, const ActivationLayerInfo &act_info)

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1458

{

1459

// Create tensors

Georgios Pinitas

2019-05-21 13:32:43 +0100

[diff] [blame]

1460

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

1461

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

1462

TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1463

TensorType rhs_reshaped;

1464

TensorType dst;

1465

1466

const unsigned int M = lhs_shape[1];

1467

const unsigned int N = rhs_shape[0];

1468

const unsigned int K = lhs_shape[0];

Gian Marco Iodice

2019-06-26 17:18:11 +0100

[diff] [blame]

1469

GEMMKernelInfo kernel_info;

kernel_info.m = M;

kernel_info.n = N;

kernel_info.k = K;

kernel_info.depth_output_gemm3d = 0;

1474

kernel_info.reinterpret_input_as_3d = false;

1475

kernel_info.broadcast_bias = broadcast_bias;

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1476

kernel_info.activation_info = act_info;

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1477

1478

// The output tensor will be auto-initialized within the function

1479

1480

// Create and configure function

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1481

ReshapeRHSOperatorType reshape_rhs;

1482

GEMMOperatorType gemm;

Sheri Zhang

2020-11-16 21:17:28 +0000

[diff] [blame]

1483

1484

validate_result = bool(reshape_rhs.validate(rhs.info(), rhs_reshaped.info(), rhs_info));

1485

validate_result = validate_result || !rhs_info.export_to_cl_image;

if(!validate_result)

{

return nullptr;

}

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1491

reshape_rhs.configure(rhs.info(), rhs_reshaped.info(), rhs_info);

1492

gemm.configure(lhs.info(), rhs_reshaped.info(), bias.info(), dst.info(), alpha, beta, lhs_info, rhs_info, kernel_info);

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1493

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

1494

ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());

1495

ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());

1496

ARM_COMPUTE_ASSERT(bias.info()->is_resizable());

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1497

Georgios Pinitas

2021-04-13 13:35:58 +0100

[diff] [blame]

1498

// We do not pad when using image as it needs to comply to strict pitch alignment restrictions

Giorgio Arena

2021-03-25 14:54:50 +0000

[diff] [blame]

1499

if(!rhs_info.export_to_cl_image)

1500

{

1501

add_padding_x({ &lhs, &rhs, &rhs_reshaped, &bias, &dst });

1502

}

1503

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1504

// Allocate tensors

1505

lhs.allocator()->allocate();

1506

rhs.allocator()->allocate();

1507

rhs_reshaped.allocator()->allocate();

Georgios Pinitas

2019-05-21 13:32:43 +0100

[diff] [blame]

1508

bias.allocator()->allocate();

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1509

dst.allocator()->allocate();

1510

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

1511

ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());

1512

ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());

1513

ARM_COMPUTE_ASSERT(!rhs_reshaped.info()->is_resizable());

1514

ARM_COMPUTE_ASSERT(!bias.info()->is_resizable());

1515

ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1516

1517

// Fill tensors

1518

fill(AccessorType(lhs), 0);

1519

fill(AccessorType(rhs), 1);

Georgios Pinitas

2019-05-21 13:32:43 +0100

[diff] [blame]

1520

fill(AccessorType(bias), 2);

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1521

1522

// Compute GEMM

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1523

ITensorPack reshape_rhs_pack = { { ACL_SRC, &rhs }, { ACL_DST, &rhs_reshaped } };

1524

reshape_rhs.run(reshape_rhs_pack);

1525

ITensorPack gemm_pack({ { ACL_SRC_0, &lhs },

1526

{ ACL_SRC_1, &rhs_reshaped },

1527

{ ACL_SRC_2, &bias },

1528

{ ACL_DST, &dst }

1529

});

1530

gemm.run(gemm_pack);

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

return dst;

}

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

1535

SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, bool broadcast_bias,

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1536

const ActivationLayerInfo &act_info)

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1537

{

1538

TensorShape dst_shape = lhs_shape;

1539

dst_shape[0] = rhs_shape[0];

1540

dst_shape[1] = lhs_shape[1];

1541

1542

// Create reference

1543

SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };

1544

SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };

Georgios Pinitas

2019-05-21 13:32:43 +0100

[diff] [blame]

1545

SimpleTensor<T> bias{ dst_shape, data_type, 1 };

1546

1547

const int n = rhs_shape[0];

1548

const int m = lhs_shape[1];

1549

const int batch_size = lhs_shape[2];

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

// Fill reference

fill(lhs, 0);

fill(rhs, 1);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1554

fill(bias, 2);

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1555

Georgios Pinitas

2019-05-21 13:32:43 +0100

[diff] [blame]

1556

if(broadcast_bias)

1557

{

Gunes Bayir

2021-12-10 16:17:56 +0000

[diff] [blame]

1558

// In case of broadcast, we need to simply copy the first into the following "M" ones

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1559

for(int i = 1; i < m * batch_size; i++)

Georgios Pinitas

2019-05-21 13:32:43 +0100

[diff] [blame]

1560

{

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1561

memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));

Georgios Pinitas

2019-05-21 13:32:43 +0100

[diff] [blame]

1562

}

1563

}

Georgios Pinitas

2019-05-21 13:32:43 +0100

[diff] [blame]

1564

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1565

return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1566

}

1567

Sheri Zhang

2020-11-16 21:17:28 +0000

[diff] [blame]

1568

bool validate_result = true;

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1569

TensorType _target{};

1570

SimpleTensor<T> _reference{};

1571

};

1572

SiCongLi

2021-10-24 19:12:33 +0100

[diff] [blame]

1573

/** (EXPERIMENTAL_POST_OPS)*/

1574

template <typename TensorType, typename AccessorType, typename T, typename ReshapeRHSOperatorType, typename GEMMOperatorType>

1575

class GEMMMatrixMultiplyReshapedOnlyRHSWithPostOpsValidationFixture : public framework::Fixture

1576

{

1577

public:

1578

using PostOpArgBroadcast = std::tuple<bool, bool, bool>; // Instruct fixture if we need broadcasting in dimension 0, 1, 2 of each PostOp argument

1579

template <typename...>

1580

void setup(unsigned int m, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0, unsigned int h0,

1581

bool interleave_rhs, bool transpose_rhs, bool export_to_cl_image, DataType data_type, float alpha, float beta, bool broadcast_bias, const ActivationLayerInfo &act_info,

1582

const experimental::PostOpList<PostOpArgBroadcast> &post_ops)

1583

{

1584

GEMMLHSMatrixInfo lhs_info;

lhs_info.m0 = m0;

lhs_info.k0 = k0;

GEMMRHSMatrixInfo rhs_info;

rhs_info.n0 = n0;

rhs_info.k0 = k0;

rhs_info.h0 = h0;

rhs_info.interleave = interleave_rhs;

1593

rhs_info.transpose = transpose_rhs;

1594

rhs_info.export_to_cl_image = export_to_cl_image;

1595

1596

// Set the tensor shapes for LHS and RHS matrices

1597

const TensorShape lhs_shape(k, m, batch_size);

1598

const TensorShape rhs_shape(n, k, batch_size);

1599

const TensorShape bias_shape(n,

1600

broadcast_bias ? 1 : m,

1601

broadcast_bias ? 1 : batch_size);

1602

auto post_ops_with_shapes = experimental::transform_post_op_list_arguments<PostOpArgBroadcast, TensorShape>(post_ops,

1603

[ = ](auto broadcast)

{

return TensorShape

{

std::get<0>(broadcast) ? 1 : n,

1608

std::get<1>(broadcast) ? 1 : m,

1609

std::get<2>(broadcast) ? 1 : batch_size,

};

});

_target = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, broadcast_bias, act_info, post_ops_with_shapes);

1614

if(validate_result)

1615

{

1616

_reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, broadcast_bias, act_info, post_ops_with_shapes);

}

}

protected:

template <typename U>

1622

void fill(U &&tensor, int i)

1623

{

1624

static_assert(std::is_floating_point<T>::value || std::is_same<T, half>::value, "Only floating point data types supported.");

1625

using DistributionType = typename std::conditional<std::is_same<T, half>::value, arm_compute::utils::uniform_real_distribution_16bit<T>, std::uniform_real_distribution<T>>::type;

1626

1627

DistributionType distribution{ T(-1.0f), T(1.0f) };

1628

library->fill(tensor, distribution, i);

1629

1630

// Fill border with infinity in order to check the presence of NaN values (i.e. inf * 0)

1631

DistributionType distribution_inf{ T(std::numeric_limits<float>::infinity()), T(std::numeric_limits<float>::infinity()) };

1632

library->fill_borders_with_garbage(tensor, distribution_inf, i);

1633

}

1634

1635

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,

1636

DataType data_type, float alpha, float beta, bool broadcast_bias, const ActivationLayerInfo &act_info, const experimental::PostOpList<TensorShape> &post_ops)

1637

{

1638

// Create tensors

1639

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

1640

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

1641

TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);

1642

TensorType rhs_reshaped;

1643

TensorType dst;

1644

// Create post op tensors and populate post op with them

1645

std::vector<TensorType> post_op_tensors_holder{};

1646

auto populated_post_ops = experimental::transform_post_op_list_arguments<TensorShape, ITensorInfo *>(post_ops,

1647

[&post_op_tensors_holder, &data_type](auto shape)

1648

{

1649

auto t = create_tensor<TensorType>(shape, data_type, 1);

1650

post_op_tensors_holder.push_back(std::move(t));

1651

return post_op_tensors_holder.back().info();

1652

});

1653

1654

const unsigned int M = lhs_shape[1];

1655

const unsigned int N = rhs_shape[0];

1656

const unsigned int K = lhs_shape[0];

1657

GEMMKernelInfo kernel_info;

kernel_info.m = M;

kernel_info.n = N;

kernel_info.k = K;

kernel_info.depth_output_gemm3d = 0;

1662

kernel_info.reinterpret_input_as_3d = false;

1663

kernel_info.broadcast_bias = broadcast_bias;

1664

kernel_info.activation_info = act_info;

1665

kernel_info.post_ops = populated_post_ops;

1666

1667

// The output tensor will be auto-initialized within the function

1668

1669

// Create and configure function

1670

ReshapeRHSOperatorType reshape_rhs;

1671

GEMMOperatorType gemm;

1672

1673

validate_result = bool(reshape_rhs.validate(rhs.info(), rhs_reshaped.info(), rhs_info));

1674

validate_result = validate_result || !rhs_info.export_to_cl_image;

if(!validate_result)

{

return nullptr;

}

reshape_rhs.configure(rhs.info(), rhs_reshaped.info(), rhs_info);

1681

gemm.configure(lhs.info(), rhs_reshaped.info(), bias.info(), dst.info(), alpha, beta, lhs_info, rhs_info, kernel_info);

1682

1683

ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());

1684

ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());

1685

ARM_COMPUTE_ASSERT(bias.info()->is_resizable());

1686

for(const auto &tensor : post_op_tensors_holder)

1687

{

1688

ARM_COMPUTE_ASSERT(tensor.info()->is_resizable());

1689

}

1690

1691

// We do not pad when using image as it needs to comply to strict pitch alignment restrictions

1692

if(!rhs_info.export_to_cl_image)

1693

{

1694

add_padding_x({ &lhs, &rhs, &rhs_reshaped, &bias, &dst });

1695

for(auto &tensor : post_op_tensors_holder)

1696

{

1697

add_padding_x({ &tensor });

}

}

// Allocate tensors

lhs.allocator()->allocate();

1703

rhs.allocator()->allocate();

1704

rhs_reshaped.allocator()->allocate();

1705

bias.allocator()->allocate();

1706

dst.allocator()->allocate();

1707

for(auto &tensor : post_op_tensors_holder)

1708

{

1709

tensor.allocator()->allocate();

1710

}

1711

1712

ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());

1713

ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());

1714

ARM_COMPUTE_ASSERT(!rhs_reshaped.info()->is_resizable());

1715

ARM_COMPUTE_ASSERT(!bias.info()->is_resizable());

1716

ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());

1717

for(const auto &tensor : post_op_tensors_holder)

1718

{

1719

ARM_COMPUTE_ASSERT(!tensor.info()->is_resizable());

}

// Fill tensors

fill(AccessorType(lhs), 0);

1724

fill(AccessorType(rhs), 1);

1725

fill(AccessorType(bias), 2);

1726

for(size_t i = 0; i < post_op_tensors_holder.size(); ++i)

1727

{

1728

fill(AccessorType(post_op_tensors_holder.at(i)), 3 + i);

}

// Compute GEMM

ITensorPack reshape_rhs_pack = { { ACL_SRC, &rhs }, { ACL_DST, &rhs_reshaped } };

1733

reshape_rhs.run(reshape_rhs_pack);

1734

ITensorPack gemm_pack({ { ACL_SRC_0, &lhs },

1735

{ ACL_SRC_1, &rhs_reshaped },

1736

{ ACL_SRC_2, &bias },

1737

{ ACL_DST, &dst }

1738

});

1739

for(size_t i = 0; i < post_op_tensors_holder.size(); ++i)

1740

{

1741

gemm_pack.add_tensor(experimental::get_post_op_arg_type(i), &post_op_tensors_holder.at(i));

}

gemm.run(gemm_pack);

return dst;

}

SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, bool broadcast_bias,

1749

const ActivationLayerInfo &act_info, const experimental::PostOpList<TensorShape> &post_ops)

1750

{

1751

TensorShape dst_shape = lhs_shape;

1752

dst_shape[0] = rhs_shape[0];

1753

dst_shape[1] = lhs_shape[1];

1754

1755

// Create reference

1756

SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };

1757

SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };

1758

SimpleTensor<T> bias{ dst_shape, data_type, 1 };

1759

// Create post op tensors and populate post op with them

1760

auto populated_post_ops = experimental::transform_post_op_list_arguments<TensorShape, SimpleTensor<T>>(post_ops, [&data_type](auto shape)

1761

{

1762

return SimpleTensor<T> { shape, data_type, 1 };

1763

});

1764

1765

const int n = rhs_shape[0];

1766

const int m = lhs_shape[1];

1767

const int batch_size = lhs_shape[2];

// Fill reference

int tensor_idx = 0;

fill(lhs, tensor_idx++);

1772

fill(rhs, tensor_idx++);

1773

fill(bias, tensor_idx++);

1774

for(auto &op : populated_post_ops.get_list())

1775

{

1776

for(auto tensor : op->arguments())

1777

{

1778

fill(*tensor, tensor_idx++);

}

}

if(broadcast_bias)

{

Gunes Bayir

2021-12-10 16:17:56 +0000

[diff] [blame]

1784

// In case of broadcast, we need to simply copy the first into the following "M" ones

SiCongLi

2021-10-24 19:12:33 +0100

[diff] [blame]

1785

for(int i = 1; i < m * batch_size; i++)

1786

{

1787

memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));

}

}

SimpleTensor<T> out;

out = reference::gemm<T>(lhs, rhs, bias, alpha, beta);

1793

// Ignore activation info if post ops are used instead

1794

if(populated_post_ops.size() > 0)

1795

{

1796

out = reference::post_ops<T>(out, populated_post_ops);

}

else

{

out = reference::activation_layer(out, act_info);

}

return out;

}

bool validate_result = true;

1806

TensorType _target{};

1807

SimpleTensor<T> _reference{};

1808

};

1809

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1810

template <typename TensorType, typename AccessorType, typename T, typename ReshapeRHSOperatorType, typename GEMMOperatorType>

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1811

class GEMMMatrixMultiplyReshapedOnlyRHS3DValidationFixture : public framework::Fixture

1812

{

1813

public:

1814

template <typename...>

1815

void setup(unsigned int m_w, unsigned int m_h, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0, unsigned int h0,

Gian Marco Iodice

2020-10-22 16:37:12 +0100

[diff] [blame]

1816

bool interleave_rhs, bool transpose_rhs, bool export_to_cl_image, bool has_pad_y, DataType data_type, float alpha, float beta, const ActivationLayerInfo &act_info)

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1817

{

1818

GEMMLHSMatrixInfo lhs_info;

lhs_info.m0 = m0;

lhs_info.k0 = k0;

GEMMRHSMatrixInfo rhs_info;

Gian Marco Iodice

781cba7

2020-06-19 16:56:57 +0100

[diff] [blame]

rhs_info.n0 = n0;

rhs_info.k0 = k0;

rhs_info.h0 = h0;

rhs_info.interleave = interleave_rhs;

1827

rhs_info.transpose = transpose_rhs;

1828

rhs_info.export_to_cl_image = export_to_cl_image;

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1829

1830

// In case of GEMM3D, m is the product between m_w and m_h

1831

const unsigned int m = m_w * m_h;

1832

1833

// Set the tensor shapes for LHS and RHS matrices

1834

const TensorShape lhs_shape(k, m, batch_size);

1835

const TensorShape rhs_shape(n, k, batch_size);

1836

const TensorShape bias_shape(n, 1, 1);

1837

Sheri Zhang

2020-11-16 21:17:28 +0000

[diff] [blame]

1838

_target = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, m_h, act_info, has_pad_y);

1839

if(validate_result)

1840

{

1841

_reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, m_h, act_info);

1842

}

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

}

protected:

template <typename U>

1847

void fill(U &&tensor, int i)

1848

{

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

1849

static_assert(std::is_floating_point<T>::value || std::is_same<T, half>::value, "Only floating point data types supported.");

Giorgio Arena

2021-01-08 10:37:15 +0000

[diff] [blame]

1850

using DistributionType = typename std::conditional<std::is_same<T, half>::value, arm_compute::utils::uniform_real_distribution_16bit<T>, std::uniform_real_distribution<T>>::type;

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

1851

1852

DistributionType distribution{ T(-1.0f), T(1.0f) };

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1853

library->fill(tensor, distribution, i);

1854

}

1855

1856

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,

1857

DataType data_type, float alpha, float beta,

Gian Marco Iodice

2020-10-22 16:37:12 +0100

[diff] [blame]

1858

unsigned int m_h, const ActivationLayerInfo &act_info, bool has_pad_y)

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1859

{

1860

// Create tensors

1861

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

1862

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

1863

TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);

1864

TensorType rhs_reshaped;

1865

TensorType dst;

1866

1867

const unsigned int M = lhs_shape[1];

1868

const unsigned int N = rhs_shape[0];

1869

const unsigned int K = lhs_shape[0];

Gian Marco Iodice

2019-06-26 17:18:11 +0100

[diff] [blame]

1870

GEMMKernelInfo kernel_info;

kernel_info.m = M;

kernel_info.n = N;

kernel_info.k = K;

kernel_info.depth_output_gemm3d = m_h;

1875

kernel_info.reinterpret_input_as_3d = false;

1876

kernel_info.broadcast_bias = true;

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1877

kernel_info.activation_info = act_info;

Gian Marco Iodice

2020-10-22 16:37:12 +0100

[diff] [blame]

1878

kernel_info.has_pad_y = has_pad_y;

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1879

1880

// The output tensor will be auto-initialized within the function

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1881

// Create and configure function

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1882

ReshapeRHSOperatorType reshape_rhs;

1883

GEMMOperatorType gemm;

Sheri Zhang

2020-11-16 21:17:28 +0000

[diff] [blame]

1884

1885

validate_result = bool(reshape_rhs.validate(rhs.info(), rhs_reshaped.info(), rhs_info));

1886

validate_result = validate_result || !rhs_info.export_to_cl_image;

if(!validate_result)

{

return nullptr;

}

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1892

reshape_rhs.configure(rhs.info(), rhs_reshaped.info(), rhs_info);

1893

gemm.configure(lhs.info(), rhs_reshaped.info(), bias.info(), dst.info(), alpha, beta, lhs_info, rhs_info, kernel_info);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1894

Gian Marco Iodice

2020-10-22 16:37:12 +0100

[diff] [blame]

1895

if(has_pad_y)

1896

{

1897

// Add dummy padding into lhs to validate has_pad_y path

1898

lhs.info()->extend_padding(PaddingSize(2, 0, 2, 0));

1899

dst.info()->extend_padding(PaddingSize(2, 0, 1, 0));

1900

}

1901

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

1902

ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());

1903

ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());

1904

ARM_COMPUTE_ASSERT(bias.info()->is_resizable());

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1905

Georgios Pinitas

2021-04-13 13:35:58 +0100

[diff] [blame]

1906

// We do not pad when using image as it needs to comply to strict pitch alignment restrictions

Giorgio Arena

2021-03-25 14:54:50 +0000

[diff] [blame]

1907

if(!rhs_info.export_to_cl_image)

1908

{

1909

add_padding_x({ &lhs, &rhs, &rhs_reshaped, &bias, &dst });

1910

}

1911

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1912

// Allocate tensors

1913

lhs.allocator()->allocate();

1914

rhs.allocator()->allocate();

1915

rhs_reshaped.allocator()->allocate();

1916

bias.allocator()->allocate();

1917

dst.allocator()->allocate();

1918

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

1919

ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());

1920

ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());

1921

ARM_COMPUTE_ASSERT(!rhs_reshaped.info()->is_resizable());

1922

ARM_COMPUTE_ASSERT(!bias.info()->is_resizable());

1923

ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1924

1925

// Fill tensors

1926

fill(AccessorType(lhs), 0);

1927

fill(AccessorType(rhs), 1);

1928

fill(AccessorType(bias), 2);

1929

1930

// Compute GEMM

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1931

ITensorPack reshape_rhs_pack = { { ACL_SRC, &rhs }, { ACL_DST, &rhs_reshaped } };

1932

reshape_rhs.run(reshape_rhs_pack);

1933

ITensorPack gemm_pack({ { ACL_SRC_0, &lhs },

1934

{ ACL_SRC_1, &rhs_reshaped },

1935

{ ACL_SRC_2, &bias },

1936

{ ACL_DST, &dst }

1937

});

1938

gemm.run(gemm_pack);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

return dst;

}

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

1943

SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, unsigned int m_h,

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1944

const ActivationLayerInfo &act_info)

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1945

{

1946

TensorShape dst_shape = lhs_shape;

1947

dst_shape.set(0, rhs_shape[0]);

1948

dst_shape.set(1, lhs_shape[1] / m_h);

1949

dst_shape.set(2, m_h);

1950

dst_shape.set(3, lhs_shape[2]);

1951

1952

// Create reference

1953

SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };

1954

SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };

1955

SimpleTensor<T> bias{ dst_shape, data_type, 1 };

1956

1957

const int n = rhs_shape[0];

1958

const int m = lhs_shape[1];

1959

const int batch_size = lhs_shape[2];

// Fill reference

fill(lhs, 0);

fill(rhs, 1);

fill(bias, 2);

Gunes Bayir

2021-12-10 16:17:56 +0000

[diff] [blame]

1966

// In case of broadcast, we need to simply copy the first into the following "M" ones

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1967

for(int i = 1; i < m * batch_size; i++)

1968

{

1969

memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));

1970

}

1971

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1972

return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1973

}

1974

Sheri Zhang

2020-11-16 21:17:28 +0000

[diff] [blame]

1975

bool validate_result = true;

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1976

TensorType _target{};

1977

SimpleTensor<T> _reference{};

1978

};

1979

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1980

template <typename TensorType, typename AccessorType, typename T, typename GEMMOperatorType>

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1981

class GEMMMatrixMultiplyNativeValidationFixture : public framework::Fixture

1982

{

1983

public:

1984

template <typename...>

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1985

void setup(unsigned int m, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0, DataType data_type, float alpha, float beta, bool broadcast_bias,

1986

const ActivationLayerInfo &act_info)

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1987

{

1988

GEMMLHSMatrixInfo lhs_info;

lhs_info.m0 = m0;

lhs_info.k0 = k0;

GEMMRHSMatrixInfo rhs_info;

rhs_info.n0 = n0;

rhs_info.k0 = k0;

// Set the tensor shapes for LHS and RHS matrices

1997

const TensorShape lhs_shape(k, m, batch_size);

1998

const TensorShape rhs_shape(n, k, batch_size);

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

1999

const TensorShape bias_shape(n,

2000

broadcast_bias ? 1 : m,

2001

broadcast_bias ? 1 : batch_size);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

2002

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

2003

_target = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, broadcast_bias, act_info);

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

2004

_reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, broadcast_bias, act_info);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

}

protected:

template <typename U>

2009

void fill(U &&tensor, int i)

2010

{

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

2011

static_assert(std::is_floating_point<T>::value || std::is_same<T, half>::value, "Only floating point data types supported.");

Giorgio Arena

2021-01-08 10:37:15 +0000

[diff] [blame]

2012

using DistributionType = typename std::conditional<std::is_same<T, half>::value, arm_compute::utils::uniform_real_distribution_16bit<T>, std::uniform_real_distribution<T>>::type;

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

2013

2014

DistributionType distribution{ T(-1.0f), T(1.0f) };

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

2015

library->fill(tensor, distribution, i);

2016

2017

// Fill border with infinity in order to check the presence of NaN values (i.e. inf * 0)

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

2018

DistributionType distribution_inf{ T(std::numeric_limits<float>::infinity()), T(std::numeric_limits<float>::infinity()) };

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

2019

library->fill_borders_with_garbage(tensor, distribution_inf, i);

2020

}

2021

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

2022

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

2023

DataType data_type, float alpha, float beta, bool broadcast_bias, const ActivationLayerInfo &act_info)

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

2024

{

2025

// Create tensors

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

2026

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

2027

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

2028

TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

2029

TensorType dst;

2030

2031

const unsigned int M = lhs_shape[1];

2032

const unsigned int N = rhs_shape[0];

2033

const unsigned int K = lhs_shape[0];

Gian Marco Iodice

2019-06-26 17:18:11 +0100

[diff] [blame]

2034

GEMMKernelInfo kernel_info;

kernel_info.m = M;

kernel_info.n = N;

kernel_info.k = K;

kernel_info.depth_output_gemm3d = 0;

2039

kernel_info.reinterpret_input_as_3d = false;

2040

kernel_info.broadcast_bias = broadcast_bias;

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

2041

kernel_info.activation_info = act_info;

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

2042

2043

// Create and configure function

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

2044

GEMMOperatorType gemm;

2045

gemm.configure(lhs.info(), rhs.info(), bias.info(), dst.info(), alpha, beta, lhs_info, rhs_info, kernel_info);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

2046

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

2047

ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());

2048

ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());

2049

ARM_COMPUTE_ASSERT(bias.info()->is_resizable());

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

2050

Giorgio Arena

2021-03-25 14:54:50 +0000

[diff] [blame]

2051

add_padding_x({ &lhs, &rhs, &bias, &dst });

2052

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

2053

// Allocate tensors

2054

lhs.allocator()->allocate();

2055

rhs.allocator()->allocate();

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

2056

bias.allocator()->allocate();

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

2057

dst.allocator()->allocate();

2058

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

2059

ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());

2060

ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());

2061

ARM_COMPUTE_ASSERT(!bias.info()->is_resizable());

2062

ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

2063

2064

// Fill tensors

2065

fill(AccessorType(lhs), 0);

2066

fill(AccessorType(rhs), 1);

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

2067

fill(AccessorType(bias), 2);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

2068

2069

// Compute GEMM

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

2070

ITensorPack gemm_pack({ { ACL_SRC_0, &lhs },

2071

{ ACL_SRC_1, &rhs },

2072

{ ACL_SRC_2, &bias },

2073

{ ACL_DST, &dst }

2074

});

2075

gemm.run(gemm_pack);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

return dst;

}

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

2080

SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, bool broadcast_bias,

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

2081

const ActivationLayerInfo &act_info)

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

2082

{

2083

TensorShape dst_shape = lhs_shape;

2084

dst_shape[0] = rhs_shape[0];

2085

dst_shape[1] = lhs_shape[1];

2086

2087

// Create reference

2088

SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };

2089

SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

2090

SimpleTensor<T> bias{ dst_shape, data_type, 1 };

2091

2092

const int n = rhs_shape[0];

2093

const int m = lhs_shape[1];

2094

const int batch_size = lhs_shape[2];

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

// Fill reference

fill(lhs, 0);

fill(rhs, 1);

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

2099

fill(bias, 2);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

2100

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

2101

if(broadcast_bias)

2102

{

Gunes Bayir

2021-12-10 16:17:56 +0000

[diff] [blame]

2103

// In case of broadcast, we need to simply copy the first into the following "M" ones

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

2104

for(int i = 1; i < m * batch_size; i++)

2105

{

2106

memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));

}

}

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

2110

return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

2111

}

2112

2113

TensorType _target{};

2114

SimpleTensor<T> _reference{};

2115

};

2116

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

2117

template <typename TensorType, typename AccessorType, typename T, typename GEMMOperatorType>

SiCongLi

2021-10-24 19:12:33 +0100

[diff] [blame]

2118

class GEMMMatrixMultiplyNativeWithPostOpsValidationFixture : public framework::Fixture

2119

{

2120

public:

2121

using PostOpArgBroadcast = std::tuple<bool, bool, bool>; // Instruct fixture if we need broadcasting in dimension 0, 1, 2 of each PostOp argument

2122

public:

2123

template <typename...>

2124

void setup(unsigned int m, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0, DataType data_type, float alpha, float beta, bool broadcast_bias,

2125

const ActivationLayerInfo &act_info, const experimental::PostOpList<PostOpArgBroadcast> &post_ops)

2126

{

2127

GEMMLHSMatrixInfo lhs_info;

lhs_info.m0 = m0;

lhs_info.k0 = k0;

GEMMRHSMatrixInfo rhs_info;

rhs_info.n0 = n0;

rhs_info.k0 = k0;

// Set the tensor shapes for LHS and RHS matrices

2136

const TensorShape lhs_shape(k, m, batch_size);

2137

const TensorShape rhs_shape(n, k, batch_size);

2138

const TensorShape bias_shape(n,

2139

broadcast_bias ? 1 : m,

2140

broadcast_bias ? 1 : batch_size);

2141

const auto post_ops_with_shapes = experimental::transform_post_op_list_arguments<PostOpArgBroadcast, TensorShape>(post_ops,

2142

[ = ](auto broadcast)

{

return TensorShape

{

std::get<0>(broadcast) ? 1 : n,

2147

std::get<1>(broadcast) ? 1 : m,

2148

std::get<2>(broadcast) ? 1 : batch_size,

};

});

_target = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, broadcast_bias, act_info, post_ops_with_shapes);

2153

_reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, broadcast_bias, act_info, post_ops_with_shapes);

}

protected:

template <typename U>

2158

void fill(U &&tensor, int i)

2159

{

2160

static_assert(std::is_floating_point<T>::value || std::is_same<T, half>::value, "Only floating point data types supported.");

2161

using DistributionType = typename std::conditional<std::is_same<T, half>::value, arm_compute::utils::uniform_real_distribution_16bit<T>, std::uniform_real_distribution<T>>::type;

2162

2163

DistributionType distribution{ T(-1.0f), T(1.0f) };

2164

library->fill(tensor, distribution, i);

2165

2166

// Fill border with infinity in order to check the presence of NaN values (i.e. inf * 0)

2167

DistributionType distribution_inf{ T(std::numeric_limits<float>::infinity()), T(std::numeric_limits<float>::infinity()) };

2168

library->fill_borders_with_garbage(tensor, distribution_inf, i);

2169

}

2170

2171

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,

2172

DataType data_type, float alpha, float beta, bool broadcast_bias, const ActivationLayerInfo &act_info, const experimental::PostOpList<TensorShape> &post_ops)

2173

{

2174

// Create tensors

2175

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

2176

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

2177

TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);

2178

TensorType dst;

2179

// Create post op tensors and populate post op with them

2180

std::vector<TensorType> post_op_tensors_holder{};

2181

auto populated_post_ops = experimental::transform_post_op_list_arguments<TensorShape, ITensorInfo *>(post_ops,

2182

[&post_op_tensors_holder, &data_type](auto shape)

2183

{

2184

auto t = create_tensor<TensorType>(shape, data_type, 1);

2185

post_op_tensors_holder.push_back(std::move(t));

2186

return post_op_tensors_holder.back().info();

2187

});

2188

2189

const unsigned int M = lhs_shape[1];

2190

const unsigned int N = rhs_shape[0];

2191

const unsigned int K = lhs_shape[0];

2192

GEMMKernelInfo kernel_info;

kernel_info.m = M;

kernel_info.n = N;

kernel_info.k = K;

kernel_info.depth_output_gemm3d = 0;

2197

kernel_info.reinterpret_input_as_3d = false;

2198

kernel_info.broadcast_bias = broadcast_bias;

2199

kernel_info.activation_info = act_info;

2200

kernel_info.post_ops = populated_post_ops;

2201

2202

// Create and configure function

2203

GEMMOperatorType gemm;

2204

gemm.configure(lhs.info(), rhs.info(), bias.info(), dst.info(), alpha, beta, lhs_info, rhs_info, kernel_info);

2205

2206

ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());

2207

ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());

2208

ARM_COMPUTE_ASSERT(bias.info()->is_resizable());

2209

for(const auto &tensor : post_op_tensors_holder)

2210

{

2211

ARM_COMPUTE_ASSERT(tensor.info()->is_resizable());

2212

}

2213

2214

add_padding_x({ &lhs, &rhs, &bias, &dst });

2215

for(auto &tensor : post_op_tensors_holder)

2216

{

2217

add_padding_x({ &tensor });

}

// Allocate tensors

lhs.allocator()->allocate();

2222

rhs.allocator()->allocate();

2223

bias.allocator()->allocate();

2224

dst.allocator()->allocate();

2225

for(auto &tensor : post_op_tensors_holder)

2226

{

2227

tensor.allocator()->allocate();

2228

}

2229

2230

ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());

2231

ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());

2232

ARM_COMPUTE_ASSERT(!bias.info()->is_resizable());

2233

ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());

2234

for(const auto &tensor : post_op_tensors_holder)

2235

{

2236

ARM_COMPUTE_ASSERT(!tensor.info()->is_resizable());

}

// Fill tensors

fill(AccessorType(lhs), 0);

2241

fill(AccessorType(rhs), 1);

2242

fill(AccessorType(bias), 2);

2243

for(size_t i = 0; i < post_op_tensors_holder.size(); ++i)

2244

{

2245

fill(AccessorType(post_op_tensors_holder.at(i)), 3 + i);

}

// Compute GEMM

ITensorPack gemm_pack({ { ACL_SRC_0, &lhs },

2250

{ ACL_SRC_1, &rhs },

2251

{ ACL_SRC_2, &bias },

2252

{ ACL_DST, &dst }

2253

});

2254

for(size_t i = 0; i < post_op_tensors_holder.size(); ++i)

2255

{

2256

gemm_pack.add_tensor(experimental::get_post_op_arg_type(i), &post_op_tensors_holder.at(i));

}

gemm.run(gemm_pack);

return dst;

}

SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, bool broadcast_bias,

2264

const ActivationLayerInfo &act_info, const experimental::PostOpList<TensorShape> &post_ops)

2265

{

2266

TensorShape dst_shape = lhs_shape;

2267

dst_shape[0] = rhs_shape[0];

2268

dst_shape[1] = lhs_shape[1];

2269

2270

// Create reference

2271

SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };

2272

SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };

2273

SimpleTensor<T> bias{ dst_shape, data_type, 1 };

2274

// Create post op tensors and populate post op with them

2275

auto populated_post_ops = experimental::transform_post_op_list_arguments<TensorShape, SimpleTensor<T>>(post_ops, [&data_type](auto shape)

2276

{

2277

return SimpleTensor<T> { shape, data_type, 1 };

2278

});

2279

2280

const int n = rhs_shape[0];

2281

const int m = lhs_shape[1];

2282

const int batch_size = lhs_shape[2];

// Fill reference

int tensor_idx = 0;

fill(lhs, tensor_idx++);

2287

fill(rhs, tensor_idx++);

2288

fill(bias, tensor_idx++);

2289

for(auto &op : populated_post_ops.get_list())

2290

{

2291

for(auto tensor : op->arguments())

2292

{

2293

fill(*tensor, tensor_idx++);

}

}

if(broadcast_bias)

{

Gunes Bayir

2021-12-10 16:17:56 +0000

[diff] [blame]

2299

// In case of broadcast, we need to simply copy the first into the following "M" ones

SiCongLi

2021-10-24 19:12:33 +0100

[diff] [blame]

2300

for(int i = 1; i < m * batch_size; i++)

2301

{

2302

memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));

}

}

SimpleTensor<T> out;

out = reference::gemm<T>(lhs, rhs, bias, alpha, beta);

2308

// Ignore activation info if post ops are used instead

2309

if(populated_post_ops.size() > 0)

2310

{

2311

out = reference::post_ops<T>(out, populated_post_ops);

}

else

{

out = reference::activation_layer(out, act_info);

}

return out;

}

TensorType _target{};

2321

SimpleTensor<T> _reference{};

2322

};

2323

2324

template <typename TensorType, typename AccessorType, typename T, typename GEMMOperatorType>

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

2325

class GEMMMatrixMultiplyNative3DValidationFixture : public framework::Fixture

2326

{

2327

public:

2328

template <typename...>

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

2329

void setup(unsigned int m_w, unsigned int m_h, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0, DataType data_type, float alpha, float beta,

2330

const ActivationLayerInfo &act_info)

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

2331

{

2332

GEMMLHSMatrixInfo lhs_info;

lhs_info.m0 = m0;

lhs_info.k0 = k0;

GEMMRHSMatrixInfo rhs_info;

rhs_info.n0 = n0;

rhs_info.k0 = k0;

// In case of GEMM3D, m is the product between m_w and m_h

2341

const unsigned int m = m_w * m_h;

2342

2343

// Set the tensor shapes for LHS and RHS matrices

2344

const TensorShape lhs_shape(k, m, batch_size);

2345

const TensorShape rhs_shape(n, k, batch_size);

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

2346

const TensorShape bias_shape(n, 1, 1);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

2347

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

2348

_target = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, m_h, act_info);

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

2349

_reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, m_h, act_info);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

}

protected:

template <typename U>

2354

void fill(U &&tensor, int i)

2355

{

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

2356

static_assert(std::is_floating_point<T>::value || std::is_same<T, half>::value, "Only floating point data types supported.");

Giorgio Arena

2021-01-08 10:37:15 +0000

[diff] [blame]

2357

using DistributionType = typename std::conditional<std::is_same<T, half>::value, arm_compute::utils::uniform_real_distribution_16bit<T>, std::uniform_real_distribution<T>>::type;

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

2358

2359

DistributionType distribution{ T(-1.0f), T(1.0f) };

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

2360

library->fill(tensor, distribution, i);

2361

}

2362

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

2363

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

2364

DataType data_type, float alpha, float beta, unsigned int m_h, const ActivationLayerInfo &act_info)

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

2365

{

2366

// Create tensors

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

2367

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

2368

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

2369

TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

2370

TensorType dst;

2371

2372

const unsigned int M = lhs_shape[1];

2373

const unsigned int N = rhs_shape[0];

2374

const unsigned int K = lhs_shape[0];

Gian Marco Iodice

2019-06-26 17:18:11 +0100

[diff] [blame]

2375

GEMMKernelInfo kernel_info;

kernel_info.m = M;

kernel_info.n = N;

kernel_info.k = K;

kernel_info.depth_output_gemm3d = m_h;

2380

kernel_info.reinterpret_input_as_3d = false;

2381

kernel_info.broadcast_bias = true;

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

2382

kernel_info.activation_info = act_info;

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

2383

2384

// The output tensor will be auto-initialized within the function

2385

2386

// Create and configure function

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

2387

GEMMOperatorType gemm;

2388

gemm.configure(lhs.info(), rhs.info(), bias.info(), dst.info(), alpha, beta, lhs_info, rhs_info, kernel_info);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

2389

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

2390

ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());

2391

ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());

2392

ARM_COMPUTE_ASSERT(bias.info()->is_resizable());

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

2393

Giorgio Arena

2021-03-25 14:54:50 +0000

[diff] [blame]

2394

add_padding_x({ &lhs, &rhs, &bias, &dst });

2395

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

2396

// Allocate tensors

2397

lhs.allocator()->allocate();

2398

rhs.allocator()->allocate();

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

2399

bias.allocator()->allocate();

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

2400

dst.allocator()->allocate();

2401

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

2402

ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());

2403

ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());

2404

ARM_COMPUTE_ASSERT(!bias.info()->is_resizable());

2405

ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

2406

2407

// Fill tensors

2408

fill(AccessorType(lhs), 0);

2409

fill(AccessorType(rhs), 1);

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

2410

fill(AccessorType(bias), 2);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

2411

2412

// Compute GEMM

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

2413

ITensorPack gemm_pack({ { ACL_SRC_0, &lhs },

2414

{ ACL_SRC_1, &rhs },

2415

{ ACL_SRC_2, &bias },

2416

{ ACL_DST, &dst }

2417

});

2418

gemm.run(gemm_pack);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

return dst;

}

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

2423

SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, unsigned int m_h,

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

2424

const ActivationLayerInfo &act_info)

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

2425

{

2426

TensorShape dst_shape = lhs_shape;

2427

dst_shape.set(0, rhs_shape[0]);

2428

dst_shape.set(1, lhs_shape[1] / m_h);

2429

dst_shape.set(2, m_h);

2430

dst_shape.set(3, lhs_shape[2]);

2431

2432

// Create reference

2433

SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };

2434

SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

2435

SimpleTensor<T> bias{ dst_shape, data_type, 1 };

2436

2437

const int n = rhs_shape[0];

2438

const int m = lhs_shape[1];

2439

const int batch_size = lhs_shape[2];

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

// Fill reference

fill(lhs, 0);

fill(rhs, 1);

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

2444

fill(bias, 2);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

2445

Gunes Bayir

2021-12-10 16:17:56 +0000

[diff] [blame]

2446

// In case of broadcast, we need to simply copy the first into the following "M" ones

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

2447

for(int i = 1; i < m * batch_size; i++)

2448

{

2449

memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));

2450

}

2451

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

2452

return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

2453

}

2454

2455

TensorType _target{};

2456

SimpleTensor<T> _reference{};

2457

};

2458

Gunes Bayir