Blame - tests/validation/fixtures/GEMMFixture.h - ml/ComputeLibrary

2018-07-26 11:44:03 +0100

[diff] [blame]

52

class GEMMValidationFixture : public framework::Fixture

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

53

{

54

public:

55

template <typename...>

Pablo Tello

2018-10-30 11:18:37 +0000

[diff] [blame]

56

void setup(TensorShape shape_a, TensorShape shape_b, TensorShape shape_c, TensorShape output_shape, float alpha, float beta, bool pretranspose, DataType data_type)

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

57

{

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

58

ARM_COMPUTE_UNUSED(pretranspose);

59

_target = compute_target(shape_a, shape_b, shape_c, output_shape, alpha, beta, data_type);

60

_reference = compute_reference(shape_a, shape_b, output_shape, alpha, beta, data_type);

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

}

protected:

template <typename U>

Pablo Tello

2018-10-30 11:18:37 +0000

[diff] [blame]

65

void fill(U &&tensor, int i, float lo = -1.f, float hi = 1.f)

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

66

{

67

switch(tensor.data_type())

68

{

69

case DataType::F16:

Giorgio Arena

6aeb217

2020-12-15 15:45:43 +0000

[diff] [blame]

70

{

Giorgio Arena

a8e2aeb

2021-01-06 11:34:57 +0000

[diff] [blame]

71

arm_compute::utils::uniform_real_distribution_16bit<half> distribution{ float(lo), float(hi) };

Giorgio Arena

6aeb217

2020-12-15 15:45:43 +0000

[diff] [blame]

72

library->fill(tensor, distribution, i);

73

break;

74

}

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

75

case DataType::F32:

76

{

Giorgio Arena

6aeb217

2020-12-15 15:45:43 +0000

[diff] [blame]

77

std::uniform_real_distribution<float> distribution(lo, hi);

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

78

library->fill(tensor, distribution, i);

break;

}

default:

library->fill_tensor_uniform(tensor, i);

}

}

TensorType compute_target(const TensorShape &shape_a, const TensorShape &shape_b, const TensorShape &shape_c, const TensorShape &output_shape, float alpha, float beta,

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

87

DataType data_type)

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

88

{

89

// Create tensors

Vidhya Sudhan Loganathan

014333d

2018-07-02 09:13:49 +0100

[diff] [blame]

90

TensorType a = create_tensor<TensorType>(shape_a, data_type, 1);

91

TensorType b = create_tensor<TensorType>(shape_b, data_type, 1);

92

TensorType c = create_tensor<TensorType>(shape_c, data_type, 1);

93

TensorType dst = create_tensor<TensorType>(output_shape, data_type, 1);

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

94

95

// Create and configure function

96

FunctionType gemm;

Isabella Gottardi

8e74f44

2018-03-01 16:42:00 +0000

[diff] [blame]

97

// The GEMMinfo includes the values of the depth in case of reinterpreted 3d output.

Gian Marco Iodice

3139f03

2018-11-05 14:26:32 +0000

[diff] [blame]

98

// If the output shape has the same number of dimensions of the input the method called is a 2D matrix multiplication (depth_output_reinterpreted_as_3D = 0),

Isabella Gottardi

8e74f44

2018-03-01 16:42:00 +0000

[diff] [blame]

99

// in the other case we have to use the reinterpreted version of GEMM (depth_output_reinterpreted_as_3D = depth of the 3D output).

Gian Marco Iodice

2019-07-29 14:27:16 +0100

[diff] [blame]

100

gemm.configure(&a,

101

&b,

102

(disable_c) ? nullptr : &c,

103

&dst,

104

alpha, beta,

Georgios Pinitas

4ee8b15

2021-07-16 16:16:43 +0100

[diff] [blame]

105

GEMMInfo(false, false, false, (reinterpret_output_as_3d ? output_shape[2] : 0), reinterpret_input_as_3d, false, GEMMLowpOutputStageInfo(), false, false, (reinterpret_input_as_3d

Gian Marco Iodice

2019-07-29 14:27:16 +0100

[diff] [blame]

106

|| reinterpret_output_as_3d)));

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

107

ARM_COMPUTE_ASSERT(a.info()->is_resizable());

108

ARM_COMPUTE_ASSERT(b.info()->is_resizable());

109

ARM_COMPUTE_ASSERT(c.info()->is_resizable());

110

ARM_COMPUTE_ASSERT(dst.info()->is_resizable());

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

111

Giorgio Arena

2021-03-25 14:54:50 +0000

[diff] [blame]

112

add_padding_x({ &a, &b, &c, &dst });

113

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

114

// Allocate tensors

115

a.allocator()->allocate();

116

b.allocator()->allocate();

117

c.allocator()->allocate();

118

dst.allocator()->allocate();

119

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

120

ARM_COMPUTE_ASSERT(!a.info()->is_resizable());

121

ARM_COMPUTE_ASSERT(!b.info()->is_resizable());

122

ARM_COMPUTE_ASSERT(!c.info()->is_resizable());

123

ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

124

125

// Fill tensors

126

fill(AccessorType(a), 0);

127

fill(AccessorType(b), 1);

Pablo Tello

2018-10-30 11:18:37 +0000

[diff] [blame]

128

if(!disable_c)

129

{

130

fill(AccessorType(c), 2);

131

}

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

132

133

// Compute GEMM function

gemm.run();

return dst;

}

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

139

SimpleTensor<T> compute_reference(const TensorShape &shape_a, const TensorShape &shape_b, const TensorShape &output_shape, float alpha, float beta,

Vidhya Sudhan Loganathan

014333d

2018-07-02 09:13:49 +0100

[diff] [blame]

140

DataType data_type)

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

141

{

Gian Marco Iodice

2018-07-26 11:44:03 +0100

[diff] [blame]

142

TensorShape shape_a_to_use = shape_a;

Gian Marco Iodice

2019-07-29 14:27:16 +0100

[diff] [blame]

143

Gian Marco Iodice

2018-07-26 11:44:03 +0100

[diff] [blame]

144

if(reinterpret_input_as_3d)

145

{

146

// Collapse the second and third dimension if the input is 3D

147

shape_a_to_use.collapse(2U, 1U);

148

}

149

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

150

// Create reference

Gian Marco Iodice

2018-07-26 11:44:03 +0100

[diff] [blame]

151

SimpleTensor<T> a{ shape_a_to_use, data_type, 1 };

Vidhya Sudhan Loganathan

014333d

2018-07-02 09:13:49 +0100

[diff] [blame]

152

SimpleTensor<T> b{ shape_b, data_type, 1 };

Gian Marco Iodice

2019-07-29 14:27:16 +0100

[diff] [blame]

153

SimpleTensor<T> c{ output_shape, data_type, 1 };

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

// Fill reference

fill(a, 0);

fill(b, 1);

Gian Marco Iodice

2019-07-29 14:27:16 +0100

[diff] [blame]

158

fill(c, 2);

159

160

if(reinterpret_input_as_3d || reinterpret_output_as_3d)

Pablo Tello

2018-10-30 11:18:37 +0000

[diff] [blame]

161

{

Gian Marco Iodice

2019-07-29 14:27:16 +0100

[diff] [blame]

162

const int n = shape_b[0];

163

const int m = reinterpret_output_as_3d ? output_shape[1] * output_shape[2] : output_shape[1];

164

const int batch_size = reinterpret_output_as_3d ? output_shape[3] : output_shape[2];

165

Gunes Bayir

2021-12-10 16:17:56 +0000

[diff] [blame]

166

// In case of broadcast, we need to simply copy the first into the following "M" ones

Gian Marco Iodice

2019-07-29 14:27:16 +0100

[diff] [blame]

167

for(int i = 1; i < m * batch_size; i++)

168

{

169

memcpy(c.data() + i * n, c.data(), n * sizeof(T));

170

}

Pablo Tello

2018-10-30 11:18:37 +0000

[diff] [blame]

171

}

Gunes Bayir

2021-12-10 16:17:56 +0000

[diff] [blame]

172

Adnan AlSinan

3bb72b6

2022-05-06 12:10:11 +0100

[diff] [blame]

173

/* Note: Assuming the usual batch matmul dimensions A = (B x M x K), B = (B x K x N), if pretranspose_A is set to true, then A is assumed to be (B x K x M),

174

therefore, A must be pre-transposed before passing it to the fixture. And, we transpose A again in the fixture to make it (B x M x K)

175

in order to be able to call reference implementation that works with (B x M x K) input.

176

Similarly, if pretranspose_B is set to true, then B is assumed to be (B x N x K), B must be pre-transposed before passing it to the fixture. */

Gunes Bayir

2021-12-10 16:17:56 +0000

[diff] [blame]

177

Mohammed Suhail Munshi

bc5c407

2022-04-27 13:49:51 +0100

[diff] [blame]

178

// Define transposed shapes

179

TensorShape a_transposed_shape(a.shape().y(), a.shape().x());

180

TensorShape b_transposed_shape(b.shape().y(), b.shape().x());

181

182

// Define transposed tensors

183

SimpleTensor<T> a_transposed{ a_transposed_shape, data_type };

184

SimpleTensor<T> b_transposed{ b_transposed_shape, data_type };

185

186

// pretranspose a if necessary

187

if(pretranspose_a)

188

{

189

transpose_matrix<T>(a, a_transposed);

190

}

191

192

// pretranspose b if necessary

193

if(pretranspose_b)

194

{

195

transpose_matrix<T>(b, b_transposed);

196

}

197

Gian Marco Iodice

2019-07-29 14:27:16 +0100

[diff] [blame]

198

// Setting beta to 0 will effectively disable C for the

199

// computation of the reference: alpha * A * B + 0 * C

Mohammed Suhail Munshi

bc5c407

2022-04-27 13:49:51 +0100

[diff] [blame]

200

// Use transposed tensors if boolean enabled else use original tensors

201

return reference::gemm<T>((pretranspose_a) ? a_transposed : a, (pretranspose_b) ? b_transposed : b, c, alpha, disable_c ? 0.f : beta);

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

202

}

203

204

TensorType _target{};

205

SimpleTensor<T> _reference{};

Moritz Pflanzer

2017-08-02 14:51:36 +0100

[diff] [blame]

206

};

207

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

208

template <typename TensorType, typename AccessorType, typename T, typename GEMMOperatorType>

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

209

class GEMMMatrixMultiplyValidationFixture : public framework::Fixture

210

{

211

public:

212

template <typename...>

213

void setup(unsigned int m, unsigned int n, unsigned int k, unsigned int batch_size, float alpha, float beta, bool broadcast_bias, bool fp16_mixed_precision, const ActivationLayerInfo &act_info,

214

DataType data_type, GPUTarget gpu_arch)

215

{

216

// Set the tensor shapes for LHS and RHS matrices

217

const TensorShape lhs_shape(k, m, batch_size);

218

const TensorShape rhs_shape(n, k, batch_size);

219

const TensorShape bias_shape(n,

220

broadcast_bias ? 1 : m,

221

broadcast_bias ? 1 : batch_size);

222

223

_target = compute_target(lhs_shape, rhs_shape, bias_shape, data_type, alpha, beta, broadcast_bias, fp16_mixed_precision, act_info, gpu_arch);

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

224

_reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, broadcast_bias, act_info);

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

}

protected:

template <typename U>

229

void fill(U &&tensor, int i)

230

{

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

231

static_assert(std::is_floating_point<T>::value || std::is_same<T, half>::value, "Only floating point data types supported.");

Giorgio Arena

2021-01-08 10:37:15 +0000

[diff] [blame]

232

using DistributionType = typename std::conditional<std::is_same<T, half>::value, arm_compute::utils::uniform_real_distribution_16bit<T>, std::uniform_real_distribution<T>>::type;

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

233

234

DistributionType distribution{ T(-1.0f), T(1.0f) };

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

235

library->fill(tensor, distribution, i);

236

237

// Fill border with infinity in order to check the presence of NaN values (i.e. inf * 0)

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

238

DistributionType distribution_inf{ T(std::numeric_limits<float>::infinity()), T(std::numeric_limits<float>::infinity()) };

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

239

library->fill_borders_with_garbage(tensor, distribution_inf, i);

240

}

241

242

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, DataType data_type, float alpha, float beta, bool broadcast_bias,

243

bool fp16_mixed_precision, const ActivationLayerInfo &act_info, GPUTarget gpu_arch)

244

{

245

// Create tensors

246

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

247

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

248

TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);

249

TensorType dst;

250

251

const unsigned int m = lhs_shape[1];

252

const unsigned int n = rhs_shape[0];

253

const unsigned int k = lhs_shape[0];

254

GEMMReshapeInfo reshape_info(m, n, k, 1, 1, 0, false, broadcast_bias);

255

256

// The output tensor will be auto-initialized within the function

257

258

// Create and configure function

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

259

GEMMOperatorType gemm;

260

gemm.configure(gpu_arch, lhs.info(), rhs.info(), bias.info(), dst.info(), alpha, beta, false, reshape_info, fp16_mixed_precision, act_info);

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

261

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

262

ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());

263

ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());

264

ARM_COMPUTE_ASSERT(bias.info()->is_resizable());

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

265

Giorgio Arena

2021-03-25 14:54:50 +0000

[diff] [blame]

266

add_padding_x({ &lhs, &rhs, &bias, &dst });

267

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

268

// Allocate tensors

269

lhs.allocator()->allocate();

270

rhs.allocator()->allocate();

271

bias.allocator()->allocate();

272

dst.allocator()->allocate();

273

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

274

ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());

275

ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());

276

ARM_COMPUTE_ASSERT(!bias.info()->is_resizable());

277

ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

278

279

// Fill tensors

280

fill(AccessorType(lhs), 0);

281

fill(AccessorType(rhs), 1);

282

fill(AccessorType(bias), 2);

283

284

// Compute GEMM

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

285

ITensorPack gemm_pack({ { ACL_SRC_0, &lhs },

286

{ ACL_SRC_1, &rhs },

287

{ ACL_SRC_2, &bias },

288

{ ACL_DST, &dst }

289

});

290

gemm.run(gemm_pack);

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

return dst;

}

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

295

SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, bool broadcast_bias,

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

296

const ActivationLayerInfo &act_info)

297

{

298

TensorShape dst_shape = lhs_shape;

299

dst_shape[0] = rhs_shape[0];

300

dst_shape[1] = lhs_shape[1];

301

302

// Create reference

303

SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };

304

SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };

305

SimpleTensor<T> bias{ dst_shape, data_type, 1 };

306

307

const int n = rhs_shape[0];

308

const int m = lhs_shape[1];

309

const int batch_size = lhs_shape[2];

// Fill reference

fill(lhs, 0);

fill(rhs, 1);

fill(bias, 2);

if(broadcast_bias)

{

Gunes Bayir

2021-12-10 16:17:56 +0000

[diff] [blame]

318

// In case of broadcast, we need to simply copy the first into the following "M" ones

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

319

for(int i = 1; i < m * batch_size; i++)

320

{

321

memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));

}

}

return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);

326

}

327

328

TensorType _target{};

329

SimpleTensor<T> _reference{};

330

};

331

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

332

template <typename TensorType, typename AccessorType, typename T, typename GEMMOperatorType>

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

333

class GEMMMatrixMultiply3DValidationFixture : public framework::Fixture

334

{

335

public:

336

template <typename...>

337

void setup(unsigned int m_w, unsigned int m_h, unsigned int n, unsigned int k, unsigned int batch_size, float alpha, float beta, bool broadcast_bias, bool fp16_mixed_precision,

338

const ActivationLayerInfo &act_info, DataType data_type, GPUTarget gpu_arch)

339

{

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

340

ARM_COMPUTE_UNUSED(broadcast_bias);

341

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

342

// In case of GEMM3D, m is the product between m_w and m_h

343

const unsigned int m = m_w * m_h;

344

345

// Set the tensor shapes for LHS and RHS matrices

346

const TensorShape lhs_shape(k, m, batch_size);

347

const TensorShape rhs_shape(n, k, batch_size);

348

const TensorShape bias_shape(n, 1, 1);

349

350

_target = compute_target(lhs_shape, rhs_shape, bias_shape, data_type, alpha, beta, m_h, fp16_mixed_precision, act_info, gpu_arch);

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

351

_reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, m_h, act_info);

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

}

protected:

template <typename U>

356

void fill(U &&tensor, int i)

357

{

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

358

static_assert(std::is_floating_point<T>::value || std::is_same<T, half>::value, "Only floating point data types supported.");

Giorgio Arena

2021-01-08 10:37:15 +0000

[diff] [blame]

359

using DistributionType = typename std::conditional<std::is_same<T, half>::value, arm_compute::utils::uniform_real_distribution_16bit<T>, std::uniform_real_distribution<T>>::type;

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

360

361

DistributionType distribution{ T(-1.0f), T(1.0f) };

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

362

library->fill(tensor, distribution, i);

363

}

364

365

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, DataType data_type, float alpha, float beta, unsigned int m_h,

366

bool fp16_mixed_precision, const ActivationLayerInfo &act_info, GPUTarget gpu_arch)

367

{

368

// Create tensors

369

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

370

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

371

TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);

372

TensorType dst;

373

374

const unsigned int m = lhs_shape[1];

375

const unsigned int n = rhs_shape[0];

376

const unsigned int k = lhs_shape[0];

377

GEMMReshapeInfo reshape_info(m, n, k, 1, 1, m_h, false, true);

378

379

// The output tensor will be auto-initialized within the function

380

381

// Create and configure function

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

382

GEMMOperatorType gemm;

383

gemm.configure(gpu_arch, lhs.info(), rhs.info(), bias.info(), dst.info(), alpha, beta, false, reshape_info, fp16_mixed_precision, act_info);

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

384

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

385

ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());

386

ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());

387

ARM_COMPUTE_ASSERT(bias.info()->is_resizable());

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

388

Giorgio Arena

2021-03-25 14:54:50 +0000

[diff] [blame]

389

add_padding_x({ &lhs, &rhs, &bias, &dst });

390

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

391

// Allocate tensors

392

lhs.allocator()->allocate();

393

rhs.allocator()->allocate();

394

bias.allocator()->allocate();

395

dst.allocator()->allocate();

396

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

397

ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());

398

ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());

399

ARM_COMPUTE_ASSERT(!bias.info()->is_resizable());

400

ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

401

402

// Fill tensors

403

fill(AccessorType(lhs), 0);

404

fill(AccessorType(rhs), 1);

405

fill(AccessorType(bias), 2);

406

407

// Compute GEMM

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

408

ITensorPack gemm_pack({ { ACL_SRC_0, &lhs },

409

{ ACL_SRC_1, &rhs },

410

{ ACL_SRC_2, &bias },

411

{ ACL_DST, &dst }

412

});

413

gemm.run(gemm_pack);

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

return dst;

}

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

418

SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, unsigned int m_h,

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

419

const ActivationLayerInfo &act_info)

420

{

421

TensorShape dst_shape = lhs_shape;

422

dst_shape.set(0, rhs_shape[0]);

423

dst_shape.set(1, lhs_shape[1] / m_h);

424

dst_shape.set(2, m_h);

425

dst_shape.set(3, lhs_shape[2]);

426

427

// Create reference

428

SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };

429

SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };

430

SimpleTensor<T> bias{ dst_shape, data_type, 1 };

431

432

const int n = rhs_shape[0];

433

const int m = lhs_shape[1];

434

const int batch_size = lhs_shape[2];

// Fill reference

fill(lhs, 0);

fill(rhs, 1);

fill(bias, 2);

Gunes Bayir

2021-12-10 16:17:56 +0000

[diff] [blame]

441

// In case of broadcast, we need to simply copy the first into the following "M" ones

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

442

for(int i = 1; i < m * batch_size; i++)

443

{

444

memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));

445

}

446

447

return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);

448

}

449

450

TensorType _target{};

451

SimpleTensor<T> _reference{};

452

};

453

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

454

template <typename TensorType, typename AccessorType, typename T, typename ReshapeLHSOperatorType, typename ReshapeRHSOperatorType, typename GEMMOperatorType>

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

455

class GEMMMatrixMultiplyInterleavedTransposedValidationFixture : public framework::Fixture

456

{

457

public:

458

template <typename...>

459

void setup(unsigned int m, unsigned int n, unsigned int k, unsigned int batch_size, float alpha, float beta, unsigned int v0, unsigned int h0, bool broadcast_bias, bool fp16_mixed_precision,

460

const ActivationLayerInfo &act_info, DataType data_type, GPUTarget gpu_arch)

461

{

462

GEMMLHSMatrixInfo lhs_info;

lhs_info.m0 = 4;

lhs_info.k0 = 4;

lhs_info.v0 = v0;

lhs_info.interleave = true;

467

lhs_info.transpose = true;

468

469

GEMMRHSMatrixInfo rhs_info;

470

rhs_info.n0 = 16 / sizeof(T);

471

rhs_info.k0 = 1;

472

rhs_info.h0 = h0;

473

rhs_info.interleave = false;

474

rhs_info.transpose = false;

475

476

// Set the tensor shapes for LHS and RHS matrices

477

const TensorShape lhs_shape(k, m, batch_size);

478

const TensorShape rhs_shape(n, k, batch_size);

479

const TensorShape bias_shape(n,

480

broadcast_bias ? 1 : m,

481

broadcast_bias ? 1 : batch_size);

482

483

_target = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, broadcast_bias, fp16_mixed_precision, act_info, gpu_arch);

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

484

_reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, broadcast_bias, act_info);

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

}

protected:

template <typename U>

489

void fill(U &&tensor, int i)

490

{

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

491

static_assert(std::is_floating_point<T>::value || std::is_same<T, half>::value, "Only floating point data types supported.");

Giorgio Arena

2021-01-08 10:37:15 +0000

[diff] [blame]

492

using DistributionType = typename std::conditional<std::is_same<T, half>::value, arm_compute::utils::uniform_real_distribution_16bit<T>, std::uniform_real_distribution<T>>::type;

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

493

494

DistributionType distribution{ T(-1.0f), T(1.0f) };

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

495

library->fill(tensor, distribution, i);

496

497

// Fill border with infinity in order to check the presence of NaN values (i.e. inf * 0)

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

498

DistributionType distribution_inf{ T(std::numeric_limits<float>::infinity()), T(std::numeric_limits<float>::infinity()) };

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

499

library->fill_borders_with_garbage(tensor, distribution_inf, i);

500

}

501

502

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,

503

DataType data_type, float alpha, float beta, bool broadcast_bias, bool fp16_mixed_precision, const ActivationLayerInfo &act_info, GPUTarget gpu_arch)

504

{

505

// Create tensors

506

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

507

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

508

TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);

509

TensorType lhs_reshaped;

510

TensorType rhs_reshaped;

511

TensorType dst;

512

513

const unsigned int m = lhs_shape[1];

514

const unsigned int n = rhs_shape[0];

515

const unsigned int k = lhs_shape[0];

516

GEMMReshapeInfo reshape_info(m, n, k, rhs_info.h0, lhs_info.v0, 0, false, broadcast_bias);

517

518

// The output tensor will be auto-initialized within the function

519

520

// Create and configure function

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

521

ReshapeLHSOperatorType reshape_lhs;

522

ReshapeRHSOperatorType reshape_rhs;

523

GEMMOperatorType gemm;

524

reshape_lhs.configure(lhs.info(), lhs_reshaped.info(), lhs_info);

525

reshape_rhs.configure(rhs.info(), rhs_reshaped.info(), rhs_info);

526

gemm.configure(gpu_arch, lhs_reshaped.info(), rhs_reshaped.info(), bias.info(), dst.info(), alpha, beta, true, reshape_info, fp16_mixed_precision, act_info);

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

527

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

528

ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());

529

ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());

530

ARM_COMPUTE_ASSERT(bias.info()->is_resizable());

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

531

Georgios Pinitas

2021-04-13 13:35:58 +0100

[diff] [blame]

532

// We do not pad when using image as it needs to comply to strict pitch alignment restrictions

Giorgio Arena

2021-03-25 14:54:50 +0000

[diff] [blame]

533

if(!rhs_info.export_to_cl_image)

534

{

535

add_padding_x({ &lhs, &rhs, &lhs_reshaped, &rhs_reshaped, &bias, &dst });

536

}

537

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

538

// Allocate tensors

539

lhs.allocator()->allocate();

540

rhs.allocator()->allocate();

541

lhs_reshaped.allocator()->allocate();

542

rhs_reshaped.allocator()->allocate();

543

bias.allocator()->allocate();

544

dst.allocator()->allocate();

545

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

546

ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());

547

ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());

548

ARM_COMPUTE_ASSERT(!bias.info()->is_resizable());

549

ARM_COMPUTE_ASSERT(!lhs_reshaped.info()->is_resizable());

550

ARM_COMPUTE_ASSERT(!rhs_reshaped.info()->is_resizable());

551

ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

552

553

// Fill tensors

554

fill(AccessorType(lhs), 0);

555

fill(AccessorType(rhs), 1);

556

fill(AccessorType(bias), 2);

557

558

// Compute GEMM

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

559

ITensorPack reshape_lhs_pack = { { ACL_SRC, &lhs }, { ACL_DST, &lhs_reshaped } };

560

reshape_lhs.run(reshape_lhs_pack);

561

ITensorPack reshape_rhs_pack = { { ACL_SRC, &rhs }, { ACL_DST, &rhs_reshaped } };

562

reshape_rhs.run(reshape_rhs_pack);

563

ITensorPack gemm_pack({ { ACL_SRC_0, &lhs_reshaped },

564

{ ACL_SRC_1, &rhs_reshaped },

565

{ ACL_SRC_2, &bias },

566

{ ACL_DST, &dst }

567

});

568

gemm.run(gemm_pack);

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

return dst;

}

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

573

SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, bool broadcast_bias,

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

574

const ActivationLayerInfo &act_info)

575

{

576

TensorShape dst_shape = lhs_shape;

577

dst_shape[0] = rhs_shape[0];

578

dst_shape[1] = lhs_shape[1];

579

580

// Create reference

581

SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };

582

SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };

583

SimpleTensor<T> bias{ dst_shape, data_type, 1 };

584

585

const int n = rhs_shape[0];

586

const int m = lhs_shape[1];

587

const int batch_size = lhs_shape[2];

// Fill reference

fill(lhs, 0);

fill(rhs, 1);

fill(bias, 2);

if(broadcast_bias)

{

Gunes Bayir

2021-12-10 16:17:56 +0000

[diff] [blame]

596

// In case of broadcast, we need to simply copy the first into the following "M" ones

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

597

for(int i = 1; i < m * batch_size; i++)

598

{

599

memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));

}

}

return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);

604

}

605

606

TensorType _target{};

607

SimpleTensor<T> _reference{};

608

};

609

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

610

template <typename TensorType, typename AccessorType, typename T, typename ReshapeLHSOperatorType, typename ReshapeRHSOperatorType, typename GEMMOperatorType>

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

611

class GEMMMatrixMultiplyInterleavedTransposed3DValidationFixture : public framework::Fixture

612

{

613

public:

614

template <typename...>

615

void setup(unsigned int m_w, unsigned int m_h, unsigned int n, unsigned int k, unsigned int batch_size, float alpha, float beta, unsigned int v0, unsigned int h0, bool broadcast_bias,

616

bool fp16_mixed_precision, const ActivationLayerInfo &act_info, DataType data_type, GPUTarget gpu_arch)

617

{

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

618

ARM_COMPUTE_UNUSED(broadcast_bias);

619

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

620

GEMMLHSMatrixInfo lhs_info;

lhs_info.m0 = 4;

lhs_info.k0 = 4;

lhs_info.v0 = v0;

lhs_info.interleave = true;

625

lhs_info.transpose = true;

626

627

GEMMRHSMatrixInfo rhs_info;

628

rhs_info.n0 = 16 / sizeof(T);

629

rhs_info.k0 = 1;

630

rhs_info.h0 = h0;

631

rhs_info.interleave = false;

632

rhs_info.transpose = false;

633

634

// In case of GEMM3D, m is the product between m_w and m_h

635

const unsigned int m = m_w * m_h;

636

637

// Set the tensor shapes for LHS and RHS matrices

638

const TensorShape lhs_shape(k, m, batch_size);

639

const TensorShape rhs_shape(n, k, batch_size);

640

const TensorShape bias_shape(n, 1, 1);

641

642

_target = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, m_h, fp16_mixed_precision, act_info, gpu_arch);

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

643

_reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, m_h, act_info);

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

}

protected:

template <typename U>

648

void fill(U &&tensor, int i)

649

{

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

650

static_assert(std::is_floating_point<T>::value || std::is_same<T, half>::value, "Only floating point data types supported.");

Giorgio Arena

2021-01-08 10:37:15 +0000

[diff] [blame]

651

using DistributionType = typename std::conditional<std::is_same<T, half>::value, arm_compute::utils::uniform_real_distribution_16bit<T>, std::uniform_real_distribution<T>>::type;

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

652

653

DistributionType distribution{ T(-1.0f), T(1.0f) };

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

654

library->fill(tensor, distribution, i);

655

}

656

657

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,

658

DataType data_type, float alpha, float beta, unsigned int m_h, bool fp16_mixed_precision, const ActivationLayerInfo &act_info, GPUTarget gpu_arch)

659

{

660

// Create tensors

661

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

662

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

663

TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);

664

TensorType lhs_reshaped;

665

TensorType rhs_reshaped;

666

TensorType dst;

667

668

const unsigned int m = lhs_shape[1];

669

const unsigned int n = rhs_shape[0];

670

const unsigned int k = lhs_shape[0];

671

GEMMReshapeInfo reshape_info(m, n, k, rhs_info.h0, lhs_info.v0, m_h, false, true);

672

673

// The output tensor will be auto-initialized within the function

674

675

// Create and configure function

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

676

ReshapeLHSOperatorType reshape_lhs;

677

ReshapeRHSOperatorType reshape_rhs;

678

GEMMOperatorType gemm;

679

reshape_lhs.configure(lhs.info(), lhs_reshaped.info(), lhs_info);

680

reshape_rhs.configure(rhs.info(), rhs_reshaped.info(), rhs_info);

681

gemm.configure(gpu_arch, lhs_reshaped.info(), rhs_reshaped.info(), bias.info(), dst.info(), alpha, beta, true, reshape_info, fp16_mixed_precision, act_info);

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

682

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

683

ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());

684

ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());

685

ARM_COMPUTE_ASSERT(bias.info()->is_resizable());

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

686

Georgios Pinitas

2021-04-13 13:35:58 +0100

[diff] [blame]

687

// We do not pad when using image as it needs to comply to strict pitch alignment restrictions

Giorgio Arena

2021-03-25 14:54:50 +0000

[diff] [blame]

688

if(!rhs_info.export_to_cl_image)

689

{

690

add_padding_x({ &lhs, &rhs, &lhs_reshaped, &rhs_reshaped, &bias, &dst });

691

}

692

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

693

// Allocate tensors

694

lhs.allocator()->allocate();

695

rhs.allocator()->allocate();

696

lhs_reshaped.allocator()->allocate();

697

rhs_reshaped.allocator()->allocate();

698

bias.allocator()->allocate();

699

dst.allocator()->allocate();

700

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

701

ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());

702

ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());

703

ARM_COMPUTE_ASSERT(!lhs_reshaped.info()->is_resizable());

704

ARM_COMPUTE_ASSERT(!rhs_reshaped.info()->is_resizable());

705

ARM_COMPUTE_ASSERT(!bias.info()->is_resizable());

706

ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

707

708

// Fill tensors

709

fill(AccessorType(lhs), 0);

710

fill(AccessorType(rhs), 1);

711

fill(AccessorType(bias), 2);

712

713

// Compute GEMM

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

714

ITensorPack reshape_lhs_pack = { { ACL_SRC, &lhs }, { ACL_DST, &lhs_reshaped } };

715

reshape_lhs.run(reshape_lhs_pack);

716

ITensorPack reshape_rhs_pack = { { ACL_SRC, &rhs }, { ACL_DST, &rhs_reshaped } };

717

reshape_rhs.run(reshape_rhs_pack);

718

ITensorPack gemm_pack({ { ACL_SRC_0, &lhs_reshaped },

719

{ ACL_SRC_1, &rhs_reshaped },

720

{ ACL_SRC_2, &bias },

721

{ ACL_DST, &dst }

722

});

723

gemm.run(gemm_pack);

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

return dst;

}

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

728

SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, unsigned int m_h,

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

729

const ActivationLayerInfo &act_info)

730

{

731

TensorShape dst_shape = lhs_shape;

732

dst_shape.set(0, rhs_shape[0]);

733

dst_shape.set(1, lhs_shape[1] / m_h);

734

dst_shape.set(2, m_h);

735

dst_shape.set(3, lhs_shape[2]);

736

737

// Create reference

738

SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };

739

SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };

740

SimpleTensor<T> bias{ dst_shape, data_type, 1 };

741

742

const int n = rhs_shape[0];

743

const int m = lhs_shape[1];

744

const int batch_size = lhs_shape[2];

// Fill reference

fill(lhs, 0);

fill(rhs, 1);

fill(bias, 2);

Gunes Bayir

2021-12-10 16:17:56 +0000

[diff] [blame]

751

// In case of broadcast, we need to simply copy the first into the following "M" ones

Gian Marco Iodice

2019-07-19 09:54:47 +0100

[diff] [blame]

752

for(int i = 1; i < m * batch_size; i++)

753

{

754

memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));

755

}

756

757

return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);

758

}

759

760

TensorType _target{};

761

SimpleTensor<T> _reference{};

762

};

763

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

764

template <typename TensorType, typename AccessorType, typename T, typename ReshapeLHSOperatorType, typename ReshapeRHSOperatorType, typename GEMMOperatorType, bool fp_mixed_precision = false>

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

765

class GEMMMatrixMultiplyReshapedValidationFixture : public framework::Fixture

766

{

767

public:

768

template <typename...>

769

void setup(unsigned int m, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0, unsigned int v0, unsigned int h0, bool interleave_lhs,

Gian Marco Iodice

2020-06-10 17:59:30 +0100

[diff] [blame]

770

bool interleave_rhs, bool export_to_cl_image, DataType data_type, float alpha, float beta, bool broadcast_bias, bool lhs_transpose, const ActivationLayerInfo &act_info)

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

771

{

772

GEMMLHSMatrixInfo lhs_info;

lhs_info.m0 = m0;

lhs_info.k0 = k0;

lhs_info.v0 = v0;

lhs_info.interleave = interleave_lhs;

Giorgio Arena

ae99b6e

2019-08-01 14:22:12 +0100

[diff] [blame]

777

lhs_info.transpose = lhs_transpose;

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

778

779

GEMMRHSMatrixInfo rhs_info;

Gian Marco Iodice

2020-06-10 17:59:30 +0100

[diff] [blame]

rhs_info.n0 = n0;

rhs_info.k0 = k0;

rhs_info.h0 = h0;

rhs_info.interleave = interleave_rhs;

784

rhs_info.transpose = !lhs_transpose;

785

rhs_info.export_to_cl_image = export_to_cl_image;

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

786

787

// Set the tensor shapes for LHS and RHS matrices

788

const TensorShape lhs_shape(k, m, batch_size);

789

const TensorShape rhs_shape(n, k, batch_size);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

790

const TensorShape bias_shape(n,

791

broadcast_bias ? 1 : m,

792

broadcast_bias ? 1 : batch_size);

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

793

Sheri Zhang

2020-11-16 21:17:28 +0000

[diff] [blame]

794

_target = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, broadcast_bias, act_info);

795

if(validate_result)

796

{

797

_reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, broadcast_bias, act_info);

798

}

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

}

protected:

template <typename U>

803

void fill(U &&tensor, int i)

804

{

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

805

static_assert(std::is_floating_point<T>::value || std::is_same<T, half>::value, "Only floating point data types supported.");

Giorgio Arena

2021-01-08 10:37:15 +0000

[diff] [blame]

806

using DistributionType = typename std::conditional<std::is_same<T, half>::value, arm_compute::utils::uniform_real_distribution_16bit<T>, std::uniform_real_distribution<T>>::type;

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

807

808

DistributionType distribution{ T(-1.0f), T(1.0f) };

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

809

library->fill(tensor, distribution, i);

Gian Marco Iodice

b87b95e

2019-01-21 17:14:31 +0000

[diff] [blame]

810

811

// Fill border with infinity in order to check the presence of NaN values (i.e. inf * 0)

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

812

DistributionType distribution_inf{ T(std::numeric_limits<float>::infinity()), T(std::numeric_limits<float>::infinity()) };

Gian Marco Iodice

b87b95e

2019-01-21 17:14:31 +0000

[diff] [blame]

813

library->fill_borders_with_garbage(tensor, distribution_inf, i);

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

814

}

815

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

816

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

817

DataType data_type, float alpha, float beta, bool broadcast_bias, const ActivationLayerInfo &act_info)

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

818

{

819

// Create tensors

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

820

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

821

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

822

TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

823

TensorType lhs_reshaped;

824

TensorType rhs_reshaped;

825

TensorType dst;

826

827

const unsigned int M = lhs_shape[1];

828

const unsigned int N = rhs_shape[0];

829

const unsigned int K = lhs_shape[0];

Gian Marco Iodice

2019-06-26 17:18:11 +0100

[diff] [blame]

830

GEMMKernelInfo kernel_info;

kernel_info.m = M;

kernel_info.n = N;

kernel_info.k = K;

kernel_info.depth_output_gemm3d = 0;

835

kernel_info.reinterpret_input_as_3d = false;

836

kernel_info.broadcast_bias = broadcast_bias;

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

837

kernel_info.activation_info = act_info;

Gian Marco Iodice

0c17aa2

2019-09-27 09:23:15 +0100

[diff] [blame]

838

kernel_info.fp_mixed_precision = fp_mixed_precision;

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

839

840

// The output tensor will be auto-initialized within the function

841

842

// Create and configure function

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

843

ReshapeLHSOperatorType reshape_lhs;

844

ReshapeRHSOperatorType reshape_rhs;

845

GEMMOperatorType gemm;

Sheri Zhang

2020-11-16 21:17:28 +0000

[diff] [blame]

846

847

validate_result = bool(reshape_rhs.validate(rhs.info(), rhs_reshaped.info(), rhs_info));

848

validate_result = validate_result || !rhs_info.export_to_cl_image;

if(!validate_result)

{

return nullptr;

}

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

854

reshape_lhs.configure(lhs.info(), lhs_reshaped.info(), lhs_info);

855

reshape_rhs.configure(rhs.info(), rhs_reshaped.info(), rhs_info);

856

gemm.configure(lhs_reshaped.info(), rhs_reshaped.info(), bias.info(), dst.info(), alpha, beta, lhs_info, rhs_info, kernel_info);

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

857

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

858

ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());

859

ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());

860

ARM_COMPUTE_ASSERT(bias.info()->is_resizable());

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

861

Georgios Pinitas

2021-04-13 13:35:58 +0100

[diff] [blame]

862

// We do not pad when using image as it needs to comply to strict pitch alignment restrictions

Giorgio Arena

2021-03-25 14:54:50 +0000

[diff] [blame]

863

if(!rhs_info.export_to_cl_image)

864

{

865

add_padding_x({ &lhs, &rhs, &lhs_reshaped, &rhs_reshaped, &bias, &dst });

866

}

867

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

868

// Allocate tensors

869

lhs.allocator()->allocate();

870

rhs.allocator()->allocate();

871

lhs_reshaped.allocator()->allocate();

872

rhs_reshaped.allocator()->allocate();

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

873

bias.allocator()->allocate();

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

874

dst.allocator()->allocate();

875

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

876

ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());

877

ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());

878

ARM_COMPUTE_ASSERT(!bias.info()->is_resizable());

879

ARM_COMPUTE_ASSERT(!lhs_reshaped.info()->is_resizable());

880

ARM_COMPUTE_ASSERT(!rhs_reshaped.info()->is_resizable());

881

ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

882

883

// Fill tensors

884

fill(AccessorType(lhs), 0);

885

fill(AccessorType(rhs), 1);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

886

fill(AccessorType(bias), 2);

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

887

888

// Compute GEMM

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

889

ITensorPack reshape_lhs_pack = { { ACL_SRC, &lhs }, { ACL_DST, &lhs_reshaped } };

890

reshape_lhs.run(reshape_lhs_pack);

891

ITensorPack reshape_rhs_pack = { { ACL_SRC, &rhs }, { ACL_DST, &rhs_reshaped } };

892

reshape_rhs.run(reshape_rhs_pack);

893

ITensorPack gemm_pack({ { ACL_SRC_0, &lhs_reshaped },

894

{ ACL_SRC_1, &rhs_reshaped },

895

{ ACL_SRC_2, &bias },

896

{ ACL_DST, &dst }

897

});

898

gemm.run(gemm_pack);

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

return dst;

}

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

903

SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, bool broadcast_bias,

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

904

const ActivationLayerInfo &act_info)

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

905

{

906

TensorShape dst_shape = lhs_shape;

907

dst_shape[0] = rhs_shape[0];

908

dst_shape[1] = lhs_shape[1];

909

910

// Create reference

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

911

SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };

912

SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

913

SimpleTensor<T> bias{ dst_shape, data_type, 1 };

914

915

const int n = rhs_shape[0];

916

const int m = lhs_shape[1];

917

const int batch_size = lhs_shape[2];

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

// Fill reference

fill(lhs, 0);

fill(rhs, 1);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

922

fill(bias, 2);

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

923

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

924

if(broadcast_bias)

925

{

Gunes Bayir

2021-12-10 16:17:56 +0000

[diff] [blame]

926

// In case of broadcast, we need to simply copy the first into the following "M" ones

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

927

for(int i = 1; i < m * batch_size; i++)

928

{

929

memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));

}

}

Gian Marco Iodice

2019-09-27 09:23:15 +0100

[diff] [blame]

933

if(fp_mixed_precision)

934

{

935

return reference::activation_layer(reference::gemm_mixed_precision<T>(lhs, rhs, bias, alpha, beta), act_info);

}

else

{

return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);

940

}

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

941

}

942

Sheri Zhang

2020-11-16 21:17:28 +0000

[diff] [blame]

943

bool validate_result = true;

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

944

TensorType _target{};

945

SimpleTensor<T> _reference{};

946

};

947

SiCongLi

1af5416

2021-10-06 15:25:57 +0100

[diff] [blame]

948

/** (EXPERIMENTAL_POST_OPS)*/

949

template <typename TensorType, typename AccessorType, typename T, typename ReshapeLHSOperatorType, typename ReshapeRHSOperatorType, typename GEMMOperatorType, bool fp_mixed_precision = false>

950

class GEMMMatrixMultiplyReshapedWithPostOpsValidationFixture : public framework::Fixture

951

{

952

public:

953

using PostOpArgBroadcast = std::tuple<bool, bool, bool>; // Instruct fixture if we need broadcasting in dimension 0, 1, 2 of each PostOp argument

954

public:

955

template <typename...>

956

void setup(unsigned int m, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0, unsigned int v0, unsigned int h0, bool interleave_lhs,

957

bool interleave_rhs, bool export_to_cl_image, DataType data_type, float alpha, float beta, bool broadcast_bias, bool lhs_transpose, const ActivationLayerInfo &act_info,

958

const experimental::PostOpList<PostOpArgBroadcast> &post_ops)

959

{

960

GEMMLHSMatrixInfo lhs_info;

lhs_info.m0 = m0;

lhs_info.k0 = k0;

lhs_info.v0 = v0;

lhs_info.interleave = interleave_lhs;

965

lhs_info.transpose = lhs_transpose;

966

967

GEMMRHSMatrixInfo rhs_info;

rhs_info.n0 = n0;

rhs_info.k0 = k0;

rhs_info.h0 = h0;

rhs_info.interleave = interleave_rhs;

972

rhs_info.transpose = !lhs_transpose;

973

rhs_info.export_to_cl_image = export_to_cl_image;

974

975

// Set the tensor shapes for LHS and RHS matrices

976

const TensorShape lhs_shape(k, m, batch_size);

977

const TensorShape rhs_shape(n, k, batch_size);

978

const TensorShape bias_shape(n,

979

broadcast_bias ? 1 : m,

980

broadcast_bias ? 1 : batch_size);

981

auto post_ops_with_shapes = experimental::transform_post_op_list_arguments<PostOpArgBroadcast, TensorShape>(post_ops,

982

[ = ](auto broadcast)

{

return TensorShape

{

std::get<0>(broadcast) ? 1 : n,

987

std::get<1>(broadcast) ? 1 : m,

988

std::get<2>(broadcast) ? 1 : batch_size,

};

});

_target = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, broadcast_bias, act_info, post_ops_with_shapes);

993

if(validate_result)

994

{

995

_reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, broadcast_bias, act_info, post_ops_with_shapes);

}

}

protected:

template <typename U>

1001

void fill(U &&tensor, int i)

1002

{

1003

static_assert(std::is_floating_point<T>::value || std::is_same<T, half>::value, "Only floating point data types supported.");

1004

using DistributionType = typename std::conditional<std::is_same<T, half>::value, arm_compute::utils::uniform_real_distribution_16bit<T>, std::uniform_real_distribution<T>>::type;

1005

1006

DistributionType distribution{ T(-1.0f), T(1.0f) };

1007

library->fill(tensor, distribution, i);

1008

1009

// Fill border with infinity in order to check the presence of NaN values (i.e. inf * 0)

1010

DistributionType distribution_inf{ T(std::numeric_limits<float>::infinity()), T(std::numeric_limits<float>::infinity()) };

1011

library->fill_borders_with_garbage(tensor, distribution_inf, i);

1012

}

1013

1014

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,

1015

DataType data_type, float alpha, float beta, bool broadcast_bias, const ActivationLayerInfo &act_info, const experimental::PostOpList<TensorShape> &post_ops)

1016

{

1017

// Create tensors

1018

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

1019

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

1020

TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);

1021

1022

// Create post op tensors and populate post op with them

1023

std::vector<TensorType> post_op_tensors_holder{};

1024

auto populated_post_ops = experimental::transform_post_op_list_arguments<TensorShape, ITensorInfo *>(post_ops,

1025

[&post_op_tensors_holder, &data_type](auto shape)

1026

{

1027

auto t = create_tensor<TensorType>(shape, data_type, 1);

1028

post_op_tensors_holder.push_back(std::move(t));

1029

return post_op_tensors_holder.back().info();

1030

});

1031

TensorType lhs_reshaped;

1032

TensorType rhs_reshaped;

1033

TensorType dst;

1034

1035

const unsigned int M = lhs_shape[1];

1036

const unsigned int N = rhs_shape[0];

1037

const unsigned int K = lhs_shape[0];

1038

GEMMKernelInfo kernel_info;

kernel_info.m = M;

kernel_info.n = N;

kernel_info.k = K;

kernel_info.depth_output_gemm3d = 0;

1043

kernel_info.reinterpret_input_as_3d = false;

1044

kernel_info.broadcast_bias = broadcast_bias;

1045

kernel_info.activation_info = act_info;

1046

kernel_info.fp_mixed_precision = fp_mixed_precision;

1047

kernel_info.post_ops = populated_post_ops;

1048

1049

// The output tensor will be auto-initialized within the function

1050

1051

// Create and configure function

1052

ReshapeLHSOperatorType reshape_lhs;

1053

ReshapeRHSOperatorType reshape_rhs;

1054

GEMMOperatorType gemm;

1055

1056

validate_result = bool(reshape_rhs.validate(rhs.info(), rhs_reshaped.info(), rhs_info));

1057

validate_result = validate_result || !rhs_info.export_to_cl_image;

if(!validate_result)

{

return nullptr;

}

reshape_lhs.configure(lhs.info(), lhs_reshaped.info(), lhs_info);

1064

reshape_rhs.configure(rhs.info(), rhs_reshaped.info(), rhs_info);

1065

gemm.configure(lhs_reshaped.info(), rhs_reshaped.info(), bias.info(), dst.info(), alpha, beta, lhs_info, rhs_info, kernel_info);

1066

1067

ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());

1068

ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());

1069

ARM_COMPUTE_ASSERT(bias.info()->is_resizable());

1070

for(const auto &tensor : post_op_tensors_holder)

1071

{

1072

ARM_COMPUTE_ASSERT(tensor.info()->is_resizable());

1073

}

1074

1075

// We do not pad when using image as it needs to comply to strict pitch alignment restrictions

1076

if(!rhs_info.export_to_cl_image)

1077

{

1078

add_padding_x({ &lhs, &rhs, &lhs_reshaped, &rhs_reshaped, &bias, &dst });

1079

for(auto &tensor : post_op_tensors_holder)

1080

{

1081

add_padding_x({ &tensor });

}

}

// Allocate tensors

lhs.allocator()->allocate();

1087

rhs.allocator()->allocate();

1088

lhs_reshaped.allocator()->allocate();

1089

rhs_reshaped.allocator()->allocate();

1090

bias.allocator()->allocate();

1091

dst.allocator()->allocate();

1092

for(auto &tensor : post_op_tensors_holder)

1093

{

1094

tensor.allocator()->allocate();

1095

}

1096

1097

ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());

1098

ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());

1099

ARM_COMPUTE_ASSERT(!bias.info()->is_resizable());

1100

ARM_COMPUTE_ASSERT(!lhs_reshaped.info()->is_resizable());

1101

ARM_COMPUTE_ASSERT(!rhs_reshaped.info()->is_resizable());

1102

ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());

1103

for(const auto &tensor : post_op_tensors_holder)

1104

{

1105

ARM_COMPUTE_ASSERT(!tensor.info()->is_resizable());

}

// Fill tensors

fill(AccessorType(lhs), 0);

1110

fill(AccessorType(rhs), 1);

1111

fill(AccessorType(bias), 2);

1112

for(size_t i = 0; i < post_op_tensors_holder.size(); ++i)

1113

{

1114

fill(AccessorType(post_op_tensors_holder.at(i)), 3 + i);

}

// Compute GEMM

ITensorPack reshape_lhs_pack = { { ACL_SRC, &lhs }, { ACL_DST, &lhs_reshaped } };

1119

reshape_lhs.run(reshape_lhs_pack);

1120

ITensorPack reshape_rhs_pack = { { ACL_SRC, &rhs }, { ACL_DST, &rhs_reshaped } };

1121

reshape_rhs.run(reshape_rhs_pack);

1122

ITensorPack gemm_pack({ { ACL_SRC_0, &lhs_reshaped },

1123

{ ACL_SRC_1, &rhs_reshaped },

1124

{ ACL_SRC_2, &bias },

1125

{ ACL_DST, &dst }

1126

});

1127

for(size_t i = 0; i < post_op_tensors_holder.size(); ++i)

1128

{

1129

gemm_pack.add_tensor(experimental::get_post_op_arg_type(i), &post_op_tensors_holder.at(i));

}

gemm.run(gemm_pack);

return dst;

}

SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, bool broadcast_bias,

1137

const ActivationLayerInfo &act_info, const experimental::PostOpList<TensorShape> &post_ops)

1138

{

1139

TensorShape dst_shape = lhs_shape;

1140

dst_shape[0] = rhs_shape[0];

1141

dst_shape[1] = lhs_shape[1];

1142

1143

// Create reference

1144

SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };

1145

SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };

1146

SimpleTensor<T> bias{ dst_shape, data_type, 1 };

1147

// Create post op tensors and populate post op with them

1148

auto populated_post_ops = experimental::transform_post_op_list_arguments<TensorShape, SimpleTensor<T>>(post_ops, [&data_type](auto shape)

1149

{

1150

return SimpleTensor<T> { shape, data_type, 1 };

1151

});

1152

1153

const int n = rhs_shape[0];

1154

const int m = lhs_shape[1];

1155

const int batch_size = lhs_shape[2];

// Fill reference

int tensor_idx = 0;

fill(lhs, tensor_idx++);

1160

fill(rhs, tensor_idx++);

1161

fill(bias, tensor_idx++);

1162

for(auto &op : populated_post_ops.get_list())

1163

{

1164

for(auto tensor : op->arguments())

1165

{

1166

fill(*tensor, tensor_idx++);

}

}

if(broadcast_bias)

{

Gunes Bayir

2021-12-10 16:17:56 +0000

[diff] [blame]

1172

// In case of broadcast, we need to simply copy the first into the following "M" ones

SiCongLi

1af5416

2021-10-06 15:25:57 +0100

[diff] [blame]

1173

for(int i = 1; i < m * batch_size; i++)

1174

{

1175

memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));

}

}

SimpleTensor<T> out;

if(fp_mixed_precision)

1181

{

1182

out = reference::gemm_mixed_precision<T>(lhs, rhs, bias, alpha, beta);

}

else

{

out = reference::gemm<T>(lhs, rhs, bias, alpha, beta);

1187

}

1188

// Ignore activation info if post ops are used instead

1189

if(populated_post_ops.size() > 0)

1190

{

1191

out = reference::post_ops<T>(out, populated_post_ops);

}

else

{

out = reference::activation_layer(out, act_info);

}

return out;

}

bool validate_result = true;

1201

TensorType _target{};

1202

SimpleTensor<T> _reference{};

1203

};

1204

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1205

template <typename TensorType, typename AccessorType, typename T, typename ReshapeLHSOperatorType, typename ReshapeRHSOperatorType, typename GEMMOperatorType, bool fp_mixed_precision = false>

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

1206

class GEMMMatrixMultiplyReshaped3DValidationFixture : public framework::Fixture

1207

{

1208

public:

1209

template <typename...>

1210

void setup(unsigned int m_w, unsigned int m_h, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0, unsigned int v0, unsigned int h0,

Gian Marco Iodice

2020-06-10 17:59:30 +0100

[diff] [blame]

1211

bool interleave_lhs, bool interleave_rhs, bool export_to_cl_image, DataType data_type, float alpha, float beta, bool lhs_transpose, const ActivationLayerInfo &act_info)

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

1212

{

1213

GEMMLHSMatrixInfo lhs_info;

lhs_info.m0 = m0;

lhs_info.k0 = k0;

lhs_info.v0 = v0;

lhs_info.interleave = interleave_lhs;

Giorgio Arena

ae99b6e

2019-08-01 14:22:12 +0100

[diff] [blame]

1218

lhs_info.transpose = lhs_transpose;

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

1219

1220

GEMMRHSMatrixInfo rhs_info;

Gian Marco Iodice

2020-06-10 17:59:30 +0100

[diff] [blame]

rhs_info.n0 = n0;

rhs_info.k0 = k0;

rhs_info.h0 = h0;

rhs_info.interleave = interleave_rhs;

1225

rhs_info.transpose = !lhs_transpose;

1226

rhs_info.export_to_cl_image = export_to_cl_image;

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

1227

1228

// In case of GEMM3D, m is the product between m_w and m_h

1229

const unsigned int m = m_w * m_h;

1230

1231

// Set the tensor shapes for LHS and RHS matrices

1232

const TensorShape lhs_shape(k, m, batch_size);

1233

const TensorShape rhs_shape(n, k, batch_size);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1234

const TensorShape bias_shape(n, 1, 1);

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

1235

Sheri Zhang

2020-11-16 21:17:28 +0000

[diff] [blame]

1236

_target = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, m_h, act_info);

1237

if(validate_result)

1238

{

1239

_reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, m_h, act_info);

1240

}

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

}

protected:

template <typename U>

1245

void fill(U &&tensor, int i)

1246

{

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

1247

static_assert(std::is_floating_point<T>::value || std::is_same<T, half>::value, "Only floating point data types supported.");

Giorgio Arena

2021-01-08 10:37:15 +0000

[diff] [blame]

1248

using DistributionType = typename std::conditional<std::is_same<T, half>::value, arm_compute::utils::uniform_real_distribution_16bit<T>, std::uniform_real_distribution<T>>::type;

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

1249

1250

DistributionType distribution{ T(-1.0f), T(1.0f) };

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

1251

library->fill(tensor, distribution, i);

1252

}

1253

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1254

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1255

DataType data_type, float alpha, float beta, unsigned int m_h, const ActivationLayerInfo &act_info)

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

1256

{

1257

// Create tensors

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1258

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

1259

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

1260

TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

1261

TensorType lhs_reshaped;

1262

TensorType rhs_reshaped;

1263

TensorType dst;

1264

1265

const unsigned int M = lhs_shape[1];

1266

const unsigned int N = rhs_shape[0];

1267

const unsigned int K = lhs_shape[0];

Gian Marco Iodice

2019-06-26 17:18:11 +0100

[diff] [blame]

1268

GEMMKernelInfo kernel_info;

kernel_info.m = M;

kernel_info.n = N;

kernel_info.k = K;

kernel_info.depth_output_gemm3d = m_h;

1273

kernel_info.reinterpret_input_as_3d = false;

1274

kernel_info.broadcast_bias = true;

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1275

kernel_info.activation_info = act_info;

Gian Marco Iodice

0c17aa2

2019-09-27 09:23:15 +0100

[diff] [blame]

1276

kernel_info.fp_mixed_precision = fp_mixed_precision;

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

1277

1278

// The output tensor will be auto-initialized within the function

1279

1280

// Create and configure function

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1281

ReshapeLHSOperatorType reshape_lhs;

1282

ReshapeRHSOperatorType reshape_rhs;

1283

GEMMOperatorType gemm;

Sheri Zhang

2020-11-16 21:17:28 +0000

[diff] [blame]

1284

1285

validate_result = bool(reshape_rhs.validate(rhs.info(), rhs_reshaped.info(), rhs_info));

1286

validate_result = validate_result || !rhs_info.export_to_cl_image;

if(!validate_result)

{

return nullptr;

}

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1292

reshape_lhs.configure(lhs.info(), lhs_reshaped.info(), lhs_info);

1293

reshape_rhs.configure(rhs.info(), rhs_reshaped.info(), rhs_info);

1294

gemm.configure(lhs_reshaped.info(), rhs_reshaped.info(), bias.info(), dst.info(), alpha, beta, lhs_info, rhs_info, kernel_info);

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

1295

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

1296

ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());

1297

ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());

1298

ARM_COMPUTE_ASSERT(bias.info()->is_resizable());

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

1299

Georgios Pinitas

2021-04-13 13:35:58 +0100

[diff] [blame]

1300

// We do not pad when using image as it needs to comply to strict pitch alignment restrictions

Giorgio Arena

2021-03-25 14:54:50 +0000

[diff] [blame]

1301

if(!rhs_info.export_to_cl_image)

1302

{

1303

add_padding_x({ &lhs, &rhs, &lhs_reshaped, &rhs_reshaped, &bias, &dst });

1304

}

1305

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

1306

// Allocate tensors

1307

lhs.allocator()->allocate();

1308

rhs.allocator()->allocate();

1309

lhs_reshaped.allocator()->allocate();

1310

rhs_reshaped.allocator()->allocate();

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1311

bias.allocator()->allocate();

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

1312

dst.allocator()->allocate();

1313

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

1314

ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());

1315

ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());

1316

ARM_COMPUTE_ASSERT(!lhs_reshaped.info()->is_resizable());

1317

ARM_COMPUTE_ASSERT(!rhs_reshaped.info()->is_resizable());

1318

ARM_COMPUTE_ASSERT(!bias.info()->is_resizable());

1319

ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

1320

1321

// Fill tensors

1322

fill(AccessorType(lhs), 0);

1323

fill(AccessorType(rhs), 1);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1324

fill(AccessorType(bias), 2);

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

1325

1326

// Compute GEMM

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1327

ITensorPack reshape_lhs_pack = { { ACL_SRC, &lhs }, { ACL_DST, &lhs_reshaped } };

1328

reshape_lhs.run(reshape_lhs_pack);

1329

ITensorPack reshape_rhs_pack = { { ACL_SRC, &rhs }, { ACL_DST, &rhs_reshaped } };

1330

reshape_rhs.run(reshape_rhs_pack);

1331

ITensorPack gemm_pack({ { ACL_SRC_0, &lhs_reshaped },

1332

{ ACL_SRC_1, &rhs_reshaped },

1333

{ ACL_SRC_2, &bias },

1334

{ ACL_DST, &dst }

1335

});

1336

gemm.run(gemm_pack);

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

return dst;

}

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

1341

SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, unsigned int m_h,

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1342

const ActivationLayerInfo &act_info)

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

1343

{

1344

TensorShape dst_shape = lhs_shape;

1345

dst_shape.set(0, rhs_shape[0]);

1346

dst_shape.set(1, lhs_shape[1] / m_h);

1347

dst_shape.set(2, m_h);

1348

dst_shape.set(3, lhs_shape[2]);

1349

1350

// Create reference

1351

SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };

1352

SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1353

SimpleTensor<T> bias{ dst_shape, data_type, 1 };

1354

1355

const int n = rhs_shape[0];

1356

const int m = lhs_shape[1];

1357

const int batch_size = lhs_shape[2];

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

// Fill reference

fill(lhs, 0);

fill(rhs, 1);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1362

fill(bias, 2);

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

1363

Gunes Bayir

2021-12-10 16:17:56 +0000

[diff] [blame]

1364

// In case of broadcast, we need to simply copy the first into the following "M" ones

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1365

for(int i = 1; i < m * batch_size; i++)

1366

{

1367

memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));

1368

}

1369

Gian Marco Iodice

0c17aa2

2019-09-27 09:23:15 +0100

[diff] [blame]

1370

if(fp_mixed_precision)

1371

{

1372

return reference::activation_layer(reference::gemm_mixed_precision<T>(lhs, rhs, bias, alpha, beta), act_info);

}

else

{

return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);

1377

}

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

1378

}

1379

Sheri Zhang

2020-11-16 21:17:28 +0000

[diff] [blame]

1380

bool validate_result = true;

Gian Marco Iodice

2018-12-17 15:12:07 +0000

[diff] [blame]

1381

TensorType _target{};

1382

SimpleTensor<T> _reference{};

Gian Marco Iodice

2018-12-12 10:18:04 +0000

[diff] [blame]

1383

};

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1384

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1385

template <typename TensorType, typename AccessorType, typename T, typename ReshapeRHSOperatorType, typename GEMMOperatorType>

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1386

class GEMMMatrixMultiplyReshapedOnlyRHSValidationFixture : public framework::Fixture

1387

{

1388

public:

1389

template <typename...>

1390

void setup(unsigned int m, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0, unsigned int h0,

Gian Marco Iodice

781cba7

2020-06-19 16:56:57 +0100

[diff] [blame]

1391

bool interleave_rhs, bool transpose_rhs, bool export_to_cl_image, DataType data_type, float alpha, float beta, bool broadcast_bias, const ActivationLayerInfo &act_info)

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1392

{

1393

GEMMLHSMatrixInfo lhs_info;

lhs_info.m0 = m0;

lhs_info.k0 = k0;

GEMMRHSMatrixInfo rhs_info;

Gian Marco Iodice

781cba7

2020-06-19 16:56:57 +0100

[diff] [blame]

rhs_info.n0 = n0;

rhs_info.k0 = k0;

rhs_info.h0 = h0;

rhs_info.interleave = interleave_rhs;

1402

rhs_info.transpose = transpose_rhs;

1403

rhs_info.export_to_cl_image = export_to_cl_image;

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1404

1405

// Set the tensor shapes for LHS and RHS matrices

1406

const TensorShape lhs_shape(k, m, batch_size);

1407

const TensorShape rhs_shape(n, k, batch_size);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1408

const TensorShape bias_shape(n,

1409

broadcast_bias ? 1 : m,

1410

broadcast_bias ? 1 : batch_size);

Georgios Pinitas

2019-05-21 13:32:43 +0100

[diff] [blame]

1411

Sheri Zhang

2020-11-16 21:17:28 +0000

[diff] [blame]

1412

_target = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, broadcast_bias, act_info);

1413

if(validate_result)

1414

{

1415

_reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, broadcast_bias, act_info);

1416

}

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

}

protected:

template <typename U>

1421

void fill(U &&tensor, int i)

1422

{

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

1423

static_assert(std::is_floating_point<T>::value || std::is_same<T, half>::value, "Only floating point data types supported.");

Giorgio Arena

2021-01-08 10:37:15 +0000

[diff] [blame]

1424

using DistributionType = typename std::conditional<std::is_same<T, half>::value, arm_compute::utils::uniform_real_distribution_16bit<T>, std::uniform_real_distribution<T>>::type;

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

1425

1426

DistributionType distribution{ T(-1.0f), T(1.0f) };

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1427

library->fill(tensor, distribution, i);

1428

1429

// Fill border with infinity in order to check the presence of NaN values (i.e. inf * 0)

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

1430

DistributionType distribution_inf{ T(std::numeric_limits<float>::infinity()), T(std::numeric_limits<float>::infinity()) };

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1431

library->fill_borders_with_garbage(tensor, distribution_inf, i);

1432

}

1433

Georgios Pinitas

2019-05-21 13:32:43 +0100

[diff] [blame]

1434

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1435

DataType data_type, float alpha, float beta, bool broadcast_bias, const ActivationLayerInfo &act_info)

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1436

{

1437

// Create tensors

Georgios Pinitas

2019-05-21 13:32:43 +0100

[diff] [blame]

1438

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

1439

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

1440

TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1441

TensorType rhs_reshaped;

1442

TensorType dst;

1443

1444

const unsigned int M = lhs_shape[1];

1445

const unsigned int N = rhs_shape[0];

1446

const unsigned int K = lhs_shape[0];

Gian Marco Iodice

2019-06-26 17:18:11 +0100

[diff] [blame]

1447

GEMMKernelInfo kernel_info;

kernel_info.m = M;

kernel_info.n = N;

kernel_info.k = K;

kernel_info.depth_output_gemm3d = 0;

1452

kernel_info.reinterpret_input_as_3d = false;

1453

kernel_info.broadcast_bias = broadcast_bias;

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1454

kernel_info.activation_info = act_info;

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1455

1456

// The output tensor will be auto-initialized within the function

1457

1458

// Create and configure function

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1459

ReshapeRHSOperatorType reshape_rhs;

1460

GEMMOperatorType gemm;

Sheri Zhang

2020-11-16 21:17:28 +0000

[diff] [blame]

1461

1462

validate_result = bool(reshape_rhs.validate(rhs.info(), rhs_reshaped.info(), rhs_info));

1463

validate_result = validate_result || !rhs_info.export_to_cl_image;

if(!validate_result)

{

return nullptr;

}

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1469

reshape_rhs.configure(rhs.info(), rhs_reshaped.info(), rhs_info);

1470

gemm.configure(lhs.info(), rhs_reshaped.info(), bias.info(), dst.info(), alpha, beta, lhs_info, rhs_info, kernel_info);

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1471

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

1472

ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());

1473

ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());

1474

ARM_COMPUTE_ASSERT(bias.info()->is_resizable());

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1475

Georgios Pinitas

2021-04-13 13:35:58 +0100

[diff] [blame]

1476

// We do not pad when using image as it needs to comply to strict pitch alignment restrictions

Giorgio Arena

2021-03-25 14:54:50 +0000

[diff] [blame]

1477

if(!rhs_info.export_to_cl_image)

1478

{

1479

add_padding_x({ &lhs, &rhs, &rhs_reshaped, &bias, &dst });

1480

}

1481

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1482

// Allocate tensors

1483

lhs.allocator()->allocate();

1484

rhs.allocator()->allocate();

1485

rhs_reshaped.allocator()->allocate();

Georgios Pinitas

2019-05-21 13:32:43 +0100

[diff] [blame]

1486

bias.allocator()->allocate();

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1487

dst.allocator()->allocate();

1488

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

1489

ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());

1490

ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());

1491

ARM_COMPUTE_ASSERT(!rhs_reshaped.info()->is_resizable());

1492

ARM_COMPUTE_ASSERT(!bias.info()->is_resizable());

1493

ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1494

1495

// Fill tensors

1496

fill(AccessorType(lhs), 0);

1497

fill(AccessorType(rhs), 1);

Georgios Pinitas

2019-05-21 13:32:43 +0100

[diff] [blame]

1498

fill(AccessorType(bias), 2);

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1499

1500

// Compute GEMM

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1501

ITensorPack reshape_rhs_pack = { { ACL_SRC, &rhs }, { ACL_DST, &rhs_reshaped } };

1502

reshape_rhs.run(reshape_rhs_pack);

1503

ITensorPack gemm_pack({ { ACL_SRC_0, &lhs },

1504

{ ACL_SRC_1, &rhs_reshaped },

1505

{ ACL_SRC_2, &bias },

1506

{ ACL_DST, &dst }

1507

});

1508

gemm.run(gemm_pack);

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

return dst;

}

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

1513

SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, bool broadcast_bias,

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1514

const ActivationLayerInfo &act_info)

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1515

{

1516

TensorShape dst_shape = lhs_shape;

1517

dst_shape[0] = rhs_shape[0];

1518

dst_shape[1] = lhs_shape[1];

1519

1520

// Create reference

1521

SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };

1522

SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };

Georgios Pinitas

2019-05-21 13:32:43 +0100

[diff] [blame]

1523

SimpleTensor<T> bias{ dst_shape, data_type, 1 };

1524

1525

const int n = rhs_shape[0];

1526

const int m = lhs_shape[1];

1527

const int batch_size = lhs_shape[2];

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

// Fill reference

fill(lhs, 0);

fill(rhs, 1);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1532

fill(bias, 2);

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1533

Georgios Pinitas

2019-05-21 13:32:43 +0100

[diff] [blame]

1534

if(broadcast_bias)

1535

{

Gunes Bayir

2021-12-10 16:17:56 +0000

[diff] [blame]

1536

// In case of broadcast, we need to simply copy the first into the following "M" ones

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1537

for(int i = 1; i < m * batch_size; i++)

Georgios Pinitas

2019-05-21 13:32:43 +0100

[diff] [blame]

1538

{

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1539

memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));

Georgios Pinitas

2019-05-21 13:32:43 +0100

[diff] [blame]

1540

}

1541

}

Georgios Pinitas

2019-05-21 13:32:43 +0100

[diff] [blame]

1542

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1543

return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1544

}

1545

Sheri Zhang

2020-11-16 21:17:28 +0000

[diff] [blame]

1546

bool validate_result = true;

Gian Marco Iodice

2019-02-15 11:10:31 +0000

[diff] [blame]

1547

TensorType _target{};

1548

SimpleTensor<T> _reference{};

1549

};

1550

SiCongLi

2021-10-24 19:12:33 +0100

[diff] [blame]

1551

/** (EXPERIMENTAL_POST_OPS)*/

1552

template <typename TensorType, typename AccessorType, typename T, typename ReshapeRHSOperatorType, typename GEMMOperatorType>

1553

class GEMMMatrixMultiplyReshapedOnlyRHSWithPostOpsValidationFixture : public framework::Fixture

1554

{

1555

public:

1556

using PostOpArgBroadcast = std::tuple<bool, bool, bool>; // Instruct fixture if we need broadcasting in dimension 0, 1, 2 of each PostOp argument

1557

template <typename...>

1558

void setup(unsigned int m, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0, unsigned int h0,

1559

bool interleave_rhs, bool transpose_rhs, bool export_to_cl_image, DataType data_type, float alpha, float beta, bool broadcast_bias, const ActivationLayerInfo &act_info,

1560

const experimental::PostOpList<PostOpArgBroadcast> &post_ops)

1561

{

1562

GEMMLHSMatrixInfo lhs_info;

lhs_info.m0 = m0;

lhs_info.k0 = k0;

GEMMRHSMatrixInfo rhs_info;

rhs_info.n0 = n0;

rhs_info.k0 = k0;

rhs_info.h0 = h0;

rhs_info.interleave = interleave_rhs;

1571

rhs_info.transpose = transpose_rhs;

1572

rhs_info.export_to_cl_image = export_to_cl_image;

1573

1574

// Set the tensor shapes for LHS and RHS matrices

1575

const TensorShape lhs_shape(k, m, batch_size);

1576

const TensorShape rhs_shape(n, k, batch_size);

1577

const TensorShape bias_shape(n,

1578

broadcast_bias ? 1 : m,

1579

broadcast_bias ? 1 : batch_size);

1580

auto post_ops_with_shapes = experimental::transform_post_op_list_arguments<PostOpArgBroadcast, TensorShape>(post_ops,

1581

[ = ](auto broadcast)

{

return TensorShape

{

std::get<0>(broadcast) ? 1 : n,

1586

std::get<1>(broadcast) ? 1 : m,

1587

std::get<2>(broadcast) ? 1 : batch_size,

};

});

_target = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, broadcast_bias, act_info, post_ops_with_shapes);

1592

if(validate_result)

1593

{

1594

_reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, broadcast_bias, act_info, post_ops_with_shapes);

}

}

protected:

template <typename U>

1600

void fill(U &&tensor, int i)

1601

{

1602

static_assert(std::is_floating_point<T>::value || std::is_same<T, half>::value, "Only floating point data types supported.");

1603

using DistributionType = typename std::conditional<std::is_same<T, half>::value, arm_compute::utils::uniform_real_distribution_16bit<T>, std::uniform_real_distribution<T>>::type;

1604

1605

DistributionType distribution{ T(-1.0f), T(1.0f) };

1606

library->fill(tensor, distribution, i);

1607

1608

// Fill border with infinity in order to check the presence of NaN values (i.e. inf * 0)

1609

DistributionType distribution_inf{ T(std::numeric_limits<float>::infinity()), T(std::numeric_limits<float>::infinity()) };

1610

library->fill_borders_with_garbage(tensor, distribution_inf, i);

1611

}

1612

1613

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,

1614

DataType data_type, float alpha, float beta, bool broadcast_bias, const ActivationLayerInfo &act_info, const experimental::PostOpList<TensorShape> &post_ops)

1615

{

1616

// Create tensors

1617

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

1618

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

1619

TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);

1620

TensorType rhs_reshaped;

1621

TensorType dst;

1622

// Create post op tensors and populate post op with them

1623

std::vector<TensorType> post_op_tensors_holder{};

1624

auto populated_post_ops = experimental::transform_post_op_list_arguments<TensorShape, ITensorInfo *>(post_ops,

1625

[&post_op_tensors_holder, &data_type](auto shape)

1626

{

1627

auto t = create_tensor<TensorType>(shape, data_type, 1);

1628

post_op_tensors_holder.push_back(std::move(t));

1629

return post_op_tensors_holder.back().info();

1630

});

1631

1632

const unsigned int M = lhs_shape[1];

1633

const unsigned int N = rhs_shape[0];

1634

const unsigned int K = lhs_shape[0];

1635

GEMMKernelInfo kernel_info;

kernel_info.m = M;

kernel_info.n = N;

kernel_info.k = K;

kernel_info.depth_output_gemm3d = 0;

1640

kernel_info.reinterpret_input_as_3d = false;

1641

kernel_info.broadcast_bias = broadcast_bias;

1642

kernel_info.activation_info = act_info;

1643

kernel_info.post_ops = populated_post_ops;

1644

1645

// The output tensor will be auto-initialized within the function

1646

1647

// Create and configure function

1648

ReshapeRHSOperatorType reshape_rhs;

1649

GEMMOperatorType gemm;

1650

1651

validate_result = bool(reshape_rhs.validate(rhs.info(), rhs_reshaped.info(), rhs_info));

1652

validate_result = validate_result || !rhs_info.export_to_cl_image;

if(!validate_result)

{

return nullptr;

}

reshape_rhs.configure(rhs.info(), rhs_reshaped.info(), rhs_info);

1659

gemm.configure(lhs.info(), rhs_reshaped.info(), bias.info(), dst.info(), alpha, beta, lhs_info, rhs_info, kernel_info);

1660

1661

ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());

1662

ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());

1663

ARM_COMPUTE_ASSERT(bias.info()->is_resizable());

1664

for(const auto &tensor : post_op_tensors_holder)

1665

{

1666

ARM_COMPUTE_ASSERT(tensor.info()->is_resizable());

1667

}

1668

1669

// We do not pad when using image as it needs to comply to strict pitch alignment restrictions

1670

if(!rhs_info.export_to_cl_image)

1671

{

1672

add_padding_x({ &lhs, &rhs, &rhs_reshaped, &bias, &dst });

1673

for(auto &tensor : post_op_tensors_holder)

1674

{

1675

add_padding_x({ &tensor });

}

}

// Allocate tensors

lhs.allocator()->allocate();

1681

rhs.allocator()->allocate();

1682

rhs_reshaped.allocator()->allocate();

1683

bias.allocator()->allocate();

1684

dst.allocator()->allocate();

1685

for(auto &tensor : post_op_tensors_holder)

1686

{

1687

tensor.allocator()->allocate();

1688

}

1689

1690

ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());

1691

ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());

1692

ARM_COMPUTE_ASSERT(!rhs_reshaped.info()->is_resizable());

1693

ARM_COMPUTE_ASSERT(!bias.info()->is_resizable());

1694

ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());

1695

for(const auto &tensor : post_op_tensors_holder)

1696

{

1697

ARM_COMPUTE_ASSERT(!tensor.info()->is_resizable());

}

// Fill tensors

fill(AccessorType(lhs), 0);

1702

fill(AccessorType(rhs), 1);

1703

fill(AccessorType(bias), 2);

1704

for(size_t i = 0; i < post_op_tensors_holder.size(); ++i)

1705

{

1706

fill(AccessorType(post_op_tensors_holder.at(i)), 3 + i);

}

// Compute GEMM

ITensorPack reshape_rhs_pack = { { ACL_SRC, &rhs }, { ACL_DST, &rhs_reshaped } };

1711

reshape_rhs.run(reshape_rhs_pack);

1712

ITensorPack gemm_pack({ { ACL_SRC_0, &lhs },

1713

{ ACL_SRC_1, &rhs_reshaped },

1714

{ ACL_SRC_2, &bias },

1715

{ ACL_DST, &dst }

1716

});

1717

for(size_t i = 0; i < post_op_tensors_holder.size(); ++i)

1718

{

1719

gemm_pack.add_tensor(experimental::get_post_op_arg_type(i), &post_op_tensors_holder.at(i));

}

gemm.run(gemm_pack);

return dst;

}

SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, bool broadcast_bias,

1727

const ActivationLayerInfo &act_info, const experimental::PostOpList<TensorShape> &post_ops)

1728

{

1729

TensorShape dst_shape = lhs_shape;

1730

dst_shape[0] = rhs_shape[0];

1731

dst_shape[1] = lhs_shape[1];

1732

1733

// Create reference

1734

SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };

1735

SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };

1736

SimpleTensor<T> bias{ dst_shape, data_type, 1 };

1737

// Create post op tensors and populate post op with them

1738

auto populated_post_ops = experimental::transform_post_op_list_arguments<TensorShape, SimpleTensor<T>>(post_ops, [&data_type](auto shape)

1739

{

1740

return SimpleTensor<T> { shape, data_type, 1 };

1741

});

1742

1743

const int n = rhs_shape[0];

1744

const int m = lhs_shape[1];

1745

const int batch_size = lhs_shape[2];

// Fill reference

int tensor_idx = 0;

fill(lhs, tensor_idx++);

1750

fill(rhs, tensor_idx++);

1751

fill(bias, tensor_idx++);

1752

for(auto &op : populated_post_ops.get_list())

1753

{

1754

for(auto tensor : op->arguments())

1755

{

1756

fill(*tensor, tensor_idx++);

}

}

if(broadcast_bias)

{

Gunes Bayir

2021-12-10 16:17:56 +0000

[diff] [blame]

1762

// In case of broadcast, we need to simply copy the first into the following "M" ones

SiCongLi

2021-10-24 19:12:33 +0100

[diff] [blame]

1763

for(int i = 1; i < m * batch_size; i++)

1764

{

1765

memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));

}

}

SimpleTensor<T> out;

out = reference::gemm<T>(lhs, rhs, bias, alpha, beta);

1771

// Ignore activation info if post ops are used instead

1772

if(populated_post_ops.size() > 0)

1773

{

1774

out = reference::post_ops<T>(out, populated_post_ops);

}

else

{

out = reference::activation_layer(out, act_info);

}

return out;

}

bool validate_result = true;

1784

TensorType _target{};

1785

SimpleTensor<T> _reference{};

1786

};

1787

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1788

template <typename TensorType, typename AccessorType, typename T, typename ReshapeRHSOperatorType, typename GEMMOperatorType>

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1789

class GEMMMatrixMultiplyReshapedOnlyRHS3DValidationFixture : public framework::Fixture

1790

{

1791

public:

1792

template <typename...>

1793

void setup(unsigned int m_w, unsigned int m_h, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0, unsigned int h0,

Gian Marco Iodice

2020-10-22 16:37:12 +0100

[diff] [blame]

1794

bool interleave_rhs, bool transpose_rhs, bool export_to_cl_image, bool has_pad_y, DataType data_type, float alpha, float beta, const ActivationLayerInfo &act_info)

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1795

{

1796

GEMMLHSMatrixInfo lhs_info;

lhs_info.m0 = m0;

lhs_info.k0 = k0;

GEMMRHSMatrixInfo rhs_info;

Gian Marco Iodice

781cba7

2020-06-19 16:56:57 +0100

[diff] [blame]

rhs_info.n0 = n0;

rhs_info.k0 = k0;

rhs_info.h0 = h0;

rhs_info.interleave = interleave_rhs;

1805

rhs_info.transpose = transpose_rhs;

1806

rhs_info.export_to_cl_image = export_to_cl_image;

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1807

1808

// In case of GEMM3D, m is the product between m_w and m_h

1809

const unsigned int m = m_w * m_h;

1810

1811

// Set the tensor shapes for LHS and RHS matrices

1812

const TensorShape lhs_shape(k, m, batch_size);

1813

const TensorShape rhs_shape(n, k, batch_size);

1814

const TensorShape bias_shape(n, 1, 1);

1815

Sheri Zhang

2020-11-16 21:17:28 +0000

[diff] [blame]

1816

_target = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, m_h, act_info, has_pad_y);

1817

if(validate_result)

1818

{

1819

_reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, m_h, act_info);

1820

}

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

}

protected:

template <typename U>

1825

void fill(U &&tensor, int i)

1826

{

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

1827

static_assert(std::is_floating_point<T>::value || std::is_same<T, half>::value, "Only floating point data types supported.");

Giorgio Arena

2021-01-08 10:37:15 +0000

[diff] [blame]

1828

using DistributionType = typename std::conditional<std::is_same<T, half>::value, arm_compute::utils::uniform_real_distribution_16bit<T>, std::uniform_real_distribution<T>>::type;

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

1829

1830

DistributionType distribution{ T(-1.0f), T(1.0f) };

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1831

library->fill(tensor, distribution, i);

1832

}

1833

1834

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,

1835

DataType data_type, float alpha, float beta,

Gian Marco Iodice

2020-10-22 16:37:12 +0100

[diff] [blame]

1836

unsigned int m_h, const ActivationLayerInfo &act_info, bool has_pad_y)

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1837

{

1838

// Create tensors

1839

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

1840

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

1841

TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);

1842

TensorType rhs_reshaped;

1843

TensorType dst;

1844

1845

const unsigned int M = lhs_shape[1];

1846

const unsigned int N = rhs_shape[0];

1847

const unsigned int K = lhs_shape[0];

Gian Marco Iodice

2019-06-26 17:18:11 +0100

[diff] [blame]

1848

GEMMKernelInfo kernel_info;

kernel_info.m = M;

kernel_info.n = N;

kernel_info.k = K;

kernel_info.depth_output_gemm3d = m_h;

1853

kernel_info.reinterpret_input_as_3d = false;

1854

kernel_info.broadcast_bias = true;

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1855

kernel_info.activation_info = act_info;

Gian Marco Iodice

2020-10-22 16:37:12 +0100

[diff] [blame]

1856

kernel_info.has_pad_y = has_pad_y;

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1857

1858

// The output tensor will be auto-initialized within the function

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1859

// Create and configure function

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1860

ReshapeRHSOperatorType reshape_rhs;

1861

GEMMOperatorType gemm;

Sheri Zhang

2020-11-16 21:17:28 +0000

[diff] [blame]

1862

1863

validate_result = bool(reshape_rhs.validate(rhs.info(), rhs_reshaped.info(), rhs_info));

1864

validate_result = validate_result || !rhs_info.export_to_cl_image;

if(!validate_result)

{

return nullptr;

}

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1870

reshape_rhs.configure(rhs.info(), rhs_reshaped.info(), rhs_info);

1871

gemm.configure(lhs.info(), rhs_reshaped.info(), bias.info(), dst.info(), alpha, beta, lhs_info, rhs_info, kernel_info);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1872

Gian Marco Iodice

2020-10-22 16:37:12 +0100

[diff] [blame]

1873

if(has_pad_y)

1874

{

1875

// Add dummy padding into lhs to validate has_pad_y path

1876

lhs.info()->extend_padding(PaddingSize(2, 0, 2, 0));

1877

dst.info()->extend_padding(PaddingSize(2, 0, 1, 0));

1878

}

1879

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

1880

ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());

1881

ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());

1882

ARM_COMPUTE_ASSERT(bias.info()->is_resizable());

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1883

Georgios Pinitas

2021-04-13 13:35:58 +0100

[diff] [blame]

1884

// We do not pad when using image as it needs to comply to strict pitch alignment restrictions

Giorgio Arena

2021-03-25 14:54:50 +0000

[diff] [blame]

1885

if(!rhs_info.export_to_cl_image)

1886

{

1887

add_padding_x({ &lhs, &rhs, &rhs_reshaped, &bias, &dst });

1888

}

1889

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1890

// Allocate tensors

1891

lhs.allocator()->allocate();

1892

rhs.allocator()->allocate();

1893

rhs_reshaped.allocator()->allocate();

1894

bias.allocator()->allocate();

1895

dst.allocator()->allocate();

1896

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

1897

ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());

1898

ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());

1899

ARM_COMPUTE_ASSERT(!rhs_reshaped.info()->is_resizable());

1900

ARM_COMPUTE_ASSERT(!bias.info()->is_resizable());

1901

ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1902

1903

// Fill tensors

1904

fill(AccessorType(lhs), 0);

1905

fill(AccessorType(rhs), 1);

1906

fill(AccessorType(bias), 2);

1907

1908

// Compute GEMM

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1909

ITensorPack reshape_rhs_pack = { { ACL_SRC, &rhs }, { ACL_DST, &rhs_reshaped } };

1910

reshape_rhs.run(reshape_rhs_pack);

1911

ITensorPack gemm_pack({ { ACL_SRC_0, &lhs },

1912

{ ACL_SRC_1, &rhs_reshaped },

1913

{ ACL_SRC_2, &bias },

1914

{ ACL_DST, &dst }

1915

});

1916

gemm.run(gemm_pack);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

return dst;

}

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

1921

SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, unsigned int m_h,

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1922

const ActivationLayerInfo &act_info)

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1923

{

1924

TensorShape dst_shape = lhs_shape;

1925

dst_shape.set(0, rhs_shape[0]);

1926

dst_shape.set(1, lhs_shape[1] / m_h);

1927

dst_shape.set(2, m_h);

1928

dst_shape.set(3, lhs_shape[2]);

1929

1930

// Create reference

1931

SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };

1932

SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };

1933

SimpleTensor<T> bias{ dst_shape, data_type, 1 };

1934

1935

const int n = rhs_shape[0];

1936

const int m = lhs_shape[1];

1937

const int batch_size = lhs_shape[2];

// Fill reference

fill(lhs, 0);

fill(rhs, 1);

fill(bias, 2);

Gunes Bayir

2021-12-10 16:17:56 +0000

[diff] [blame]

1944

// In case of broadcast, we need to simply copy the first into the following "M" ones

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1945

for(int i = 1; i < m * batch_size; i++)

1946

{

1947

memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));

1948

}

1949

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1950

return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1951

}

1952

Sheri Zhang

2020-11-16 21:17:28 +0000

[diff] [blame]

1953

bool validate_result = true;

Gian Marco Iodice

2019-06-14 16:11:10 +0100

[diff] [blame]

1954

TensorType _target{};

1955

SimpleTensor<T> _reference{};

1956

};

1957

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

1958

template <typename TensorType, typename AccessorType, typename T, typename GEMMOperatorType>

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1959

class GEMMMatrixMultiplyNativeValidationFixture : public framework::Fixture

1960

{

1961

public:

1962

template <typename...>

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1963

void setup(unsigned int m, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0, DataType data_type, float alpha, float beta, bool broadcast_bias,

1964

const ActivationLayerInfo &act_info)

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1965

{

1966

GEMMLHSMatrixInfo lhs_info;

lhs_info.m0 = m0;

lhs_info.k0 = k0;

GEMMRHSMatrixInfo rhs_info;

rhs_info.n0 = n0;

rhs_info.k0 = k0;

// Set the tensor shapes for LHS and RHS matrices

1975

const TensorShape lhs_shape(k, m, batch_size);

1976

const TensorShape rhs_shape(n, k, batch_size);

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

1977

const TensorShape bias_shape(n,

1978

broadcast_bias ? 1 : m,

1979

broadcast_bias ? 1 : batch_size);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1980

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

1981

_target = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, broadcast_bias, act_info);

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

1982

_reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, broadcast_bias, act_info);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

}

protected:

template <typename U>

1987

void fill(U &&tensor, int i)

1988

{

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

1989

static_assert(std::is_floating_point<T>::value || std::is_same<T, half>::value, "Only floating point data types supported.");

Giorgio Arena

2021-01-08 10:37:15 +0000

[diff] [blame]

1990

using DistributionType = typename std::conditional<std::is_same<T, half>::value, arm_compute::utils::uniform_real_distribution_16bit<T>, std::uniform_real_distribution<T>>::type;

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

1991

1992

DistributionType distribution{ T(-1.0f), T(1.0f) };

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1993

library->fill(tensor, distribution, i);

1994

1995

// Fill border with infinity in order to check the presence of NaN values (i.e. inf * 0)

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

1996

DistributionType distribution_inf{ T(std::numeric_limits<float>::infinity()), T(std::numeric_limits<float>::infinity()) };

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

1997

library->fill_borders_with_garbage(tensor, distribution_inf, i);

1998

}

1999

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

2000

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

2001

DataType data_type, float alpha, float beta, bool broadcast_bias, const ActivationLayerInfo &act_info)

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

2002

{

2003

// Create tensors

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

2004

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

2005

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

2006

TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

2007

TensorType dst;

2008

2009

const unsigned int M = lhs_shape[1];

2010

const unsigned int N = rhs_shape[0];

2011

const unsigned int K = lhs_shape[0];

Gian Marco Iodice

2019-06-26 17:18:11 +0100

[diff] [blame]

2012

GEMMKernelInfo kernel_info;

kernel_info.m = M;

kernel_info.n = N;

kernel_info.k = K;

kernel_info.depth_output_gemm3d = 0;

2017

kernel_info.reinterpret_input_as_3d = false;

2018

kernel_info.broadcast_bias = broadcast_bias;

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

2019

kernel_info.activation_info = act_info;

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

2020

2021

// Create and configure function

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

2022

GEMMOperatorType gemm;

2023

gemm.configure(lhs.info(), rhs.info(), bias.info(), dst.info(), alpha, beta, lhs_info, rhs_info, kernel_info);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

2024

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

2025

ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());

2026

ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());

2027

ARM_COMPUTE_ASSERT(bias.info()->is_resizable());

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

2028

Giorgio Arena

2021-03-25 14:54:50 +0000

[diff] [blame]

2029

add_padding_x({ &lhs, &rhs, &bias, &dst });

2030

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

2031

// Allocate tensors

2032

lhs.allocator()->allocate();

2033

rhs.allocator()->allocate();

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

2034

bias.allocator()->allocate();

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

2035

dst.allocator()->allocate();

2036

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

2037

ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());

2038

ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());

2039

ARM_COMPUTE_ASSERT(!bias.info()->is_resizable());

2040

ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

2041

2042

// Fill tensors

2043

fill(AccessorType(lhs), 0);

2044

fill(AccessorType(rhs), 1);

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

2045

fill(AccessorType(bias), 2);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

2046

2047

// Compute GEMM

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

2048

ITensorPack gemm_pack({ { ACL_SRC_0, &lhs },

2049

{ ACL_SRC_1, &rhs },

2050

{ ACL_SRC_2, &bias },

2051

{ ACL_DST, &dst }

2052

});

2053

gemm.run(gemm_pack);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

return dst;

}

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

2058

SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, bool broadcast_bias,

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

2059

const ActivationLayerInfo &act_info)

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

2060

{

2061

TensorShape dst_shape = lhs_shape;

2062

dst_shape[0] = rhs_shape[0];

2063

dst_shape[1] = lhs_shape[1];

2064

2065

// Create reference

2066

SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };

2067

SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

2068

SimpleTensor<T> bias{ dst_shape, data_type, 1 };

2069

2070

const int n = rhs_shape[0];

2071

const int m = lhs_shape[1];

2072

const int batch_size = lhs_shape[2];

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

// Fill reference

fill(lhs, 0);

fill(rhs, 1);

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

2077

fill(bias, 2);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

2078

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

2079

if(broadcast_bias)

2080

{

Gunes Bayir

2021-12-10 16:17:56 +0000

[diff] [blame]

2081

// In case of broadcast, we need to simply copy the first into the following "M" ones

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

2082

for(int i = 1; i < m * batch_size; i++)

2083

{

2084

memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));

}

}

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

2088

return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

2089

}

2090

2091

TensorType _target{};

2092

SimpleTensor<T> _reference{};

2093

};

2094

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

2095

template <typename TensorType, typename AccessorType, typename T, typename GEMMOperatorType>

SiCongLi

2021-10-24 19:12:33 +0100

[diff] [blame]

2096

class GEMMMatrixMultiplyNativeWithPostOpsValidationFixture : public framework::Fixture

2097

{

2098

public:

2099

using PostOpArgBroadcast = std::tuple<bool, bool, bool>; // Instruct fixture if we need broadcasting in dimension 0, 1, 2 of each PostOp argument

2100

public:

2101

template <typename...>

2102

void setup(unsigned int m, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0, DataType data_type, float alpha, float beta, bool broadcast_bias,

2103

const ActivationLayerInfo &act_info, const experimental::PostOpList<PostOpArgBroadcast> &post_ops)

2104

{

2105

GEMMLHSMatrixInfo lhs_info;

lhs_info.m0 = m0;

lhs_info.k0 = k0;

GEMMRHSMatrixInfo rhs_info;

rhs_info.n0 = n0;

rhs_info.k0 = k0;

// Set the tensor shapes for LHS and RHS matrices

2114

const TensorShape lhs_shape(k, m, batch_size);

2115

const TensorShape rhs_shape(n, k, batch_size);

2116

const TensorShape bias_shape(n,

2117

broadcast_bias ? 1 : m,

2118

broadcast_bias ? 1 : batch_size);

2119

const auto post_ops_with_shapes = experimental::transform_post_op_list_arguments<PostOpArgBroadcast, TensorShape>(post_ops,

2120

[ = ](auto broadcast)

{

return TensorShape

{

std::get<0>(broadcast) ? 1 : n,

2125

std::get<1>(broadcast) ? 1 : m,

2126

std::get<2>(broadcast) ? 1 : batch_size,

};

});

_target = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, broadcast_bias, act_info, post_ops_with_shapes);

2131

_reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, broadcast_bias, act_info, post_ops_with_shapes);

}

protected:

template <typename U>

2136

void fill(U &&tensor, int i)

2137

{

2138

static_assert(std::is_floating_point<T>::value || std::is_same<T, half>::value, "Only floating point data types supported.");

2139

using DistributionType = typename std::conditional<std::is_same<T, half>::value, arm_compute::utils::uniform_real_distribution_16bit<T>, std::uniform_real_distribution<T>>::type;

2140

2141

DistributionType distribution{ T(-1.0f), T(1.0f) };

2142

library->fill(tensor, distribution, i);

2143

2144

// Fill border with infinity in order to check the presence of NaN values (i.e. inf * 0)

2145

DistributionType distribution_inf{ T(std::numeric_limits<float>::infinity()), T(std::numeric_limits<float>::infinity()) };

2146

library->fill_borders_with_garbage(tensor, distribution_inf, i);

2147

}

2148

2149

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,

2150

DataType data_type, float alpha, float beta, bool broadcast_bias, const ActivationLayerInfo &act_info, const experimental::PostOpList<TensorShape> &post_ops)

2151

{

2152

// Create tensors

2153

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

2154

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

2155

TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);

2156

TensorType dst;

2157

// Create post op tensors and populate post op with them

2158

std::vector<TensorType> post_op_tensors_holder{};

2159

auto populated_post_ops = experimental::transform_post_op_list_arguments<TensorShape, ITensorInfo *>(post_ops,

2160

[&post_op_tensors_holder, &data_type](auto shape)

2161

{

2162

auto t = create_tensor<TensorType>(shape, data_type, 1);

2163

post_op_tensors_holder.push_back(std::move(t));

2164

return post_op_tensors_holder.back().info();

2165

});

2166

2167

const unsigned int M = lhs_shape[1];

2168

const unsigned int N = rhs_shape[0];

2169

const unsigned int K = lhs_shape[0];

2170

GEMMKernelInfo kernel_info;

kernel_info.m = M;

kernel_info.n = N;

kernel_info.k = K;

kernel_info.depth_output_gemm3d = 0;

2175

kernel_info.reinterpret_input_as_3d = false;

2176

kernel_info.broadcast_bias = broadcast_bias;

2177

kernel_info.activation_info = act_info;

2178

kernel_info.post_ops = populated_post_ops;

2179

2180

// Create and configure function

2181

GEMMOperatorType gemm;

2182

gemm.configure(lhs.info(), rhs.info(), bias.info(), dst.info(), alpha, beta, lhs_info, rhs_info, kernel_info);

2183

2184

ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());

2185

ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());

2186

ARM_COMPUTE_ASSERT(bias.info()->is_resizable());

2187

for(const auto &tensor : post_op_tensors_holder)

2188

{

2189

ARM_COMPUTE_ASSERT(tensor.info()->is_resizable());

2190

}

2191

2192

add_padding_x({ &lhs, &rhs, &bias, &dst });

2193

for(auto &tensor : post_op_tensors_holder)

2194

{

2195

add_padding_x({ &tensor });

}

// Allocate tensors

lhs.allocator()->allocate();

2200

rhs.allocator()->allocate();

2201

bias.allocator()->allocate();

2202

dst.allocator()->allocate();

2203

for(auto &tensor : post_op_tensors_holder)

2204

{

2205

tensor.allocator()->allocate();

2206

}

2207

2208

ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());

2209

ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());

2210

ARM_COMPUTE_ASSERT(!bias.info()->is_resizable());

2211

ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());

2212

for(const auto &tensor : post_op_tensors_holder)

2213

{

2214

ARM_COMPUTE_ASSERT(!tensor.info()->is_resizable());

}

// Fill tensors

fill(AccessorType(lhs), 0);

2219

fill(AccessorType(rhs), 1);

2220

fill(AccessorType(bias), 2);

2221

for(size_t i = 0; i < post_op_tensors_holder.size(); ++i)

2222

{

2223

fill(AccessorType(post_op_tensors_holder.at(i)), 3 + i);

}

// Compute GEMM

ITensorPack gemm_pack({ { ACL_SRC_0, &lhs },

2228

{ ACL_SRC_1, &rhs },

2229

{ ACL_SRC_2, &bias },

2230

{ ACL_DST, &dst }

2231

});

2232

for(size_t i = 0; i < post_op_tensors_holder.size(); ++i)

2233

{

2234

gemm_pack.add_tensor(experimental::get_post_op_arg_type(i), &post_op_tensors_holder.at(i));

}

gemm.run(gemm_pack);

return dst;

}

SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, bool broadcast_bias,

2242

const ActivationLayerInfo &act_info, const experimental::PostOpList<TensorShape> &post_ops)

2243

{

2244

TensorShape dst_shape = lhs_shape;

2245

dst_shape[0] = rhs_shape[0];

2246

dst_shape[1] = lhs_shape[1];

2247

2248

// Create reference

2249

SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };

2250

SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };

2251

SimpleTensor<T> bias{ dst_shape, data_type, 1 };

2252

// Create post op tensors and populate post op with them

2253

auto populated_post_ops = experimental::transform_post_op_list_arguments<TensorShape, SimpleTensor<T>>(post_ops, [&data_type](auto shape)

2254

{

2255

return SimpleTensor<T> { shape, data_type, 1 };

2256

});

2257

2258

const int n = rhs_shape[0];

2259

const int m = lhs_shape[1];

2260

const int batch_size = lhs_shape[2];

// Fill reference

int tensor_idx = 0;

fill(lhs, tensor_idx++);

2265

fill(rhs, tensor_idx++);

2266

fill(bias, tensor_idx++);

2267

for(auto &op : populated_post_ops.get_list())

2268

{

2269

for(auto tensor : op->arguments())

2270

{

2271

fill(*tensor, tensor_idx++);

}

}

if(broadcast_bias)

{

Gunes Bayir

2021-12-10 16:17:56 +0000

[diff] [blame]

2277

// In case of broadcast, we need to simply copy the first into the following "M" ones

SiCongLi

2021-10-24 19:12:33 +0100

[diff] [blame]

2278

for(int i = 1; i < m * batch_size; i++)

2279

{

2280

memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));

}

}

SimpleTensor<T> out;

out = reference::gemm<T>(lhs, rhs, bias, alpha, beta);

2286

// Ignore activation info if post ops are used instead

2287

if(populated_post_ops.size() > 0)

2288

{

2289

out = reference::post_ops<T>(out, populated_post_ops);

}

else

{

out = reference::activation_layer(out, act_info);

}

return out;

}

TensorType _target{};

2299

SimpleTensor<T> _reference{};

2300

};

2301

2302

template <typename TensorType, typename AccessorType, typename T, typename GEMMOperatorType>

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

2303

class GEMMMatrixMultiplyNative3DValidationFixture : public framework::Fixture

2304

{

2305

public:

2306

template <typename...>

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

2307

void setup(unsigned int m_w, unsigned int m_h, unsigned int n, unsigned int k, unsigned int batch_size, unsigned int m0, unsigned int n0, unsigned int k0, DataType data_type, float alpha, float beta,

2308

const ActivationLayerInfo &act_info)

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

2309

{

2310

GEMMLHSMatrixInfo lhs_info;

lhs_info.m0 = m0;

lhs_info.k0 = k0;

GEMMRHSMatrixInfo rhs_info;

rhs_info.n0 = n0;

rhs_info.k0 = k0;

// In case of GEMM3D, m is the product between m_w and m_h

2319

const unsigned int m = m_w * m_h;

2320

2321

// Set the tensor shapes for LHS and RHS matrices

2322

const TensorShape lhs_shape(k, m, batch_size);

2323

const TensorShape rhs_shape(n, k, batch_size);

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

2324

const TensorShape bias_shape(n, 1, 1);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

2325

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

2326

_target = compute_target(lhs_shape, rhs_shape, bias_shape, lhs_info, rhs_info, data_type, alpha, beta, m_h, act_info);

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

2327

_reference = compute_reference(lhs_shape, rhs_shape, data_type, alpha, beta, m_h, act_info);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

}

protected:

template <typename U>

2332

void fill(U &&tensor, int i)

2333

{

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

2334

static_assert(std::is_floating_point<T>::value || std::is_same<T, half>::value, "Only floating point data types supported.");

Giorgio Arena

2021-01-08 10:37:15 +0000

[diff] [blame]

2335

using DistributionType = typename std::conditional<std::is_same<T, half>::value, arm_compute::utils::uniform_real_distribution_16bit<T>, std::uniform_real_distribution<T>>::type;

Giorgio Arena

2020-12-17 16:47:07 +0000

[diff] [blame]

2336

2337

DistributionType distribution{ T(-1.0f), T(1.0f) };

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

2338

library->fill(tensor, distribution, i);

2339

}

2340

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

2341

TensorType compute_target(const TensorShape &lhs_shape, const TensorShape &rhs_shape, const TensorShape &bias_shape, const GEMMLHSMatrixInfo &lhs_info, const GEMMRHSMatrixInfo &rhs_info,

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

2342

DataType data_type, float alpha, float beta, unsigned int m_h, const ActivationLayerInfo &act_info)

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

2343

{

2344

// Create tensors

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

2345

TensorType lhs = create_tensor<TensorType>(lhs_shape, data_type, 1);

2346

TensorType rhs = create_tensor<TensorType>(rhs_shape, data_type, 1);

2347

TensorType bias = create_tensor<TensorType>(bias_shape, data_type, 1);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

2348

TensorType dst;

2349

2350

const unsigned int M = lhs_shape[1];

2351

const unsigned int N = rhs_shape[0];

2352

const unsigned int K = lhs_shape[0];

Gian Marco Iodice

2019-06-26 17:18:11 +0100

[diff] [blame]

2353

GEMMKernelInfo kernel_info;

kernel_info.m = M;

kernel_info.n = N;

kernel_info.k = K;

kernel_info.depth_output_gemm3d = m_h;

2358

kernel_info.reinterpret_input_as_3d = false;

2359

kernel_info.broadcast_bias = true;

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

2360

kernel_info.activation_info = act_info;

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

2361

2362

// The output tensor will be auto-initialized within the function

2363

2364

// Create and configure function

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

2365

GEMMOperatorType gemm;

2366

gemm.configure(lhs.info(), rhs.info(), bias.info(), dst.info(), alpha, beta, lhs_info, rhs_info, kernel_info);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

2367

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

2368

ARM_COMPUTE_ASSERT(lhs.info()->is_resizable());

2369

ARM_COMPUTE_ASSERT(rhs.info()->is_resizable());

2370

ARM_COMPUTE_ASSERT(bias.info()->is_resizable());

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

2371

Giorgio Arena

2021-03-25 14:54:50 +0000

[diff] [blame]

2372

add_padding_x({ &lhs, &rhs, &bias, &dst });

2373

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

2374

// Allocate tensors

2375

lhs.allocator()->allocate();

2376

rhs.allocator()->allocate();

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

2377

bias.allocator()->allocate();

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

2378

dst.allocator()->allocate();

2379

Michele Di Giorgio

2021-04-30 18:30:41 +0100

[diff] [blame]

2380

ARM_COMPUTE_ASSERT(!lhs.info()->is_resizable());

2381

ARM_COMPUTE_ASSERT(!rhs.info()->is_resizable());

2382

ARM_COMPUTE_ASSERT(!bias.info()->is_resizable());

2383

ARM_COMPUTE_ASSERT(!dst.info()->is_resizable());

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

2384

2385

// Fill tensors

2386

fill(AccessorType(lhs), 0);

2387

fill(AccessorType(rhs), 1);

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

2388

fill(AccessorType(bias), 2);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

2389

2390

// Compute GEMM

Georgios Pinitas

2021-04-22 21:13:21 +0100

[diff] [blame]

2391

ITensorPack gemm_pack({ { ACL_SRC_0, &lhs },

2392

{ ACL_SRC_1, &rhs },

2393

{ ACL_SRC_2, &bias },

2394

{ ACL_DST, &dst }

2395

});

2396

gemm.run(gemm_pack);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

return dst;

}

Michalis Spyrou

2019-10-02 17:22:11 +0100

[diff] [blame]

2401

SimpleTensor<T> compute_reference(const TensorShape &lhs_shape, const TensorShape &rhs_shape, DataType data_type, float alpha, float beta, unsigned int m_h,

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

2402

const ActivationLayerInfo &act_info)

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

2403

{

2404

TensorShape dst_shape = lhs_shape;

2405

dst_shape.set(0, rhs_shape[0]);

2406

dst_shape.set(1, lhs_shape[1] / m_h);

2407

dst_shape.set(2, m_h);

2408

dst_shape.set(3, lhs_shape[2]);

2409

2410

// Create reference

2411

SimpleTensor<T> lhs{ lhs_shape, data_type, 1 };

2412

SimpleTensor<T> rhs{ rhs_shape, data_type, 1 };

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

2413

SimpleTensor<T> bias{ dst_shape, data_type, 1 };

2414

2415

const int n = rhs_shape[0];

2416

const int m = lhs_shape[1];

2417

const int batch_size = lhs_shape[2];

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

// Fill reference

fill(lhs, 0);

fill(rhs, 1);

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

2422

fill(bias, 2);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

2423

Gunes Bayir

2021-12-10 16:17:56 +0000

[diff] [blame]

2424

// In case of broadcast, we need to simply copy the first into the following "M" ones

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

2425

for(int i = 1; i < m * batch_size; i++)

2426

{

2427

memcpy(bias.data() + i * n, bias.data(), n * sizeof(T));

2428

}

2429

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

2430

return reference::activation_layer(reference::gemm<T>(lhs, rhs, bias, alpha, beta), act_info);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

2431

}

2432

2433

TensorType _target{};

2434

SimpleTensor<T> _reference{};

2435

};

2436

Gunes Bayir