Blame - tests/validation/CL/GEMMMatrixMultiplyNative.cpp - ml/ComputeLibrary

2021-10-24 19:12:33 +0100

[diff] [blame]

206

/** Different Post Op Lists */

207

const auto post_op_lists = framework::dataset::make("post_op_lists", {

208

post_ops_1(),

209

post_ops_2(),

210

post_ops_3(),

ramelg01

6049eda

2021-10-29 10:52:53 +0100

[diff] [blame]

211

post_ops_4(),

212

post_ops_5()

213

} );

SiCongLi

2021-10-24 19:12:33 +0100

[diff] [blame]

214

215

/** Ask ClGemmMatrixMultiplyNativeKernel::validate() whether a list of fused post ops is accepted.
 *
 * Tensor infos are built with shapes (k, m, batch), (n, k, batch), (n) and (n, m, batch) for the
 * two inputs, the third input and the output respectively, using fixed LHS/RHS matrix descriptors.
 *
 * @param[in] m         First GEMM dimension forwarded to GEMMKernelInfo
 * @param[in] n         Second GEMM dimension forwarded to GEMMKernelInfo
 * @param[in] k         Third GEMM dimension forwarded to GEMMKernelInfo
 * @param[in] batch     Size of the third tensor dimension
 * @param[in] data_type Data type used for every tensor info
 * @param[in] post_ops  Post op list to be checked
 *
 * @return The status returned by validate(), converted to bool
 */
bool is_post_op_list_valid(unsigned int m, unsigned int n, unsigned int k, unsigned int batch, DataType data_type, const experimental::PostOpList<ITensorInfo*>& post_ops)
{
    const GEMMLHSMatrixInfo lhs_info(4, 4, 1, false, true);
    const GEMMRHSMatrixInfo rhs_info(4, 4, 1, true, true, false);

    // Tensor descriptors handed to the kernel validation
    TensorInfo lhs_desc(TensorShape(k, m, batch), 1, data_type);
    TensorInfo rhs_desc(TensorShape(n, k, batch), 1, data_type);
    TensorInfo bias_desc(TensorShape(n), 1, data_type);
    TensorInfo dst_desc(TensorShape(n, m, batch), 1, data_type);

    GEMMKernelInfo gemm_info(m, n, k,
                             0,     // Depth of the output tensor in case it is reinterpreted as 3D
                             false, // Reinterpret the input as 3D
                             true,  // Flag used to broadcast the bias addition
                             false, // Wider accumulation
                             false, // Has pad y
                             ActivationLayerInfo::ActivationFunction::IDENTITY,
                             1,     // Multiplication factor for the width of the 1xW transposed block
                             1,     // Multiplication factor for the height of the 4x4 interleaved block
                             lhs_info,
                             rhs_info,
                             0,     // Offset to be added to each element of the matrix A
                             0,     // Offset to be added to each element of the matrix B
                             post_ops);

    // validate() is given resizable clones rather than the descriptors themselves
    const auto lhs_clone  = lhs_desc.clone();
    const auto rhs_clone  = rhs_desc.clone();
    const auto bias_clone = bias_desc.clone();
    const auto dst_clone  = dst_desc.clone();
    lhs_clone->set_is_resizable(true);
    rhs_clone->set_is_resizable(true);
    bias_clone->set_is_resizable(true);
    dst_clone->set_is_resizable(true);

    const auto status = ClGemmMatrixMultiplyNativeKernel::validate(lhs_clone.get(),
                                                                   rhs_clone.get(),
                                                                   bias_clone.get(),
                                                                   dst_clone.get(),
                                                                   1.f, 1.f,
                                                                   lhs_info,
                                                                   rhs_info,
                                                                   gemm_info);
    return bool(status);
}

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

248

/** Configuration test */

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

249

void validate_configuration(unsigned int m_value, unsigned int n_value, unsigned int k_value, unsigned int b_value, unsigned int m0_value, unsigned int n0_value, unsigned int k0_value, bool broadcast_bias, DataType data_type, const ActivationLayerInfo &act_info)

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

250

{

251

const unsigned int M = m_value;

252

const unsigned int N = n_value;

253

const unsigned int K = k_value;

254

255

GEMMLHSMatrixInfo lhs_info;

256

lhs_info.m0 = m0_value;

257

lhs_info.k0 = k0_value;

258

259

GEMMRHSMatrixInfo rhs_info;

260

rhs_info.n0 = n0_value;

261

rhs_info.k0 = k0_value;

262

Gian Marco Iodice

7026b30

2019-06-26 17:18:11 +0100

[diff] [blame]

263

GEMMKernelInfo kernel_info;

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

kernel_info.m = M;

kernel_info.n = N;

kernel_info.k = K;

kernel_info.broadcast_bias = broadcast_bias;

268

kernel_info.activation_info = act_info;

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

269

270

const TensorShape lhs_shape(K, M, b_value);

271

const TensorShape rhs_shape(N, K, b_value);

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

272

const TensorShape bias_shape(N,

273

broadcast_bias? 1 : M,

274

broadcast_bias? 1 : b_value);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

275

const TensorShape dst_shape = compute_mm_shape(TensorInfo(lhs_shape, 1, data_type),

276

TensorInfo(rhs_shape, 1, data_type),

Gian Marco Iodice

7026b30

2019-06-26 17:18:11 +0100

[diff] [blame]

277

kernel_info);

278

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

279

// Create tensors

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

280

CLTensor lhs = create_tensor<CLTensor>(lhs_shape, data_type);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

281

CLTensor rhs = create_tensor<CLTensor>(rhs_shape, data_type);

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

282

CLTensor bias = create_tensor<CLTensor>(bias_shape, data_type);

283

CLTensor dst = create_tensor<CLTensor>(dst_shape, data_type);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

284

285

ARM_COMPUTE_EXPECT(lhs.info()->is_resizable(), framework::LogLevel::ERRORS);

286

ARM_COMPUTE_EXPECT(rhs.info()->is_resizable(), framework::LogLevel::ERRORS);

Gian Marco Iodice

2019-06-24 14:40:30 +0100

[diff] [blame]

287

ARM_COMPUTE_EXPECT(bias.info()->is_resizable(), framework::LogLevel::ERRORS);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

288

ARM_COMPUTE_EXPECT(dst.info()->is_resizable(), framework::LogLevel::ERRORS);

289

290

// Create and configure function

291

CLGEMMMatrixMultiplyNative gemm;

Georgios Pinitas

856f66e

2021-04-22 21:13:21 +0100

[diff] [blame]

292

gemm.configure(lhs.info(), rhs.info(), bias.info(), dst.info(), 1.0f, 1.0f, lhs_info, rhs_info, kernel_info);

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

}

} // namespace

TEST_SUITE(CL)

TEST_SUITE(GEMMMatrixMultiplyNative)

SiCongLi

2021-10-24 19:12:33 +0100

[diff] [blame]

298

TEST_SUITE(ValidateFusedPostOpsConfigs)

299

TEST_SUITE(Invalid)

300

// A list made of two consecutive element-wise additions is expected to be rejected by the validation
TEST_CASE(UnsupportedPostOpSequence, framework::DatasetMode::ALL)
{
    const DataType         data_type = DataType::F32;
    constexpr unsigned int m         = 17;
    constexpr unsigned int n         = 1;
    constexpr unsigned int k         = 13;
    constexpr unsigned int batch     = 2;

    // Both post op arguments have shape (n, m, batch); the second one is a clone of the first
    TensorInfo first_arg_info(TensorShape(n, m, batch), 1, data_type);
    const auto second_arg_info = first_arg_info.clone();

    // Unsupported sequence of post ops
    experimental::PostOpList<ITensorInfo*> post_ops{};
    post_ops.push_back_op<experimental::PostOpEltwiseAdd<ITensorInfo*>>(&first_arg_info, 1, ConvertPolicy::SATURATE);
    post_ops.push_back_op<experimental::PostOpEltwiseAdd<ITensorInfo*>>(second_arg_info.get(), 0, ConvertPolicy::SATURATE);

    ARM_COMPUTE_EXPECT(is_post_op_list_valid(m, n, k, batch, data_type, post_ops) == false, framework::LogLevel::ERRORS);
}

324

// Invalid broadcast: the post op argument is larger than the output in Y, i.e. it would "widen" the output
TEST_CASE(OutputWidened, framework::DatasetMode::ALL)
{
    const DataType         data_type = DataType::F32;
    constexpr unsigned int m         = 1;
    constexpr unsigned int n         = 18;
    constexpr unsigned int k         = 13;
    constexpr unsigned int batch     = 2;

    // Y extent is m + 1 while the output's Y extent is m, which is not allowed
    TensorInfo widened_arg_info(TensorShape(n, m + 1, batch), 1, data_type);

    experimental::PostOpList<ITensorInfo*> post_ops{};
    post_ops.push_back_op<experimental::PostOpEltwiseAdd<ITensorInfo*>>(&widened_arg_info, 0, ConvertPolicy::SATURATE);

    ARM_COMPUTE_EXPECT(is_post_op_list_valid(m, n, k, batch, data_type, post_ops) == false, framework::LogLevel::ERRORS);
}

339

// Invalid broadcast: the post op argument is broadcast in the first dimension (X) only
TEST_CASE(BroadcastInXDimOnly, framework::DatasetMode::ALL)
{
    const DataType         data_type = DataType::F32;
    constexpr unsigned int m         = 22;
    constexpr unsigned int n         = 16;
    constexpr unsigned int k         = 15;
    constexpr unsigned int batch     = 3;

    // Argument shape is (1, m, batch) against an output of (n, m, batch)
    TensorInfo x_broadcast_arg_info(TensorShape(1, m, batch), 1, data_type);

    experimental::PostOpList<ITensorInfo*> post_ops{};
    post_ops.push_back_op<experimental::PostOpEltwiseAdd<ITensorInfo*>>(&x_broadcast_arg_info, 0, ConvertPolicy::SATURATE);

    ARM_COMPUTE_EXPECT(is_post_op_list_valid(m, n, k, batch, data_type, post_ops) == false, framework::LogLevel::ERRORS);
}

354

TEST_SUITE_END() // Invalid

355

TEST_SUITE(Valid)

356

// A post op list without any operation is expected to pass the validation
TEST_CASE(EmptyPostOpList, framework::DatasetMode::ALL)
{
    const DataType         data_type = DataType::F32;
    constexpr unsigned int m         = 22;
    constexpr unsigned int n         = 16;
    constexpr unsigned int k         = 15;
    constexpr unsigned int batch     = 3;

    // Nothing is pushed into the list
    experimental::PostOpList<ITensorInfo*> post_ops{};

    ARM_COMPUTE_EXPECT(is_post_op_list_valid(m, n, k, batch, data_type, post_ops) == true, framework::LogLevel::ERRORS);
}

367

// Valid broadcast: the post op argument has extent 1 in the second dimension (Y) only
TEST_CASE(BroadcastInYDimOnly, framework::DatasetMode::ALL)
{
    const DataType         data_type = DataType::F32;
    constexpr unsigned int m         = 22;
    constexpr unsigned int n         = 16;
    constexpr unsigned int k         = 15;
    constexpr unsigned int batch     = 3;

    // Argument shape is (n, 1, batch) against an output of (n, m, batch)
    TensorInfo y_broadcast_arg_info(TensorShape(n, 1, batch), 1, data_type);

    experimental::PostOpList<ITensorInfo*> post_ops{};
    post_ops.push_back_op<experimental::PostOpEltwiseAdd<ITensorInfo*>>(&y_broadcast_arg_info, 0, ConvertPolicy::SATURATE);

    ARM_COMPUTE_EXPECT(is_post_op_list_valid(m, n, k, batch, data_type, post_ops) == true, framework::LogLevel::ERRORS);
}

381

// Valid broadcast: the post op argument has extent 1 in both the X and Y dimensions
TEST_CASE(BroadcastInBothXandYDims, framework::DatasetMode::ALL)
{
    const DataType         data_type = DataType::F32;
    constexpr unsigned int m         = 22;
    constexpr unsigned int n         = 16;
    constexpr unsigned int k         = 15;
    constexpr unsigned int batch     = 3;

    // Argument shape is (1, 1, batch) against an output of (n, m, batch)
    TensorInfo xy_broadcast_arg_info(TensorShape(1, 1, batch), 1, data_type);

    experimental::PostOpList<ITensorInfo*> post_ops{};
    post_ops.push_back_op<experimental::PostOpEltwiseAdd<ITensorInfo*>>(&xy_broadcast_arg_info, 0, ConvertPolicy::SATURATE);

    ARM_COMPUTE_EXPECT(is_post_op_list_valid(m, n, k, batch, data_type, post_ops) == true, framework::LogLevel::ERRORS);
}

395

// Valid broadcast: the post op argument has extent 1 in every dimension
TEST_CASE(BroadcastInAllDims, framework::DatasetMode::ALL)
{
    const DataType         data_type = DataType::F32;
    constexpr unsigned int m         = 22;
    constexpr unsigned int n         = 16;
    constexpr unsigned int k         = 15;
    constexpr unsigned int batch     = 3;

    // Argument shape is (1, 1, 1) against an output of (n, m, batch)
    TensorInfo full_broadcast_arg_info(TensorShape(1, 1, 1), 1, data_type);

    experimental::PostOpList<ITensorInfo*> post_ops{};
    post_ops.push_back_op<experimental::PostOpEltwiseAdd<ITensorInfo*>>(&full_broadcast_arg_info, 0, ConvertPolicy::SATURATE);

    ARM_COMPUTE_EXPECT(is_post_op_list_valid(m, n, k, batch, data_type, post_ops) == true, framework::LogLevel::ERRORS);
}

409

TEST_SUITE_END() // Valid

410

TEST_SUITE_END() // ValidateFusedPostOpsConfigs

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

411

TEST_SUITE(Float)

412

TEST_SUITE(FP32)

Gian Marco Iodice

2019-07-16 15:46:48 +0100

[diff] [blame]

413

// Runs validate_configuration() with DataType::F32 for every combination of the datasets below (batch size fixed to 1)
DATA_TEST_CASE(Configuration, framework::DatasetMode::ALL,
               combine(combine(combine(combine(combine(combine(combine(combine(
                   m_values,
                   n_values),
                   k_values),
                   framework::dataset::make("batch_size", 1)),
                   m0_values_precommit),
                   n0_values_precommit),
                   k0_values_precommit),
                   broadcast_bias_values),
                   act_values),
               m_value, n_value, k_value, b_value, m0_value, n0_value, k0_value, broadcast_bias, act_value)
{
    validate_configuration(m_value, n_value, k_value, b_value, m0_value, n0_value, k0_value, broadcast_bias, DataType::F32, act_value);
}

427

SiCong Li

b972ae6

2020-08-03 15:39:45 +0100

[diff] [blame]

428

// Boundary handling case with M = 3 and N = 1 combined with boundary_handling_cases
FIXTURE_DATA_TEST_CASE(RunSmallBoundaryHandlingPartialInXPartialInY, CLGEMMMatrixMultiplyNativeFixture<float>, framework::DatasetMode::ALL,
                       combine(combine(framework::dataset::make("M", 3),
                                       framework::dataset::make("N", 1)),
                               boundary_handling_cases))
{
    // Compare the fixture's target against its reference using the FP32 tolerances
    validate(CLAccessor(_target), _reference, rel_tolerance_f32, 0.f, abs_tolerance_f32);
}

437

438

// Boundary handling case with M = 64 and N = 51 combined with boundary_handling_cases
FIXTURE_DATA_TEST_CASE(RunSmallBoundaryHandlingPartialInXFullInY, CLGEMMMatrixMultiplyNativeFixture<float>, framework::DatasetMode::ALL,
                       combine(combine(framework::dataset::make("M", 64),
                                       framework::dataset::make("N", 51)),
                               boundary_handling_cases))
{
    // Compare the fixture's target against its reference using the FP32 tolerances
    validate(CLAccessor(_target), _reference, rel_tolerance_f32, 0.f, abs_tolerance_f32);
}

447

448

// Boundary handling case with M = 64 and N = 32 combined with boundary_handling_cases
FIXTURE_DATA_TEST_CASE(RunSmallBoundaryHandlingFullInXFullInY, CLGEMMMatrixMultiplyNativeFixture<float>, framework::DatasetMode::ALL,
                       combine(combine(framework::dataset::make("M", 64),
                                       framework::dataset::make("N", 32)),
                               boundary_handling_cases))
{
    // Compare the fixture's target against its reference using the FP32 tolerances
    validate(CLAccessor(_target), _reference, rel_tolerance_f32, 0.f, abs_tolerance_f32);
}

457

458

// Boundary handling case with M = 37 and N = 32 combined with boundary_handling_cases
FIXTURE_DATA_TEST_CASE(RunSmallBoundaryHandlingFullInXPartialInY, CLGEMMMatrixMultiplyNativeFixture<float>, framework::DatasetMode::ALL,
                       combine(combine(framework::dataset::make("M", 37),
                                       framework::dataset::make("N", 32)),
                               boundary_handling_cases))
{
    // Compare the fixture's target against its reference using the FP32 tolerances
    validate(CLAccessor(_target), _reference, rel_tolerance_f32, 0.f, abs_tolerance_f32);
}

467

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

468

// FP32 run over the precommit block sizes, registered for DatasetMode::ALL
FIXTURE_DATA_TEST_CASE(RunSmall, CLGEMMMatrixMultiplyNativeFixture<float>, framework::DatasetMode::ALL,
                       combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(
                           m_values,
                           n_values),
                           k_values),
                           b_values),
                           m0_values_precommit),
                           n0_values_precommit),
                           k0_values_precommit),
                           framework::dataset::make("DataType", DataType::F32)),
                           a_values),
                           beta_values),
                           broadcast_bias_values),
                           act_values))
{
    // Compare the fixture's target against its reference using the FP32 tolerances
    validate(CLAccessor(_target), _reference, rel_tolerance_f32, 0.f, abs_tolerance_f32);
}

486

Michalis Spyrou

1d89777

2019-12-09 18:47:29 +0000

[diff] [blame]

487

// FP32 run over the nightly block sizes; registered with DatasetMode::DISABLED
FIXTURE_DATA_TEST_CASE(RunLarge, CLGEMMMatrixMultiplyNativeFixture<float>, framework::DatasetMode::DISABLED,
                       combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(
                           m_values,
                           n_values),
                           k_values),
                           b_values),
                           m0_values_nightly),
                           n0_values_nightly),
                           k0_values_nightly),
                           framework::dataset::make("DataType", DataType::F32)),
                           a_values),
                           beta_values),
                           broadcast_bias_values),
                           act_values))
{
    // Compare the fixture's target against its reference using the FP32 tolerances
    validate(CLAccessor(_target), _reference, rel_tolerance_f32, 0.f, abs_tolerance_f32);
}

505

506

// FP32 run of the 3D fixture over the precommit block sizes, registered for DatasetMode::ALL
FIXTURE_DATA_TEST_CASE(RunSmall3D, CLGEMMMatrixMultiplyNative3DFixture<float>, framework::DatasetMode::ALL,
                       combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(
                           m_w_values,
                           m_h_values),
                           n_values),
                           k_values),
                           b_values),
                           m0_values_precommit),
                           n0_values_precommit),
                           k0_values_precommit),
                           framework::dataset::make("DataType", DataType::F32)),
                           a_values),
                           beta_values),
                           act_values))
{
    // Compare the fixture's target against its reference using the FP32 tolerances
    validate(CLAccessor(_target), _reference, rel_tolerance_f32, 0.f, abs_tolerance_f32);
}

524

Michalis Spyrou

1d89777

2019-12-09 18:47:29 +0000

[diff] [blame]

525

// FP32 run of the 3D fixture over the nightly block sizes; registered with DatasetMode::DISABLED
FIXTURE_DATA_TEST_CASE(RunLarge3D, CLGEMMMatrixMultiplyNative3DFixture<float>, framework::DatasetMode::DISABLED,
                       combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(
                           m_w_values,
                           m_h_values),
                           n_values),
                           k_values),
                           b_values),
                           m0_values_nightly),
                           n0_values_nightly),
                           k0_values_nightly),
                           framework::dataset::make("DataType", DataType::F32)),
                           a_values),
                           beta_values),
                           act_values))
{
    // Compare the fixture's target against its reference using the FP32 tolerances
    validate(CLAccessor(_target), _reference, rel_tolerance_f32, 0.f, abs_tolerance_f32);
}

SiCongLi

2021-10-24 19:12:33 +0100

[diff] [blame]

543

544

TEST_SUITE(FusedPostOps)

545

546

// FP32 run with fused post ops: M0 fixed to 4, alpha and beta fixed to 1.0f, default ActivationLayerInfo,
// bias both broadcast and not broadcast, and every entry of post_op_lists
FIXTURE_DATA_TEST_CASE(RunSmall, CLGEMMMatrixMultiplyNativeWithPostOpsFixture<float>, framework::DatasetMode::ALL,
                       combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(combine(
                           m_values,
                           n_values),
                           k_values),
                           b_values),
                           framework::dataset::make("M0", { 4 })),
                           n0_values_precommit),
                           k0_values_precommit),
                           framework::dataset::make("DataType", DataType::F32)),
                           framework::dataset::make("alpha", {1.0f} )),
                           framework::dataset::make("beta", {1.0f} )),
                           framework::dataset::make("broadcast_bias", { false, true } )),
                           framework::dataset::make("Activation", { ActivationLayerInfo() })),
                           post_op_lists)
                       )
{
    // Compare the fixture's target against its reference using the FP32 tolerances
    validate(CLAccessor(_target), _reference, rel_tolerance_f32, 0.f, abs_tolerance_f32);
}

566

567

TEST_SUITE_END() // FusedPostOps

568

giuros01

2019-04-01 13:50:22 +0100

[diff] [blame]

569

TEST_SUITE_END() // FP32

giuros01