Blame - src/core/NEON/kernels/NEGEMMLowpOffsetContributionKernel.cpp - ml/ComputeLibrary

// Configure the kernel.
//
// Runs validate_arguments() on the tensor infos, stores the tensors and offsets in the
// kernel members, precomputes _k_offset and then sets up the execution window.
//
// mm_result      - tensor whose info is validated and used to configure the window; must not be nullptr.
// vector_sum_col - may be nullptr when a_offset == 0 (it is only dereferenced when a_offset != 0).
// vector_sum_row - may be nullptr (only its info is forwarded, when present).
// k              - multiplied with both offsets to form _k_offset.
// a_offset       - stored in _a_offset.
// b_offset       - stored in _b_offset.
void NEGEMMLowpOffsetContributionKernel::configure(ITensor *mm_result, const ITensor *vector_sum_col, const ITensor *vector_sum_row, int32_t k, int32_t a_offset, int32_t b_offset)

343

{

Georgios Pinitas

a3b1b46

2017-11-16 19:24:39 +0000

[diff] [blame]

344

// Perform validate step

345

ARM_COMPUTE_ERROR_ON_NULLPTR(mm_result);

346

ARM_COMPUTE_ERROR_THROW_ON(validate_arguments(mm_result->info(),

347

vector_sum_col != nullptr ? vector_sum_col->info() : nullptr, // NOLINT

348

vector_sum_row != nullptr ? vector_sum_row->info() : nullptr, // NOLINT

349

a_offset, b_offset)); // NOLINT

Gian Marco

e75a02b

2017-11-08 12:24:09 +0000

[diff] [blame]

350

351

_vector_sum_col = vector_sum_col;

352

_vector_sum_row = vector_sum_row;

353

_mm_result = mm_result;

354

_a_offset = a_offset;

355

_b_offset = b_offset;

356

// Precompute the product of both offsets and k once; run() forwards it to run_offset_contribution()
_k_offset = a_offset * b_offset * k;

357

Georgios Pinitas

a3b1b46

2017-11-16 19:24:39 +0000

[diff] [blame]

358

// If a_offset == 0, vector_sum_col can be a nullptr
// NOTE(review): _slide_vector_sum_col is not assigned here when a_offset == 0; presumably it keeps its initial value - confirm against the constructor

359

if(a_offset != 0)

360

{

Georgios Pinitas

a3b1b46

2017-11-16 19:24:39 +0000

[diff] [blame]

361

// Check if vector_sum_col_shape should be slid or not

362

// Don't slide vector_sum_col_shape along the y dimension if vector_sum_col_shape has just 1 dimension and vector_sum_row_shape has more than 1

363

// This scenario can happen when the matrix multiplication is used to perform a convolution operation

Isabella Gottardi

e6630e4

2018-01-18 15:50:39 +0000

[diff] [blame]

364

_slide_vector_sum_col = vector_sum_col->info()->tensor_shape().num_dimensions() > 1;

Georgios Pinitas

a3b1b46

2017-11-16 19:24:39 +0000

[diff] [blame]

365

}

Gian Marco

e75a02b

2017-11-08 12:24:09 +0000

[diff] [blame]

366

367

// Configure kernel window

Georgios Pinitas

a3b1b46

2017-11-16 19:24:39 +0000

[diff] [blame]

368

auto win_config = validate_and_configure_window(mm_result->info(),

369

vector_sum_col != nullptr ? vector_sum_col->info() : nullptr, // NOLINT

370

vector_sum_row != nullptr ? vector_sum_row->info() : nullptr, // NOLINT

371

a_offset, b_offset);

372

// win_config.first carries the status of the window configuration, win_config.second the window itself
ARM_COMPUTE_ERROR_THROW_ON(win_config.first);

373

INEKernel::configure(win_config.second);

374

}

Gian Marco

e75a02b

2017-11-08 12:24:09 +0000

[diff] [blame]

375

Georgios Pinitas

631c41a

2017-12-06 11:53:03 +0000

[diff] [blame]

376

// Static validation counterpart of configure(): checks the arguments and the window
// configuration without configuring a kernel instance.
//
// mm_result is dereferenced unconditionally; vector_sum_col and vector_sum_row may be nullptr.
// Returns an empty Status{} when both checks pass; otherwise the failing check's status
// is expected to be returned by ARM_COMPUTE_RETURN_ON_ERROR.
Status NEGEMMLowpOffsetContributionKernel::validate(const ITensorInfo *mm_result, const ITensorInfo *vector_sum_col, const ITensorInfo *vector_sum_row,

377

int32_t a_offset, int32_t b_offset)

Georgios Pinitas

a3b1b46

2017-11-16 19:24:39 +0000

[diff] [blame]

378

{

379

ARM_COMPUTE_RETURN_ON_ERROR(validate_arguments(mm_result, vector_sum_col, vector_sum_row, a_offset, b_offset));

380

// The window check is run on clones of the infos (the inputs are const);
// presumably validate_and_configure_window() may modify the infos it receives - TODO confirm
ARM_COMPUTE_RETURN_ON_ERROR(validate_and_configure_window(mm_result->clone().get(),

381

vector_sum_col != nullptr ? vector_sum_col->clone().get() : nullptr,

382

vector_sum_row != nullptr ? vector_sum_row->clone().get() : nullptr,

383

a_offset, b_offset)

384

.first); // NOLINT

Gian Marco

e75a02b

2017-11-08 12:24:09 +0000

[diff] [blame]

385

Georgios Pinitas

631c41a

2017-12-06 11:53:03 +0000

[diff] [blame]

386

return Status{};

Gian Marco

e75a02b

2017-11-08 12:24:09 +0000

[diff] [blame]

387

}

388

389

// Execute the kernel on the given window.
//
// Checks that the kernel has been configured and that the window is a valid sub-window
// of the configured one, then forwards the state stored by configure() to
// run_offset_contribution(). The info argument is not used.
void NEGEMMLowpOffsetContributionKernel::run(const Window &window, const ThreadInfo &info)

390

{

391

ARM_COMPUTE_UNUSED(info);

392

ARM_COMPUTE_ERROR_ON_UNCONFIGURED_KERNEL(this);

393

ARM_COMPUTE_ERROR_ON_INVALID_SUBWINDOW(INEKernel::window(), window);

394

Georgios Pinitas

bb081ca

2018-11-08 10:22:01 +0000

[diff] [blame]

395

// Check if input is a 3D reinterpretation:
// true only when a row-sum vector is present, mm_result has more than one dimension,
// and the y extent of mm_result differs from the x extent of vector_sum_row

396

const bool reinterpret_as_3d = _vector_sum_row != nullptr

397

&& _mm_result->info()->num_dimensions() > 1

398

&& _mm_result->info()->tensor_shape().y() != _vector_sum_row->info()->tensor_shape().x();

Gian Marco

e75a02b

2017-11-08 12:24:09 +0000

[diff] [blame]

399

Michalis Spyrou

0028d7c

2020-06-22 13:45:17 +0100

[diff] [blame^]

400

run_offset_contribution(window, _mm_result, _vector_sum_col, _vector_sum_row, _a_offset, _b_offset, _k_offset, _slide_vector_sum_col, reinterpret_as_3d);

401

}