// Copyright (c) 2020-2022, ARM Limited.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//      http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

#include "tensor_ops.h"
#include "quant_util.h"
#include "template_types.h"
#include "half.hpp"

using namespace TosaReference;
using namespace Eigen;
using namespace tosa;

int check_pool2d_attribute(tosa::TosaPoolAttribute* attribute,
                           std::vector<int32_t> input_shape,
                           std::vector<int32_t> output_shape,
                           std::string& msg)
{
    if (attribute->pad().size() != 4)
    {
        msg = "illegal size for attribute padding";
        return 1;
    }

    if (attribute->kernel().size() != 2)
    {
        msg = "illegal size for attribute kernel";
        return 1;
    }

    if (attribute->stride().size() != 2)
    {
        msg = "illegal size for attribute stride";
        return 1;
    }

    for (int32_t i : attribute->pad())
    {
        if (i < 0)
        {
            msg = "At least one pad is smaller than zero";
            return 1;
        }
    }

    for (int32_t i : attribute->kernel())
    {
        if (i < 1)
        {
            msg = "At least one kernel dimension is smaller than one";
            return 1;
        }
    }

    for (int32_t i : attribute->stride())
    {
        if (i < 1)
        {
            msg = "At least one stride dimension is smaller than one";
            return 1;
        }
    }

    int32_t IH = input_shape[1];
    int32_t IW = input_shape[2];
    int32_t OH = output_shape[1];
    int32_t OW = output_shape[2];

    int32_t pad_top    = attribute->pad()[0];
    int32_t pad_bottom = attribute->pad()[1];
    int32_t pad_left   = attribute->pad()[2];
    int32_t pad_right  = attribute->pad()[3];

    int32_t stride_y = attribute->stride()[0];
    int32_t stride_x = attribute->stride()[1];
    int32_t kernel_y = attribute->kernel()[0];
    int32_t kernel_x = attribute->kernel()[1];

    if (pad_top >= kernel_y || pad_bottom >= kernel_y || pad_left >= kernel_x || pad_right >= kernel_x)
    {
        msg = "At least one pad is >= kernel dimension";
        return 1;
    }

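    // The pooled output size must be exact: full_H and full_W below must divide evenly
    // by the stride. Worked example (values assumed for illustration): IH = 32,
    // pad_top = pad_bottom = 1, kernel_y = 2, stride_y = 2 gives
    // full_H = 32 + 1 + 1 - 2 = 32; 32 % 2 == 0, so the expected OH is (32 / 2) + 1 = 17.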
    int32_t full_H = IH + pad_top + pad_bottom - kernel_y;
    int32_t full_W = IW + pad_left + pad_right - kernel_x;

    if ((full_H % stride_y != 0) ||
        (full_W % stride_x != 0))
    {
        msg = "Parameters must yield exact integer output dimensions";
        return 1;
    }

    if ((OH != (full_H / stride_y) + 1) ||
        (OW != (full_W / stride_x) + 1))
    {
        msg = "Mismatch between output shape provided and expected output shape (" +
              std::to_string((full_H / stride_y) + 1) + "," +
              std::to_string((full_W / stride_x) + 1) + ")";
        return 1;
    }

    return 0;
}

int check_conv_attribute(tosa::TosaConvAttribute* attribute,
                         uint32_t conv_dimension,
                         std::vector<int32_t> input_shape,
                         std::vector<int32_t> output_shape,
                         std::vector<int32_t> weights,
                         uint32_t offset_kernel,
                         DType InDtype,
                         DType WeightDtype,
                         std::string& msg)
{
    if (attribute->pad().size() != (2 * conv_dimension))
    {
        msg = "Illegal size for attribute pad";
        return 1;
    }

    if (attribute->stride().size() != conv_dimension)
    {
        msg = "Illegal size for attribute stride";
        return 1;
    }

    if (attribute->dilation().size() != conv_dimension)
    {
        msg = "Illegal size for attribute dilation";
        return 1;
    }

    for (int32_t i : attribute->pad())
    {
        if (i < 0)
        {
            msg = "At least one pad is smaller than zero";
            return 1;
        }
    }

    for (int32_t i : attribute->stride())
    {
        if (i < 1)
        {
            msg = "At least one stride dimension is smaller than one";
            return 1;
        }
    }

    for (int32_t i : attribute->dilation())
    {
        if (i < 1)
        {
            msg = "At least one dilation dimension is smaller than one";
            return 1;
        }
    }

    ASSERT_MSG(conv_dimension == 2 || conv_dimension == 3, "Unsupported convolution dimension")

    int32_t offset_d = conv_dimension == 3 ? 1 : 0;
    int32_t ID = conv_dimension == 3 ? input_shape[1] : 1;
    int32_t IH = input_shape[1 + offset_d];
    int32_t IW = input_shape[2 + offset_d];
    int32_t OD = conv_dimension == 3 ? output_shape[1] : 1;
    int32_t OH = output_shape[1 + offset_d];
    int32_t OW = output_shape[2 + offset_d];

    int32_t stride_d   = conv_dimension == 3 ? attribute->stride()[0] : 1;
    int32_t stride_y   = attribute->stride()[0 + offset_d];
    int32_t stride_x   = attribute->stride()[1 + offset_d];
    int32_t kernel_d   = conv_dimension == 3 ? weights[offset_kernel] : 1;
    int32_t kernel_h   = weights[offset_kernel + offset_d];
    int32_t kernel_w   = weights[offset_kernel + 1 + offset_d];
    int32_t dilation_d = conv_dimension == 3 ? attribute->dilation()[0] : 1;
    int32_t dilation_y = attribute->dilation()[0 + offset_d];
    int32_t dilation_x = attribute->dilation()[1 + offset_d];

    offset_d *= 2;
    int32_t pad_d0     = conv_dimension == 3 ? attribute->pad()[0] : 0;
    int32_t pad_d1     = conv_dimension == 3 ? attribute->pad()[1] : 0;
    int32_t pad_top    = attribute->pad()[0 + offset_d];
    int32_t pad_bottom = attribute->pad()[1 + offset_d];
    int32_t pad_left   = attribute->pad()[2 + offset_d];
    int32_t pad_right  = attribute->pad()[3 + offset_d];

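    // Output size follows the dilated-convolution formula; the effective kernel extent
    // is (kernel - 1) * dilation + 1. Worked example (values assumed for illustration):
    // IH = 16, pad_top = pad_bottom = 1, kernel_h = 3, dilation_y = 2 gives
    // full_H = 16 - 1 + 1 + 1 - (3 - 1) * 2 = 13; with stride_y = 1 the expected OH is 14.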
    int32_t full_D = ID - 1 + pad_d0 + pad_d1 - (kernel_d - 1) * dilation_d;
    int32_t full_H = IH - 1 + pad_top + pad_bottom - (kernel_h - 1) * dilation_y;
    int32_t full_W = IW - 1 + pad_left + pad_right - (kernel_w - 1) * dilation_x;

    if ((full_H % stride_y != 0) ||
        (full_W % stride_x != 0) ||
        (full_D % stride_d != 0))
    {
        msg = "Parameters must yield exact integer output dimensions";
        return 1;
    }

    if ((OH != (full_H / stride_y) + 1) ||
        (OW != (full_W / stride_x) + 1) ||
        (OD != (full_D / stride_d) + 1))
    {
        std::string msg_d = "";
        if (conv_dimension == 3)
        {
            msg_d += std::to_string((full_D / stride_d) + 1) + ",";
        }
        msg = "Mismatch between output shape provided and expected output shape (" +
              msg_d +
              std::to_string((full_H / stride_y) + 1) + "," +
              std::to_string((full_W / stride_x) + 1) + ")";
        return 1;
    }

    if (InDtype != DType_INT8 && attribute->input_zp() != 0) {
        msg = "Input zero point must be zero for non-int8 data";
        return 1;
    }
    if (WeightDtype != DType_INT8 && attribute->weight_zp() != 0) {
        msg = "Weight zero point must be zero for non-int8 data";
        return 1;
    }

    return 0;
}

template <int Rank, DType Dtype>
OpArgMax<Rank, Dtype>::OpArgMax(SubgraphTraverser* sgt_,
                                TosaAttributeBase* attribute_,
                                uint64_t id_)
    : GraphNode(sgt_, Op_ARGMAX, id_)
{
    setRequiredOperands(1, 1);
    setRequiredRank(1, 4);

    INIT_ATTRIBUTE(Axis);
}

template <int Rank, DType Dtype>
OpArgMax<Rank, Dtype>::~OpArgMax()
{
    if (attribute)
        delete attribute;
}

template <int Rank, DType Dtype>
int OpArgMax<Rank, Dtype>::checkTensorAttributes()
{
    if (validateRequiredOperands())
        return 1;

    if (validateRequiredRank(inputs[0]))
    {
        return 1;
    }

    int32_t output_rank = inputs[0]->getRank() - 1;
    if (output_rank != outputs[0]->getRank())
    {
        printNodeValidationError("OpArgMax: Output rank needs to be rank(input) - 1");
        return 1;
    }

    if (outputs[0]->getDtype() != DType_INT32)
    {
        printNodeValidationError("OpArgMax: Output data type not supported for this configuration of operator");
        return 1;
    }

    input  = dynamic_cast<TosaReference::TensorTemplate<TIn>*>(inputs[0]);
    output = dynamic_cast<TosaReference::TensorTemplate<TOut>*>(outputs[0]);

    if (attribute->axis() < 0 || attribute->axis() >= input->getRank())
    {
        printNodeValidationError("OpArgMax: Axis needs to be within [0, rank(input) - 1]");
        return 1;
    }

    bool shape_check = true;
    for (int32_t i = 0; i < input->getRank(); i++)
    {
        if (i < attribute->axis())
        {
            if (input->getShape()[i] != output->getShape()[i])
            {
                shape_check = false;
                break;
            }
        }
        else if (i > attribute->axis())
        {
            if (input->getShape()[i] != output->getShape()[i - 1])
            {
                shape_check = false;
                break;
            }
        }
        // No need to check i == axis
    }
    if (!shape_check)
    {
        printNodeValidationError("OpArgMax: Mismatch between output shape provided and expected output shape");
        return 1;
    }

    return 0;
}

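// eval() relies on Eigen's argmax() reduction, which yields a DenseIndex (a signed,
// pointer-sized integer) per output element; the unaryExpr below narrows each index to
// the INT32 output type.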
template <int Rank, DType Dtype>
int OpArgMax<Rank, Dtype>::eval()
{
    Eigen::Tensor<DenseIndex, Rank - 1> index = this->input->getTensor().argmax(attribute->axis());

    this->output->getTensor() = index.unaryExpr([](DenseIndex in) -> OutEigenType { return (OutEigenType)in; });

    return GraphNode::eval();
}

template <DType Dtype, DType AccDtype>
OpAvgPool2d<Dtype, AccDtype>::OpAvgPool2d(SubgraphTraverser* sgt_,
                                          TosaAttributeBase* attribute_,
                                          uint64_t id_)
    : GraphNode(sgt_, Op_AVG_POOL2D, id_)
{
    setRequiredOperands(1, 1);
    setRequiredRank(4);

    INIT_ATTRIBUTE(Pool);
}

template <DType Dtype, DType AccDtype>
OpAvgPool2d<Dtype, AccDtype>::~OpAvgPool2d()
{
    if (attribute)
        delete attribute;
}

template <DType Dtype, DType AccDtype>
int OpAvgPool2d<Dtype, AccDtype>::checkTensorAttributes()
{
    if (validateRequiredOperands())
        return 1;

    if (validateRequiredRank(inputs[0]) || validateRequiredRank(outputs[0]))
    {
        return 1;
    }

    if (inputs[0]->matchType(*outputs[0]))
    {
        printNodeValidationError("OpAvgPool2d: input and output tensor type mismatch");
        return 1;
    }

    in  = dynamic_cast<TosaReference::TensorTemplate<TIn>*>(inputs[0]);
    out = dynamic_cast<TosaReference::TensorTemplate<TOut>*>(outputs[0]);

    ERROR_IF(Dtype != DType_INT8 && attribute->input_zp() != 0, "OpAvgPool2d: Input zeropoint must be zero for non int8_t data");
    ERROR_IF(Dtype != DType_INT8 && attribute->output_zp() != 0, "OpAvgPool2d: Output zeropoint must be zero for non int8_t data");

    std::string msg;
    if (check_pool2d_attribute(attribute, in->getShape(), out->getShape(), msg))
    {
        msg = "OpAvgPool2d: " + msg;
        printNodeValidationError(msg.c_str());
        return 1;
    }

    return 0;
}

// This calculates the divisor for each output location along an axis: the number of
// input elements covered by the window, excluding padding.
// Average pooling only divides by the number of elements used, not including padding.
// This function uses left/right, but is also used for vertical padding with top/bottom
template <DType Dtype, DType AccDtype>
ETensor1<int32_t> OpAvgPool2d<Dtype, AccDtype>::calculate_div_map_1d(int in_size, int out_size, int kernel_size, int stride, int32_t pad_left, int32_t pad_right)
{
    ETensor1<int32_t> result(out_size);

    result.setConstant(kernel_size);

    // adjust divisors on the left side for padding
    // We start at the leftmost output element, and remove pad_left - (index * stride) elements
    // until we have no more padding being used
    for (int index = 0; (index <= pad_left / stride) && (index < out_size); index++) {
        int32_t adjust = pad_left - (index * stride);
        result(index) -= adjust;
    }

    // The process repeats on the right side. Padding starts taking effect as we
    // near the rightmost input element. The first output element which touches
    // padding is defined in the initialization of index below. Then we keep moving
    // to the right, increasing padding until we get to the last output element.
    int index = std::max(0, ((pad_left + in_size - kernel_size) / stride) + 1);
    for (; index < out_size; index++) {
        int32_t adjust = ((index * stride) + kernel_size) - (pad_left + in_size);
        result(index) -= adjust;
    }
    return result;
}
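// Worked example (values assumed for illustration): in_size = 4, out_size = 4,
// kernel_size = 3, stride = 1, pad_left = pad_right = 1 produces div_map = [2, 3, 3, 2];
// the first and last windows each cover one padding element, so they divide by 2
// instead of 3.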

// Assuming input and output tensors have the same scale, as in the TFLite reference,
// no input or output rescaling is needed.
template <DType Dtype, DType AccDtype>
int OpAvgPool2d<Dtype, AccDtype>::eval()
{
    int in_batch    = this->in->getShape()[0];
    int in_height   = this->in->getShape()[1];
    int in_width    = this->in->getShape()[2];
    int in_channels = this->in->getShape()[3];

    int out_batch    = this->out->getShape()[0];
    int out_height   = this->out->getShape()[1];
    int out_width    = this->out->getShape()[2];
    int out_channels = this->out->getShape()[3];

    ERROR_IF(in_batch != out_batch, "OpAvgPool2d: tensor batch mismatch %d != %d", in_batch, out_batch);
    ERROR_IF(in_channels != out_channels, "OpAvgPool2d: tensor channel mismatch %d != %d", in_channels, out_channels);

    int pad_top    = this->attribute->pad()[0];
    int pad_bottom = this->attribute->pad()[1];
    int pad_left   = this->attribute->pad()[2];
    int pad_right  = this->attribute->pad()[3];
    int kernel_h   = this->attribute->kernel()[0];
    int kernel_w   = this->attribute->kernel()[1];
    int stride_h   = this->attribute->stride()[0];
    int stride_w   = this->attribute->stride()[1];

    tosa::DType accum_dtype = (tosa::DType)this->attribute->accum_dtype();

    DEBUG_INFO(OP,
               "perform AvgPool2d, input.shape=[%d,%d,%d,%d], output.shape=[%d,%d,%d,%d], kernel=[%d,%d], "
               "stride=[%d,%d], pad=[%d,%d,%d,%d], accum_dtype=%s",
               in_batch, in_height, in_width, in_channels, out_batch, out_height, out_width, out_channels, kernel_h,
               kernel_w, stride_h, stride_w, pad_top, pad_bottom, pad_left, pad_right, EnumNamesDType()[accum_dtype]);

    Eigen::array<Eigen::Index, 2> im2col_input_dims;
    im2col_input_dims[0] = kernel_h * kernel_w;
    im2col_input_dims[1] = out_batch * out_height * out_width * out_channels;

    Eigen::array<Eigen::Index, 4> col2im_output_dims;
    col2im_output_dims[0] = out_batch;
    col2im_output_dims[1] = out_height;
    col2im_output_dims[2] = out_width;
    col2im_output_dims[3] = out_channels;

    Eigen::array<std::pair<int32_t, int32_t>, 4> pad;
    pad[0] = std::make_pair(0, 0);
    pad[1] = std::make_pair(pad_top, pad_bottom);
    pad[2] = std::make_pair(pad_left, pad_right);
    pad[3] = std::make_pair(0, 0);

    ETensor4<InEigenType> input_val = this->in->getTensor();
    if (Dtype == DType_INT8)
    {
        input_val = input_val - (InEigenType)attribute->input_zp();
    }

    ETensor4<InEigenType> input_padded = input_val.pad(pad);

    // assuming input and output have same scales
    // so input and output scaling is not required
    // TODO: check whether TOSA actually makes this assumption

    // extract_image_patches() output [N, KH, KW, H * W, C]
    // transpose to [KH, KW, N, H * W, C]
    // reshape to [KH * KW, N * H * W * C]
    ETensor2<InEigenType> input_extract_patches =
        input_padded.extract_image_patches(kernel_h, kernel_w, stride_h, stride_w, 1, 1, Eigen::PADDING_VALID)
            .shuffle(Eigen::array<Eigen::Index, 5>{ 1, 2, 0, 3, 4 })
            .reshape(im2col_input_dims);

    // 1D result with [N * H * W * C]
    ETensor1<AccEigenType> out_1d(this->out->getElementCount());
    out_1d.setZero();

    // sum pool
    for (size_t i = 0; i < this->out->getElementCount(); i++)
    {
        for (int32_t j = 0; j < kernel_h * kernel_w; j++)
        {
            out_1d(i) += (AccEigenType)input_extract_patches(j, i);
        }
    }

    // reshape result to [N, H, W, C] and divide with div_map
    ETensor4<AccEigenType> sum = out_1d.reshape(col2im_output_dims);

    // calculate 1d height/width div_map (number of elements this pooling window covers)
    // and outer product to get 2d div_map, then reshape/broadcast to [N, H, W, C]
    ETensor1<int32_t> div_map_h = calculate_div_map_1d(in_height, out_height, kernel_h, stride_h, pad_top, pad_bottom);
    ETensor1<int32_t> div_map_w = calculate_div_map_1d(in_width, out_width, kernel_w, stride_w, pad_left, pad_right);
    Eigen::array<Eigen::IndexPair<Eigen::Index>, 1> contract_dims = { Eigen::IndexPair<Eigen::Index>(1, 0) };
    Eigen::array<Eigen::Index, 4> bcast{ out_batch, 1, 1, out_channels };

    ETensor4<int32_t> div_map =
        div_map_h.reshape(Eigen::array<Eigen::Index, 2>{ out_height, 1 })
            .contract(div_map_w.reshape(Eigen::array<Eigen::Index, 2>{ 1, out_width }), contract_dims)
            .reshape(Eigen::array<Eigen::Index, 4>{ 1, out_height, out_width, 1 })
            .broadcast(bcast);
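    // For integer types, the division by the element count is done in fixed point:
    // reciprocal_scale() converts each divisor into a (multiplier, shift) pair and
    // apply_scale_32() applies it, following the TOSA integer scaling rules.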
    if (Dtype != DType_FLOAT && Dtype != DType_FP16)
    {
        try
        {
            this->out->getTensor() = sum.binaryExpr(div_map, [](AccEigenType value, int32_t div) -> OutEigenType {
                int32_t multiplier, shift;
                TosaReference::QuantUtil::reciprocal_scale(div, multiplier, shift);

                return (OutEigenType)TosaReference::QuantUtil::apply_scale_32(value, multiplier, shift, false);
            });
        }
        catch (std::string desc)
        {
            REQUIRE(false, "OpAvgPool2d apply_scale_32() fails: %s.", desc.c_str());
        }
        this->out->getTensor() = this->out->getTensor() + (OutEigenType)(attribute->output_zp());
        this->out->getTensor() = this->out->getTensor().cwiseMax((OutEigenType)QMin);
        this->out->getTensor() = this->out->getTensor().cwiseMin((OutEigenType)QMax);
    }
    else
    {
        // Case for float-type pooling
        this->out->getTensor() = (sum / div_map.template cast<AccEigenType>()).template cast<OutEigenType>();
    }

    return GraphNode::eval();
}

template <DType InDtype, DType WeightDtype, DType AccDtype>
OpConv2d<InDtype, WeightDtype, AccDtype>::OpConv2d(SubgraphTraverser* sgt_,
                                                   TosaAttributeBase* attribute_,
                                                   uint64_t id_)
    : GraphNode(sgt_, Op_CONV2D, id_)
{
    setRequiredOperands(3, 1);
    setRequiredRank(4);

    INIT_ATTRIBUTE(Conv);
}

template <DType InDtype, DType WeightDtype, DType AccDtype>
OpConv2d<InDtype, WeightDtype, AccDtype>::~OpConv2d()
{
    if (attribute)
        delete attribute;
}

template <DType InDtype, DType WeightDtype, DType AccDtype>
int OpConv2d<InDtype, WeightDtype, AccDtype>::checkTensorAttributes()
{
    if (validateRequiredOperands())
        return 1;

    if (validateRequiredRank(inputs[0]) || validateRequiredRank(inputs[1]) || validateRequiredRank(outputs[0]))
    {
        return 1;
    }

    // 'bias' is checked separately since it doesn't make sense to require a rank ranging from 1 to 4
    if (inputs[2]->getRank() != 1)
    {
        printNodeValidationError("OpConv2d: bias tensor must be rank 1");
    }

    ERROR_IF(outputs[0]->getDtype() != AccDtype,
             "OpConv2d: Output data type not supported for this configuration of operator");

    input  = dynamic_cast<TosaReference::TensorTemplate<TIn>*>(inputs[0]);
    weight = dynamic_cast<TosaReference::TensorTemplate<TWeight>*>(inputs[1]);
    bias   = dynamic_cast<TosaReference::TensorTemplate<TBias>*>(inputs[2]);
    output = dynamic_cast<TosaReference::TensorTemplate<TOut>*>(outputs[0]);

    std::string msg;
    if (check_conv_attribute(attribute, 2 /* conv_dimension */, input->getShape(), output->getShape(),
                             weight->getShape(), 1 /* offset_kernel */, InDtype, WeightDtype, msg))
    {
        msg = "OpConv2d: " + msg;
        printNodeValidationError(msg.c_str());
        return 1;
    }

    return 0;
}

template <DType InDtype, DType WeightDtype, DType AccDtype>
int OpConv2d<InDtype, WeightDtype, AccDtype>::eval()
{
    int in_batch    = this->input->getShape()[0];
    int in_height   = this->input->getShape()[1];
    int in_width    = this->input->getShape()[2];
    int in_channels = this->input->getShape()[3];

    int f_out_channels = this->weight->getShape()[0];
    int f_height       = this->weight->getShape()[1];
    int f_width        = this->weight->getShape()[2];
    int f_in_channels  = this->weight->getShape()[3];

    int b_out_channels = this->bias->getShape()[0];

    int out_batch    = this->output->getShape()[0];
    int out_height   = this->output->getShape()[1];
    int out_width    = this->output->getShape()[2];
    int out_channels = this->output->getShape()[3];

    ERROR_IF(in_batch != out_batch, "OpConv2d: tensor batch mismatch %d != %d", in_batch, out_batch);
    ERROR_IF(f_in_channels != in_channels, "OpConv2d: tensor input channel mismatch %d != %d", f_in_channels,
             in_channels);
    ERROR_IF(f_out_channels != out_channels, "OpConv2d: tensor output channel mismatch %d != %d", f_out_channels,
             out_channels);
    ERROR_IF(b_out_channels != out_channels, "OpConv2d: bias channel mismatch %d != %d", b_out_channels, out_channels);

    int pad_top    = this->attribute->pad()[0];
    int pad_bottom = this->attribute->pad()[1];
    int pad_left   = this->attribute->pad()[2];
    int pad_right  = this->attribute->pad()[3];

    int stride_h   = this->attribute->stride()[0];
    int stride_w   = this->attribute->stride()[1];
    int dilation_h = this->attribute->dilation()[0];
    int dilation_w = this->attribute->dilation()[1];

    tosa::DType accum_dtype = (tosa::DType)this->attribute->accum_dtype();

    DEBUG_INFO(OP,
               "perform OpConv2d, input.shape=[%d,%d,%d,%d], weight.shape=[%d,%d,%d,%d], output.shape=[%d,%d,%d,%d], "
               "stride=[%d,%d], dilation=[%d,%d], pad=[%d,%d,%d,%d], accum_dtype=%s",
               in_batch, in_height, in_width, in_channels, f_height, f_width, f_in_channels, f_out_channels, out_batch,
               out_height, out_width, out_channels, stride_h, stride_w, dilation_h, dilation_w, pad_top,
               pad_bottom, pad_left, pad_right, EnumNamesDType()[accum_dtype]);

    // GEMM-conv2d, left matrix is input, right matrix is weight
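    // The contraction below computes [N * OH * OW, KH * KW * IC] x [KH * KW * IC, OC]
    // = [N * OH * OW, OC], which is reshaped back to [N, OH, OW, OC] at the end.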
    Eigen::array<Eigen::Index, 2> im2col_input_dims;
    im2col_input_dims[0] = out_batch * out_height * out_width;
    im2col_input_dims[1] = f_height * f_width * f_in_channels;

    Eigen::array<Eigen::Index, 2> im2col_weight_dims;
    im2col_weight_dims[0] = f_height * f_width * f_in_channels;
    im2col_weight_dims[1] = f_out_channels;

    Eigen::array<Eigen::Index, 2> bias_reshaped_dims;
    bias_reshaped_dims[0] = 1;
    bias_reshaped_dims[1] = b_out_channels;

    Eigen::array<Eigen::Index, 4> weight_zp_bcast_dims;
    weight_zp_bcast_dims[0] = f_height;
    weight_zp_bcast_dims[1] = f_width;
    weight_zp_bcast_dims[2] = f_in_channels;

    Eigen::array<Eigen::Index, 2> bias_bcast_dims;
    bias_bcast_dims[0] = out_batch * out_height * out_width;
    bias_bcast_dims[1] = 1;

    Eigen::array<Eigen::Index, 4> col2im_output_dims;
    col2im_output_dims[0] = out_batch;
    col2im_output_dims[1] = out_height;
    col2im_output_dims[2] = out_width;
    col2im_output_dims[3] = out_channels;

    Eigen::array<Eigen::IndexPair<Eigen::Index>, 1> contract_dims = { Eigen::IndexPair<Eigen::Index>(1, 0) };

    Eigen::array<std::pair<int32_t, int32_t>, 4> pad;
    pad[0] = std::make_pair(0, 0);
    pad[1] = std::make_pair(pad_top, pad_bottom);
    pad[2] = std::make_pair(pad_left, pad_right);
    pad[3] = std::make_pair(0, 0);

    TIn input_val      = this->input->getTensor();
    TWeight weight_val = this->weight->getTensor();
    if (InDtype == DType_INT8 || WeightDtype == DType_INT8)
    {
        input_val  = input_val - (InEigenType)attribute->input_zp();
        weight_val = weight_val - (WeightEigenType)attribute->weight_zp();
    }

    ETensor4<InEigenType> input_padded = input_val.pad(pad);

    // extract_image_patches() output [N, KH, KW, H * W, C]
    // need to transpose to [N, H * W, KH, KW, C]
    ETensor5<InEigenType> input_extract_patches =
        input_padded
            .extract_image_patches(f_height, f_width, stride_h, stride_w, dilation_h, dilation_w, Eigen::PADDING_VALID)
            .shuffle(Eigen::array<Eigen::Index, 5>{ 0, 3, 1, 2, 4 });

    // reshape input to [N * H * W, KH * KW * C]
    ETensor2<InEigenType> im2col_input = input_extract_patches.reshape(im2col_input_dims);

    // transpose and reshape weight from [OC, H, W, IC] to [H * W * IC, OC]
    ETensor2<WeightEigenType> im2col_weight =
        weight_val.shuffle(Eigen::array<Eigen::Index, 4>({ 1, 2, 3, 0 })).reshape(im2col_weight_dims);

    // bias_multiplier (* bias_scale and >> bias_shift) is not applied here since TFLite
    // already scales the bias; reshape from [C] to [1, C] and broadcast to [N * H * W, C]
    ETensor2<OutEigenType> bias_2d = (this->bias->getTensor().reshape(bias_reshaped_dims).broadcast(bias_bcast_dims)).template cast<OutEigenType>();

    // output matrix is [N * H * W, C]
    ETensor2<OutEigenType> contracted_result =
        (im2col_input.template cast<AccEigenType>().contract(im2col_weight.template cast<AccEigenType>(), contract_dims)).template cast<OutEigenType>();

    // adding bias
    ETensor2<OutEigenType> biased_output = contracted_result + bias_2d;

    // reshape back to [N, H, W, C]
    this->output->getTensor() = biased_output.reshape(col2im_output_dims);

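    // INT48 accumulators are held in a wider integer type in the reference model, so the
    // result is clamped back into the 48-bit range here.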
    if (AccDtype == DType_INT48)
    {
        this->output->getTensor() = this->output->getTensor().cwiseMax((OutEigenType)AccQMin);
        this->output->getTensor() = this->output->getTensor().cwiseMin((OutEigenType)AccQMax);
    }

    return GraphNode::eval();
}

template <DType InDtype, DType WeightDtype, DType AccDtype>
OpConv3d<InDtype, WeightDtype, AccDtype>::OpConv3d(SubgraphTraverser* sgt_,
                                                   TosaAttributeBase* attribute_,
                                                   uint64_t id_)
    : GraphNode(sgt_, Op_CONV3D, id_)
{
    setRequiredOperands(3, 1);
    setRequiredRank(5);

    INIT_ATTRIBUTE(Conv);
}

template <DType InDtype, DType WeightDtype, DType AccDtype>
OpConv3d<InDtype, WeightDtype, AccDtype>::~OpConv3d()
{
    if (attribute)
        delete attribute;
}

template <DType InDtype, DType WeightDtype, DType AccDtype>
int OpConv3d<InDtype, WeightDtype, AccDtype>::checkTensorAttributes()
{
    if (validateRequiredOperands())
        return 1;

    if (validateRequiredRank(inputs[0]) || validateRequiredRank(inputs[1]) || validateRequiredRank(outputs[0]))
    {
        return 1;
    }

    // 'bias' is checked separately since it doesn't make sense to require a rank ranging from 1 to 4
    if (inputs[2]->getRank() != 1)
    {
        printNodeValidationError("OpConv3d: bias tensor must be rank 1");
    }

    ERROR_IF(outputs[0]->getDtype() != AccDtype,
             "OpConv3d: Output data type not supported for this configuration of operator");

    input  = dynamic_cast<TosaReference::TensorTemplate<TIn>*>(inputs[0]);
    weight = dynamic_cast<TosaReference::TensorTemplate<TWeight>*>(inputs[1]);
    bias   = dynamic_cast<TosaReference::TensorTemplate<TBias>*>(inputs[2]);
    output = dynamic_cast<TosaReference::TensorTemplate<TOut>*>(outputs[0]);

    std::string msg;
    if (check_conv_attribute(attribute, 3 /* conv_dimension */, input->getShape(), output->getShape(),
                             weight->getShape(), 1 /* offset_kernel */, InDtype, WeightDtype, msg))
    {
        msg = "OpConv3d: " + msg;
        printNodeValidationError(msg.c_str());
        return 1;
    }

    return 0;
}

template <DType InDtype, DType WeightDtype, DType AccDtype>
int OpConv3d<InDtype, WeightDtype, AccDtype>::eval()
{
    int in_batch    = this->input->getShape()[0];
    int in_depth    = this->input->getShape()[1];
    int in_height   = this->input->getShape()[2];
    int in_width    = this->input->getShape()[3];
    int in_channels = this->input->getShape()[4];

    int f_out_channels = this->weight->getShape()[0];
    int f_depth        = this->weight->getShape()[1];
    int f_height       = this->weight->getShape()[2];
    int f_width        = this->weight->getShape()[3];
    int f_in_channels  = this->weight->getShape()[4];

    int b_out_channels = this->bias->getShape()[0];

    int out_batch    = this->output->getShape()[0];
    int out_depth    = this->output->getShape()[1];
    int out_height   = this->output->getShape()[2];
    int out_width    = this->output->getShape()[3];
    int out_channels = this->output->getShape()[4];

    ERROR_IF(in_batch != out_batch, "OpConv3d: tensor batch mismatch %d != %d", in_batch, out_batch);
    ERROR_IF(f_in_channels != in_channels, "OpConv3d: tensor input channel mismatch %d != %d", f_in_channels,
             in_channels);
    ERROR_IF(f_out_channels != out_channels, "OpConv3d: tensor output channel mismatch %d != %d", f_out_channels,
             out_channels);
    ERROR_IF(b_out_channels != out_channels, "OpConv3d: bias channel mismatch %d != %d", b_out_channels, out_channels);

    int pad_d0     = this->attribute->pad()[0];
    int pad_d1     = this->attribute->pad()[1];
    int pad_top    = this->attribute->pad()[2];
    int pad_bottom = this->attribute->pad()[3];
    int pad_left   = this->attribute->pad()[4];
    int pad_right  = this->attribute->pad()[5];

    int stride_d = this->attribute->stride()[0];
    int stride_h = this->attribute->stride()[1];
    int stride_w = this->attribute->stride()[2];

    int dilation_d = this->attribute->dilation()[0];
    int dilation_h = this->attribute->dilation()[1];
    int dilation_w = this->attribute->dilation()[2];

    tosa::DType accum_dtype = (tosa::DType)this->attribute->accum_dtype();

    DEBUG_INFO(
        OP,
        "perform OpConv3d, input.shape=[%d,%d,%d,%d,%d], weight.shape=[%d,%d,%d,%d,%d], output.shape=[%d,%d,%d,%d,%d], "
        "stride=[%d,%d,%d], dilation=[%d,%d,%d], pad=[%d,%d,%d,%d,%d,%d], accum_dtype=%s",
        in_batch, in_depth, in_height, in_width, in_channels, f_out_channels, f_depth, f_height, f_width, f_in_channels,
        out_batch, out_depth, out_height, out_width, out_channels, stride_d, stride_h, stride_w, dilation_d, dilation_h,
        dilation_w, pad_d0, pad_d1, pad_top, pad_bottom, pad_left, pad_right, EnumNamesDType()[accum_dtype]);

    Eigen::array<std::pair<int32_t, int32_t>, 5> pad;
    pad[0] = std::make_pair(0, 0);
    pad[1] = std::make_pair(pad_d0, pad_d1);
    pad[2] = std::make_pair(pad_top, pad_bottom);
    pad[3] = std::make_pair(pad_left, pad_right);
    pad[4] = std::make_pair(0, 0);

    TIn input_val      = this->input->getTensor();
    TWeight weight_val = this->weight->getTensor();
    if (InDtype == DType_INT8 || WeightDtype == DType_INT8)
    {
        input_val  = input_val - (InEigenType)attribute->input_zp();
        weight_val = weight_val - (WeightEigenType)attribute->weight_zp();
    }

    ETensor5<InEigenType> input_padded = input_val.pad(pad);

    // 1. initialize with bias
    Eigen::array<Eigen::Index, 5> reshape_dim;
    reshape_dim.fill(1);
    reshape_dim[4] = b_out_channels;

    Eigen::array<Eigen::Index, 5> bcast;
    bcast[0] = out_batch;
    bcast[1] = out_depth;
    bcast[2] = out_height;
    bcast[3] = out_width;
    bcast[4] = 1;
    this->output->getTensor() = this->bias->getTensor().reshape(reshape_dim).broadcast(bcast);

    // 2. direct convolution
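    // There is no im2col/GEMM path for conv3d; each output element accumulates
    // f_depth * f_height * f_width * in_channels products directly in AccEigenType.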
    AccEigenType acc(0.0);
    int d_idx, h_idx, w_idx;

    for (int ob = 0; ob < out_batch; ob++)
    {
        for (int od = 0; od < out_depth; od++)
        {
            for (int oh = 0; oh < out_height; oh++)
            {
                for (int ow = 0; ow < out_width; ow++)
                {
                    for (int oc = 0; oc < out_channels; oc++)
                    {
                        // Initialize accumulator with bias value
                        acc = (AccEigenType)this->output->getTensor()(ob, od, oh, ow, oc);
                        for (int fd = 0; fd < f_depth; fd++)
                        {
                            d_idx = od * stride_d + fd * dilation_d;
                            for (int fh = 0; fh < f_height; fh++)
                            {
                                h_idx = oh * stride_h + fh * dilation_h;
                                for (int fw = 0; fw < f_width; fw++)
                                {
                                    w_idx = ow * stride_w + fw * dilation_w;
                                    for (int ic = 0; ic < in_channels; ic++)
                                    {
                                        acc += ((AccEigenType)input_padded(ob, d_idx, h_idx, w_idx, ic) *
                                                (AccEigenType)weight_val(oc, fd, fh, fw, ic));
                                    }
                                }
                            }
                        }
                        this->output->getTensor()(ob, od, oh, ow, oc) = (OutEigenType)acc;
                    }
                }
            }
        }
    }

    if (AccDtype == DType_INT48)
    {
        this->output->getTensor() = this->output->getTensor().cwiseMax((OutEigenType)AccQMin);
        this->output->getTensor() = this->output->getTensor().cwiseMin((OutEigenType)AccQMax);
    }

    return GraphNode::eval();
}

template <DType InDtype, DType WeightDtype, DType AccDtype>
OpDepthwiseConv2d<InDtype, WeightDtype, AccDtype>::OpDepthwiseConv2d(SubgraphTraverser* sgt_,
                                                                     TosaAttributeBase* attribute_,
                                                                     uint64_t id_)
    : GraphNode(sgt_, Op_DEPTHWISE_CONV2D, id_)
{
    setRequiredOperands(3, 1);
    setRequiredRank(4);

    INIT_ATTRIBUTE(Conv);
}

template <DType InDtype, DType WeightDtype, DType AccDtype>
OpDepthwiseConv2d<InDtype, WeightDtype, AccDtype>::~OpDepthwiseConv2d()
{
    if (attribute)
        delete attribute;
}

template <DType InDtype, DType WeightDtype, DType AccDtype>
int OpDepthwiseConv2d<InDtype, WeightDtype, AccDtype>::checkTensorAttributes()
{
    if (validateRequiredOperands())
        return 1;

    if (validateRequiredRank(inputs[0]) || validateRequiredRank(inputs[1]) || validateRequiredRank(outputs[0]))
    {
        return 1;
    }

    // 'bias' is checked separately since it doesn't make sense to require a rank ranging from 1 to 4
    if (inputs[2]->getRank() != 1)
    {
        printNodeValidationError("OpDepthwiseConv2d: bias tensor must be rank 1");
    }

    ERROR_IF(outputs[0]->getDtype() != AccDtype,
             "OpDepthwiseConv2d: Output data type not supported for this configuration of operator");

    input  = dynamic_cast<TosaReference::TensorTemplate<TIn>*>(inputs[0]);
    weight = dynamic_cast<TosaReference::TensorTemplate<TWeight>*>(inputs[1]);
    bias   = dynamic_cast<TosaReference::TensorTemplate<TBias>*>(inputs[2]);
    output = dynamic_cast<TosaReference::TensorTemplate<TOut>*>(outputs[0]);

    std::string msg;
    if (check_conv_attribute(attribute, 2 /* conv_dimension */, input->getShape(), output->getShape(),
                             weight->getShape(), 0 /* offset_kernel */, InDtype, WeightDtype, msg))
    {
        msg = "OpDepthwiseConv2d: " + msg;
        printNodeValidationError(msg.c_str());
        return 1;
    }

    return 0;
}

template <DType InDtype, DType WeightDtype, DType AccDtype>
int OpDepthwiseConv2d<InDtype, WeightDtype, AccDtype>::eval()
{
    int in_batch    = this->input->getShape()[0];
    int in_height   = this->input->getShape()[1];
    int in_width    = this->input->getShape()[2];
    int in_channels = this->input->getShape()[3];

    int f_height      = this->weight->getShape()[0];
    int f_width       = this->weight->getShape()[1];
    int f_in_channels = this->weight->getShape()[2];
    int f_multiplier  = this->weight->getShape()[3];

    int b_out_channels = this->bias->getShape()[0];

    int out_batch    = this->output->getShape()[0];
    int out_height   = this->output->getShape()[1];
    int out_width    = this->output->getShape()[2];
    int out_channels = this->output->getShape()[3];

    ERROR_IF(in_batch != out_batch, "OpDepthwiseConv2d: tensor batch mismatch %d != %d", in_batch, out_batch);
    ERROR_IF(f_in_channels != in_channels, "OpDepthwiseConv2d: tensor input channel mismatch %d != %d", f_in_channels,
             in_channels);
    ERROR_IF(in_channels * f_multiplier != out_channels, "OpDepthwiseConv2d: tensor output channel mismatch %d != %d",
             in_channels * f_multiplier, out_channels);
    ERROR_IF(b_out_channels != out_channels, "OpDepthwiseConv2d: bias channels mismatch %d != %d", b_out_channels,
             out_channels);

    int pad_top    = this->attribute->pad()[0];
    int pad_bottom = this->attribute->pad()[1];
    int pad_left   = this->attribute->pad()[2];
    int pad_right  = this->attribute->pad()[3];

    int stride_h   = this->attribute->stride()[0];
    int stride_w   = this->attribute->stride()[1];
    int dilation_h = this->attribute->dilation()[0];
    int dilation_w = this->attribute->dilation()[1];

    tosa::DType accum_dtype = (tosa::DType)this->attribute->accum_dtype();

    DEBUG_INFO(OP,
               "perform OpDepthwiseConv2d, input.shape=[%d,%d,%d,%d], weight.shape=[%d,%d,%d,%d], "
               "output.shape=[%d,%d,%d,%d], stride=[%d,%d], dilation=[%d,%d], pad=[%d,%d,%d,%d], accum_dtype=%s",
               in_batch, in_height, in_width, in_channels, f_height, f_width, f_in_channels, f_multiplier, out_batch,
               out_height, out_width, out_channels, stride_h, stride_w, dilation_h, dilation_w, pad_top,
               pad_bottom, pad_left, pad_right, EnumNamesDType()[accum_dtype]);

    Eigen::array<std::pair<int32_t, int32_t>, 4> pad;
    pad[0] = std::make_pair(0, 0);
    pad[1] = std::make_pair(pad_top, pad_bottom);
    pad[2] = std::make_pair(pad_left, pad_right);
    pad[3] = std::make_pair(0, 0);

    TIn input_val      = this->input->getTensor();
    TWeight weight_val = this->weight->getTensor();
    if (InDtype == DType_INT8 || WeightDtype == DType_INT8)
    {
        input_val  = input_val - (InEigenType)attribute->input_zp();
        weight_val = weight_val - (WeightEigenType)attribute->weight_zp();
    }

    ETensor4<InEigenType> input_padded = input_val.pad(pad);

    // GEMM doesn't fit well with DepthwiseConv2d
    // 1. use extract_image_patches() to handle stride/dilation/pad
    // 2. perform direct convolution

    // 1. extract_image_patches() output [N, KH, KW, OH * OW, IC]
    ETensor5<InEigenType> input_extract_patches = input_padded.extract_image_patches(
        f_height, f_width, stride_h, stride_w, dilation_h, dilation_w, Eigen::PADDING_VALID);

    Eigen::array<Eigen::Index, 4> reshape_dim;
    reshape_dim.fill(1);
    reshape_dim[3] = b_out_channels;

    Eigen::array<Eigen::Index, 4> bcast;
    bcast[0] = out_batch;
    bcast[1] = out_height;
    bcast[2] = out_width;
    bcast[3] = 1;

    // initialize with bias
    this->output->getTensor() = this->bias->getTensor().reshape(reshape_dim).broadcast(bcast);

    // 2. direct depthwise convolution
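    // Each input channel ic contributes f_multiplier output channels; the output channel
    // index is ic * f_multiplier + cm, matching the [KH, KW, IC, M] weight layout.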
    for (int ob = 0; ob < out_batch; ob++)
    {
        for (int oh = 0; oh < out_height; oh++)
        {
            for (int ow = 0; ow < out_width; ow++)
            {
                for (int ic = 0; ic < in_channels; ic++)
                {
                    for (int cm = 0; cm < f_multiplier; cm++)
                    {
                        for (int fh = 0; fh < f_height; fh++)
                        {
                            for (int fw = 0; fw < f_width; fw++)
                            {
                                // Perform multiplication in AccEigenType then cast to OutEigenType
                                this->output->getTensor()(ob, oh, ow, ic * f_multiplier + cm) +=
                                    (OutEigenType)((AccEigenType)input_extract_patches(ob, fh, fw, ow * out_height + oh, ic) *
                                                   (AccEigenType)weight_val(fh, fw, ic, cm));
                            }
                        }
                    }
                }
            }
        }
    }

    if (AccDtype == DType_INT48)
    {
        this->output->getTensor() = this->output->getTensor().cwiseMax((OutEigenType)AccQMin);
        this->output->getTensor() = this->output->getTensor().cwiseMin((OutEigenType)AccQMax);
    }

    return GraphNode::eval();
}

template <DType InDtype, DType WeightDtype, DType AccDtype>
OpFullyConnected<InDtype, WeightDtype, AccDtype>::OpFullyConnected(SubgraphTraverser* sgt_,
                                                                   TosaAttributeBase* attribute_,
                                                                   uint64_t id_)
    : GraphNode(sgt_, Op_FULLY_CONNECTED, id_)
{
    setRequiredOperands(3, 1);
    setRequiredRank(2);

    INIT_ATTRIBUTE(FullyConnected);
}

template <DType InDtype, DType WeightDtype, DType AccDtype>
OpFullyConnected<InDtype, WeightDtype, AccDtype>::~OpFullyConnected()
{
    if (attribute)
        delete attribute;
}

template <DType InDtype, DType WeightDtype, DType AccDtype>
int OpFullyConnected<InDtype, WeightDtype, AccDtype>::checkTensorAttributes()
{
    if (validateRequiredOperands())
        return 1;

    if (validateRequiredRank(inputs[0]) || validateRequiredRank(inputs[1]) || validateRequiredRank(outputs[0]))
    {
        return 1;
    }

    input  = dynamic_cast<TosaReference::TensorTemplate<TIn>*>(inputs[0]);
    weight = dynamic_cast<TosaReference::TensorTemplate<TWeight>*>(inputs[1]);
    bias   = dynamic_cast<TosaReference::TensorTemplate<TBias>*>(inputs[2]);

    if (input->getShape()[1] != weight->getShape()[1])
    {
        printNodeValidationError("OpFullyConnected operator input.shape[1] should match weight.shape[1]");
        return 1;
    }

    if (weight->getShape()[0] != bias->getShape()[0])
    {
        printNodeValidationError("OpFullyConnected operator bias.shape[0] should match weight.shape[0]");
        return 1;
    }

    ERROR_IF(outputs[0]->getDtype() != AccDtype,
             "OpFullyConnected: Output data type not supported for this configuration of operator");

    output = dynamic_cast<TosaReference::TensorTemplate<TOut>*>(outputs[0]);

    ERROR_IF(InDtype != DType_INT8 && attribute->input_zp() != 0, "OpFullyConnected: Input zeropoint must be zero for non int8_t data");
    ERROR_IF(WeightDtype != DType_INT8 && attribute->weight_zp() != 0, "OpFullyConnected: Weight zeropoint must be zero for non int8_t data");

    return 0;
}

template <DType InDtype, DType WeightDtype, DType AccDtype>
int OpFullyConnected<InDtype, WeightDtype, AccDtype>::eval()
{
    typedef Eigen::Tensor<int, 1>::DimensionPair DimPair;
    Eigen::array<DimPair, 1> dims{ { DimPair(1, 0) } };

    Eigen::array<Eigen::Index, 2> weight_shuffle{ 1, 0 };

    Eigen::array<Eigen::Index, 2> bias_reshape;
    bias_reshape[0] = 1;
    bias_reshape[1] = this->bias->getShape()[0];

    Eigen::array<Eigen::Index, 2> bias_bcast;
    bias_bcast[0] = this->input->getShape()[0];
    bias_bcast[1] = 1;

    TIn input_val      = this->input->getTensor();
    TWeight weight_val = this->weight->getTensor().shuffle(weight_shuffle);
    if (InDtype == DType_INT8 || WeightDtype == DType_INT8)
    {
        input_val  = input_val - (InEigenType)attribute->input_zp();
        weight_val = weight_val - (WeightEigenType)attribute->weight_zp();
    }

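    // The weight tensor is stored as [OC, IC]; the shuffle above transposes it to
    // [IC, OC], so the contraction computes [N, IC] x [IC, OC] = [N, OC] before the
    // broadcast bias is added.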
    this->output->getTensor() =
        input_val.template cast<AccEigenType>().contract(weight_val.template cast<AccEigenType>(), dims).template cast<OutEigenType>() +
        this->bias->getTensor().reshape(bias_reshape).broadcast(bias_bcast);

    if (AccDtype == DType_INT48)
    {
        this->output->getTensor() = this->output->getTensor().cwiseMax((OutEigenType)AccQMin);
        this->output->getTensor() = this->output->getTensor().cwiseMin((OutEigenType)AccQMax);
    }
    return GraphNode::eval();
}

James Ward8b390432022-08-12 20:48:56 +01001187template <DType Dtype, DType AccDtype>
1188OpMatMul<Dtype, AccDtype>::OpMatMul(SubgraphTraverser* sgt_,
Kevin Chengacb550f2021-06-29 15:32:19 -07001189 TosaAttributeBase* attribute_,
Kevin Chengacb550f2021-06-29 15:32:19 -07001190 uint64_t id_)
1191 : GraphNode(sgt_, Op_MATMUL, id_)
Eric Kunzee5e26762020-10-13 16:11:07 -07001192{
1193 setRequiredOperands(2, 1);
Kevin Cheng2d60f002021-06-09 14:18:32 -07001194 setRequiredRank(3);
Eric Kunzee5e26762020-10-13 16:11:07 -07001195
Eric Kunzeb5fabec2022-06-07 05:20:44 +00001196 INIT_ATTRIBUTE(MatMul);
Eric Kunzee5e26762020-10-13 16:11:07 -07001197}
1198
James Ward8b390432022-08-12 20:48:56 +01001199template <DType Dtype, DType AccDtype>
1200OpMatMul<Dtype, AccDtype>::~OpMatMul()
Eric Kunzee5e26762020-10-13 16:11:07 -07001201{
Eric Kunzeb5fabec2022-06-07 05:20:44 +00001202 if (attribute)
1203 delete attribute;
Eric Kunzee5e26762020-10-13 16:11:07 -07001204}

template <DType Dtype, DType AccDtype>
int OpMatMul<Dtype, AccDtype>::checkTensorAttributes()
{
    if (validateRequiredOperands())
        return 1;

    if (validateRequiredRank(inputs[0]) || validateRequiredRank(inputs[1]) || validateRequiredRank(outputs[0]))
    {
        return 1;
    }

    ERROR_IF(outputs[0]->getDtype() != AccDtype,
             "OpMatMul: Output data type not supported for this configuration of operator");

    a      = dynamic_cast<TosaReference::TensorTemplate<TIn>*>(inputs[0]);
    b      = dynamic_cast<TosaReference::TensorTemplate<TIn>*>(inputs[1]);
    output = dynamic_cast<TosaReference::TensorTemplate<TOut>*>(outputs[0]);

    ASSERT_MEM(a && b && output);

    // a: [N, H, C]
    // b: [N, C, W]
    // c: [N, H, W]

    // Check N
    if (a->getShape()[0] != b->getShape()[0] || a->getShape()[0] != output->getShape()[0])
    {
        printNodeValidationError("OpMatMul operator a.shape[0], b.shape[0] and output.shape[0] should match");
        return 1;
    }
    N = a->getShape()[0];

    // Check C
    if (a->getShape()[2] != b->getShape()[1])
    {
        printNodeValidationError("OpMatMul operator a.shape[2] should match b.shape[1]");
        return 1;
    }
    C = a->getShape()[2];

    // Check H
    if (a->getShape()[1] != output->getShape()[1])
    {
        printNodeValidationError("OpMatMul operator a.shape[1] should match output.shape[1]");
        return 1;
    }
    H = a->getShape()[1];

    // Check W
    if (b->getShape()[2] != output->getShape()[2])
    {
        printNodeValidationError("OpMatMul operator b.shape[2] should match output.shape[2]");
        return 1;
    }
    W = b->getShape()[2];

    ERROR_IF(Dtype != DType_INT8 && attribute->a_zp() != 0, "OpMatMul: A zeropoint must be zero for non int8_t data");
    ERROR_IF(Dtype != DType_INT8 && attribute->b_zp() != 0, "OpMatMul: B zeropoint must be zero for non int8_t data");

    return 0;
}
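
// Worked shape example (illustrative numbers, not part of the checks above):
// for a = [2, 3, 4] and b = [2, 4, 5], the code binds N = 2, H = 3, C = 4 and
// W = 5, so the only output shape that validates is [2, 3, 5].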

template <DType Dtype, DType AccDtype>
int OpMatMul<Dtype, AccDtype>::eval()
{
    typedef Eigen::Tensor<int, 1>::DimensionPair DimPair;
    Eigen::array<DimPair, 1> dims{ { DimPair(1, 0) } };

    TIn a_val = this->a->getTensor();
    TIn b_val = this->b->getTensor();
    if (Dtype == DType_INT8)
    {
        a_val = a_val - (InEigenType)attribute->a_zp();
        b_val = b_val - (InEigenType)attribute->b_zp();
    }

    Eigen::array<Eigen::Index, 2> a_rank2_shape({ H, C });
    Eigen::array<Eigen::Index, 2> b_rank2_shape({ C, W });
    Eigen::array<Eigen::Index, 3> output_rank3_shape({ 1, H, W });

    Eigen::array<Eigen::Index, 3> a_size_array({ 1, H, C });
    Eigen::array<Eigen::Index, 3> b_size_array({ 1, C, W });

    Eigen::array<Eigen::Index, 3> a_begin_array({ 0, 0, 0 });
    Eigen::array<Eigen::Index, 3> b_begin_array({ 0, 0, 0 });

    // Iterate N dimension.
    for (int i = 0; i < N; i++)
    {
        a_begin_array[0] = i;
        b_begin_array[0] = i;

        TInRank2 a_rank2_val = a_val.slice(a_begin_array, a_size_array).reshape(a_rank2_shape);
        TInRank2 b_rank2_val = b_val.slice(b_begin_array, b_size_array).reshape(b_rank2_shape);
        TAccRank2 output_rank2_val =
            a_rank2_val.template cast<AccEigenType>().contract(b_rank2_val.template cast<AccEigenType>(), dims);
        TOut output_rank3_val = output_rank2_val.reshape(output_rank3_shape).template cast<OutEigenType>();
        if (i == 0)
        {
            this->output->getTensor() = output_rank3_val;
        }
        else
        {
            TOut temp = this->output->getTensor().concatenate(output_rank3_val, 0);
            this->output->getTensor() = temp;
        }
    }

    if (AccDtype == DType_INT48)
    {
        this->output->getTensor() = this->output->getTensor().cwiseMax((OutEigenType)AccQMin);
        this->output->getTensor() = this->output->getTensor().cwiseMin((OutEigenType)AccQMax);
    }

    return GraphNode::eval();
}
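
// A scalar sketch of the batched matrix multiply above (illustrative only;
// the `sketch` helper is an assumption for exposition, not part of the
// reference model). Shapes follow the comments in checkTensorAttributes():
// a is [N, H, C], b is [N, C, W] and c is [N, H, W], with zero points
// subtracted before the widening multiply as in the INT8 path of eval().
namespace sketch {
inline void matmul_i8_ref(const int8_t* a, const int8_t* b, int32_t* c,
                          int N, int H, int C, int W,
                          int32_t a_zp, int32_t b_zp)
{
    for (int n = 0; n < N; n++)
        for (int h = 0; h < H; h++)
            for (int w = 0; w < W; w++)
            {
                int32_t acc = 0;
                for (int k = 0; k < C; k++)
                {
                    int32_t av = (int32_t)a[(n * H + h) * C + k] - a_zp;
                    int32_t bv = (int32_t)b[(n * C + k) * W + w] - b_zp;
                    acc += av * bv;
                }
                c[(n * H + h) * W + w] = acc;
            }
}
} // namespace sketch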

template <DType Dtype>
OpMaxPool2d<Dtype>::OpMaxPool2d(SubgraphTraverser* sgt_,
                                TosaAttributeBase* attribute_,
                                uint64_t id_)
    : GraphNode(sgt_, Op_MAX_POOL2D, id_)
{
    setRequiredOperands(1, 1);
    setRequiredRank(4);

    INIT_ATTRIBUTE(Pool);
}

template <DType Dtype>
OpMaxPool2d<Dtype>::~OpMaxPool2d()
{
    if (attribute)
        delete attribute;
}

template <DType Dtype>
int OpMaxPool2d<Dtype>::checkTensorAttributes()
{
    if (validateRequiredOperands())
        return 1;

    if (validateRequiredRank(inputs[0]) || validateRequiredRank(outputs[0]))
    {
        return 1;
    }

    if (inputs[0]->matchType(*outputs[0]))
    {
        printNodeValidationError("OpMaxPool2d: input and output tensor type mismatch");
        return 1;
    }

    in  = dynamic_cast<TosaReference::TensorTemplate<TIn>*>(inputs[0]);
    out = dynamic_cast<TosaReference::TensorTemplate<TOut>*>(outputs[0]);

    std::string msg;
    if (check_pool2d_attribute(attribute, in->getShape(), out->getShape(), msg))
    {
        msg = "OpMaxPool2d: " + msg;
        printNodeValidationError(msg.c_str());
        return 1;
    }

    return 0;
}

template <DType Dtype>
int OpMaxPool2d<Dtype>::eval()
{
    int in_batch    = this->in->getShape()[0];
    int in_height   = this->in->getShape()[1];
    int in_width    = this->in->getShape()[2];
    int in_channels = this->in->getShape()[3];

    int out_batch    = this->out->getShape()[0];
    int out_height   = this->out->getShape()[1];
    int out_width    = this->out->getShape()[2];
    int out_channels = this->out->getShape()[3];

    ERROR_IF(in_batch != out_batch, "OpMaxPool2d: tensor batch mismatch %d != %d", in_batch, out_batch);
    ERROR_IF(in_channels != out_channels, "OpMaxPool2d: tensor channel mismatch %d != %d", in_channels, out_channels);

    int pad_top    = this->attribute->pad()[0];
    int pad_bottom = this->attribute->pad()[1];
    int pad_left   = this->attribute->pad()[2];
    int pad_right  = this->attribute->pad()[3];

    int kernel_h = this->attribute->kernel()[0];
    int kernel_w = this->attribute->kernel()[1];
    int stride_h = this->attribute->stride()[0];
    int stride_w = this->attribute->stride()[1];

    DEBUG_INFO(OP,
               "perform MaxPool2d, input.shape=[%d,%d,%d,%d], output.shape=[%d,%d,%d,%d], kernel=[%d,%d], "
               "stride=[%d,%d], pad=[%d,%d,%d,%d]",
               in_batch, in_height, in_width, in_channels, out_batch, out_height, out_width, out_channels, kernel_h,
               kernel_w, stride_h, stride_w, pad_top, pad_bottom, pad_left, pad_right);

    Eigen::array<Eigen::Index, 2> im2col_input_dims;
    im2col_input_dims[0] = kernel_h * kernel_w;
    im2col_input_dims[1] = out_batch * out_height * out_width * out_channels;

    Eigen::array<Eigen::Index, 4> col2im_output_dims;
    col2im_output_dims[0] = out_batch;
    col2im_output_dims[1] = out_height;
    col2im_output_dims[2] = out_width;
    col2im_output_dims[3] = out_channels;

    Eigen::array<std::pair<int32_t, int32_t>, 4> pad;
    pad[0] = std::make_pair(0, 0);
    pad[1] = std::make_pair(pad_top, pad_bottom);
    pad[2] = std::make_pair(pad_left, pad_right);
    pad[3] = std::make_pair(0, 0);

    ETensor4<InEigenType> input_padded = this->in->getTensor().pad(pad, std::numeric_limits<InEigenType>::lowest());

    // extract_image_patches() outputs [N, KH, KW, H * W, C],
    // which is transposed to [KH, KW, N, H * W, C]
    // and reshaped to [KH * KW, N * H * W * C].
    //
    // Set the padding value to the most negative value representable by the
    // datatype so that any padding value is equal to or smaller than the
    // actual maximum in the KH x KW patch.
    ETensor2<InEigenType> input_extract_patches =
        input_padded
            .extract_image_patches(kernel_h, kernel_w, stride_h, stride_w, 1, 1, Eigen::PADDING_VALID,
                                   std::numeric_limits<InEigenType>::lowest())
            .shuffle(Eigen::array<Eigen::Index, 5>{ 1, 2, 0, 3, 4 })
            .reshape(im2col_input_dims);

    // Get the maximum of the KH x KW patches along axis 0
    Eigen::Tensor<DenseIndex, 1> tensor_argmax = input_extract_patches.argmax(0);

    // 1D result with [N * H * W * C]
    ETensor1<OutEigenType> out_1d(this->out->getElementCount());

    // Indexing the patches with the argmax array yields the pooled values
    for (size_t i = 0; i < this->out->getElementCount(); i++)
    {
        out_1d(i) = (OutEigenType)input_extract_patches(tensor_argmax(i), i);
    }

    // reshape result to [N, H, W, C]
    this->out->getTensor() = out_1d.reshape(col2im_output_dims);

    return GraphNode::eval();
}
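
// A scalar sketch of one pooling window (illustrative only; the helper is an
// assumption for exposition, not part of the reference model, and assumes
// <algorithm> and <limits> are reachable via the existing includes). It
// mirrors the im2col/argmax trick above: because the pad value is the type's
// lowest() representable value, taking the plain maximum over the padded
// window gives the same answer as maximizing over only the valid elements.
namespace sketch {
template <typename T>
T max_pool_window_ref(const T* padded,  // one already-padded HWC batch slice
                      int padded_width, int channels,
                      int y0, int x0,   // top-left corner of the window
                      int kernel_h, int kernel_w, int c)
{
    T m = std::numeric_limits<T>::lowest();
    for (int ky = 0; ky < kernel_h; ky++)
        for (int kx = 0; kx < kernel_w; kx++)
        {
            T v = padded[((y0 + ky) * padded_width + (x0 + kx)) * channels + c];
            m = std::max(m, v);
        }
    return m;
}
} // namespace sketch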

template <DType InDtype, DType WeightDtype, DType AccDtype>
OpTransposeConv2d<InDtype, WeightDtype, AccDtype>::OpTransposeConv2d(SubgraphTraverser* sgt_,
                                                                     TosaAttributeBase* attribute_,
                                                                     uint64_t id_)
    : GraphNode(sgt_, Op_TRANSPOSE_CONV2D, id_)
{
    setRequiredOperands(3, 1);
    setRequiredRank(4);

    INIT_ATTRIBUTE(TransposeConv);
}

template <DType InDtype, DType WeightDtype, DType AccDtype>
OpTransposeConv2d<InDtype, WeightDtype, AccDtype>::~OpTransposeConv2d()
{
    if (attribute)
        delete attribute;
}

template <DType InDtype, DType WeightDtype, DType AccDtype>
int OpTransposeConv2d<InDtype, WeightDtype, AccDtype>::checkTensorAttributes()
{
    if (validateRequiredOperands())
        return 1;

    if (validateRequiredRank(inputs[0]) || validateRequiredRank(inputs[1]) || validateRequiredRank(outputs[0]))
    {
        return 1;
    }

    ERROR_IF(outputs[0]->getDtype() != AccDtype,
             "OpTransposeConv2d: Output data type not supported for this configuration of operator");

    input  = dynamic_cast<TosaReference::TensorTemplate<TIn>*>(inputs[0]);
    weight = dynamic_cast<TosaReference::TensorTemplate<TWeight>*>(inputs[1]);
    bias   = dynamic_cast<TosaReference::TensorTemplate<TBias>*>(inputs[2]);
    output = dynamic_cast<TosaReference::TensorTemplate<TOut>*>(outputs[0]);

    if (attribute->out_pad().size() != 4)
    {
        printNodeValidationError("OpTransposeConv2d: illegal size for attribute out_pad");
        return 1;
    }

    if (attribute->stride().size() != 2)
    {
        printNodeValidationError("OpTransposeConv2d: illegal size for attribute stride");
        return 1;
    }

    if (attribute->output_shape().size() != 4)
    {
        printNodeValidationError("OpTransposeConv2d: illegal size for attribute output_shape");
        return 1;
    }

    for (int32_t i : attribute->stride())
    {
        if (i < 1)
        {
            printNodeValidationError("OpTransposeConv2d: At least one stride is smaller than one");
            return 1;
        }
    }

    for (int d = 0; d < 4; d++)
    {
        if (attribute->output_shape()[d] != this->output->getShape()[d])
        {
            printNodeValidationError("OpTransposeConv2d: illegal size for attribute output_shape");
            return 1;
        }
    }

    int32_t IH = input->getShape()[1];
    int32_t IW = input->getShape()[2];
    int32_t OH = output->getShape()[1];
    int32_t OW = output->getShape()[2];

    int32_t stride_y = attribute->stride()[0];
    int32_t stride_x = attribute->stride()[1];
    int32_t kernel_h = weight->getShape()[1];
    int32_t kernel_w = weight->getShape()[2];

    int32_t out_pad_top    = attribute->out_pad()[0];
    int32_t out_pad_bottom = attribute->out_pad()[1];
    int32_t out_pad_left   = attribute->out_pad()[2];
    int32_t out_pad_right  = attribute->out_pad()[3];

    for (size_t i = 0; i < attribute->out_pad().size(); i++)
    {
        ERROR_IF(attribute->out_pad()[i] <= -(weight->getShape()[(i / 2) + 1]),
                 "OpTransposeConv2d: At least one out_pad value is less than or equal to the negated kernel dimension");
    }

    int32_t H = (IH - 1) * stride_y + out_pad_top + out_pad_bottom + kernel_h;
    int32_t W = (IW - 1) * stride_x + out_pad_left + out_pad_right + kernel_w;

    if ((OH != H) || (OW != W))
    {
        std::string msg = "OpTransposeConv2d: Mismatch between output shape provided and expected output shape (" +
                          std::to_string(H) + "," +
                          std::to_string(W) + ")";
        printNodeValidationError(msg.c_str());
        return 1;
    }

    ERROR_IF(InDtype != DType_INT8 && attribute->input_zp() != 0, "OpTransposeConv2d: Input zeropoint must be zero for non int8_t data");
    ERROR_IF(WeightDtype != DType_INT8 && attribute->weight_zp() != 0, "OpTransposeConv2d: Weight zeropoint must be zero for non int8_t data");

    return 0;
}
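
// Worked example of the size relation above (illustrative numbers, not part
// of the operator): with IH = 4, stride_y = 2, kernel_h = 3 and zero out_pad,
// H = (4 - 1) * 2 + 0 + 0 + 3 = 9, so output_shape must declare a height of 9.
static_assert((4 - 1) * 2 + 0 + 0 + 3 == 9, "transpose_conv2d output height example");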

template <DType InDtype, DType WeightDtype, DType AccDtype>
int OpTransposeConv2d<InDtype, WeightDtype, AccDtype>::eval()
{
    int in_batch    = this->input->getShape()[0];
    int in_height   = this->input->getShape()[1];
    int in_width    = this->input->getShape()[2];
    int in_channels = this->input->getShape()[3];

    int f_out_channels = this->weight->getShape()[0];
    int f_height       = this->weight->getShape()[1];
    int f_width        = this->weight->getShape()[2];
    int f_in_channels  = this->weight->getShape()[3];

    int b_out_channels = this->bias->getShape()[0];

    int out_batch    = this->output->getShape()[0];
    int out_height   = this->output->getShape()[1];
    int out_width    = this->output->getShape()[2];
    int out_channels = this->output->getShape()[3];

    int out_pad_top    = this->attribute->out_pad()[0];
    int out_pad_bottom = this->attribute->out_pad()[1];
    int out_pad_left   = this->attribute->out_pad()[2];
    int out_pad_right  = this->attribute->out_pad()[3];

    int stride_h = this->attribute->stride()[0];
    int stride_w = this->attribute->stride()[1];

    tosa::DType accum_dtype = (tosa::DType)this->attribute->accum_dtype();

    ERROR_IF(in_batch != out_batch, "OpTransposeConv2d: tensor batch mismatch %d != %d", in_batch, out_batch);
    ERROR_IF(f_in_channels != in_channels, "OpTransposeConv2d: tensor input channel mismatch %d != %d", f_in_channels,
             in_channels);
    ERROR_IF(f_out_channels != out_channels, "OpTransposeConv2d: tensor output channel mismatch %d != %d",
             f_out_channels, out_channels);
    ERROR_IF(b_out_channels != out_channels, "OpTransposeConv2d: bias channels mismatch %d != %d", b_out_channels,
             out_channels);

    DEBUG_INFO(OP,
               "perform OpTransposeConv2d, input.shape=[%d,%d,%d,%d], weight.shape=[%d,%d,%d,%d], "
               "output.shape=[%d,%d,%d,%d], stride=[%d,%d], out_pad=[%d,%d,%d,%d], accum_dtype=%s",
               in_batch, in_height, in_width, in_channels, f_height, f_width, f_out_channels, f_in_channels,
               out_batch, out_height, out_width, out_channels, stride_h, stride_w, out_pad_top,
               out_pad_bottom, out_pad_left, out_pad_right, EnumNamesDType()[accum_dtype]);

    TIn input_val      = this->input->getTensor();
    TWeight weight_val = this->weight->getTensor();
    if (InDtype == DType_INT8 || WeightDtype == DType_INT8)
    {
        input_val  = input_val - (InEigenType)attribute->input_zp();
        weight_val = weight_val - (WeightEigenType)attribute->weight_zp();
    }

    Eigen::array<Eigen::Index, 4> reshape_dim;
    reshape_dim.fill(1);
    reshape_dim[3] = b_out_channels;

    Eigen::array<Eigen::Index, 4> bcast;
    bcast[0] = out_batch;
    bcast[1] = out_height;
    bcast[2] = out_width;
    bcast[3] = 1;

    // initialize with bias
    this->output->getTensor() = this->bias->getTensor().reshape(reshape_dim).broadcast(bcast);

    int out_x_origin, out_y_origin;
    int out_x, out_y;

    // reference implementation from: tensorflow/tensorflow/lite/kernels/internal/reference/reference_ops.h
    for (int ob = 0; ob < out_batch; ob++)
    {
        for (int ih = 0; ih < in_height; ih++)
        {
            for (int iw = 0; iw < in_width; iw++)
            {
                out_x_origin = iw * stride_w + out_pad_left;
                out_y_origin = ih * stride_h + out_pad_top;
                for (int ic = 0; ic < in_channels; ic++)
                {
                    for (int fh = 0; fh < f_height; fh++)
                    {
                        for (int fw = 0; fw < f_width; fw++)
                        {
                            out_x = out_x_origin + fw;
                            out_y = out_y_origin + fh;
                            for (int oc = 0; oc < out_channels; oc++)
                            {
                                if ((out_x >= 0 && out_x < out_width) && (out_y >= 0 && out_y < out_height))
                                {
                                    this->output->getTensor()(ob, out_y, out_x, oc) +=
                                        (OutEigenType)((AccEigenType)input_val(ob, ih, iw, ic) *
                                                       (AccEigenType)weight_val(oc, fh, fw, ic));
                                }
                            }
                        }
                    }
                }
            }
        }
    }

    if (AccDtype == DType_INT48)
    {
        this->output->getTensor() = this->output->getTensor().cwiseMax((OutEigenType)AccQMin);
        this->output->getTensor() = this->output->getTensor().cwiseMin((OutEigenType)AccQMax);
    }

    return GraphNode::eval();
}
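
// The loops above scatter each input element into the output. An equivalent
// gather view (a sketch under the same indexing, with a hypothetical helper
// name; not used by the reference model) asks, for a given output position
// and filter tap, which input position contributes:
namespace sketch {
// out = in * stride + out_pad + f   =>   in = (out - out_pad - f) / stride
inline bool contributing_input(int out_pos, int out_pad, int stride, int f_pos,
                               int in_extent, int* in_pos)
{
    int t = out_pos - out_pad - f_pos;
    if (t % stride != 0)   // only exact multiples of the stride land on an input
        return false;
    *in_pos = t / stride;
    return *in_pos >= 0 && *in_pos < in_extent;
}
} // namespace sketch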

// template explicit instantiation
DEF_INSTANTIATE_RANK1_6_ONE_RANK_ONE_TYPE(OpArgMax, FP16);
DEF_INSTANTIATE_RANK1_6_ONE_RANK_ONE_TYPE(OpArgMax, FLOAT);
DEF_INSTANTIATE_RANK1_6_ONE_RANK_ONE_TYPE(OpArgMax, INT8);
DEF_INSTANTIATE_RANK1_6_ONE_RANK_ONE_TYPE(OpArgMax, INT16);

DEF_INSTANTIATE_ONE_TYPE_ONE_ACCUM(OpAvgPool2d, FP16, FP16);
DEF_INSTANTIATE_ONE_TYPE_ONE_ACCUM(OpAvgPool2d, FP16, FLOAT);
DEF_INSTANTIATE_ONE_TYPE_ONE_ACCUM(OpAvgPool2d, FLOAT, FLOAT);
DEF_INSTANTIATE_ONE_TYPE_ONE_ACCUM(OpAvgPool2d, INT8, INT32);
DEF_INSTANTIATE_ONE_TYPE_ONE_ACCUM(OpAvgPool2d, INT16, INT32);

// [in_t, weight_t, acc_t]
DEF_INSTANTIATE_TWO_TYPE_ONE_ACCUM(OpConv2d, FP16, FP16, FP16);
DEF_INSTANTIATE_TWO_TYPE_ONE_ACCUM(OpConv2d, FP16, FP16, FLOAT);
DEF_INSTANTIATE_TWO_TYPE_ONE_ACCUM(OpConv2d, FLOAT, FLOAT, FLOAT);
DEF_INSTANTIATE_TWO_TYPE_ONE_ACCUM(OpConv2d, INT8, INT4, INT32);
DEF_INSTANTIATE_TWO_TYPE_ONE_ACCUM(OpConv2d, INT8, INT8, INT32);
DEF_INSTANTIATE_TWO_TYPE_ONE_ACCUM(OpConv2d, INT16, INT8, INT48);

DEF_INSTANTIATE_TWO_TYPE_ONE_ACCUM(OpConv3d, FP16, FP16, FP16);
DEF_INSTANTIATE_TWO_TYPE_ONE_ACCUM(OpConv3d, FP16, FP16, FLOAT);
DEF_INSTANTIATE_TWO_TYPE_ONE_ACCUM(OpConv3d, FLOAT, FLOAT, FLOAT);
DEF_INSTANTIATE_TWO_TYPE_ONE_ACCUM(OpConv3d, INT8, INT4, INT32);
DEF_INSTANTIATE_TWO_TYPE_ONE_ACCUM(OpConv3d, INT8, INT8, INT32);
DEF_INSTANTIATE_TWO_TYPE_ONE_ACCUM(OpConv3d, INT16, INT8, INT48);

DEF_INSTANTIATE_TWO_TYPE_ONE_ACCUM(OpDepthwiseConv2d, FP16, FP16, FP16);
DEF_INSTANTIATE_TWO_TYPE_ONE_ACCUM(OpDepthwiseConv2d, FP16, FP16, FLOAT);
DEF_INSTANTIATE_TWO_TYPE_ONE_ACCUM(OpDepthwiseConv2d, FLOAT, FLOAT, FLOAT);
DEF_INSTANTIATE_TWO_TYPE_ONE_ACCUM(OpDepthwiseConv2d, INT8, INT4, INT32);
DEF_INSTANTIATE_TWO_TYPE_ONE_ACCUM(OpDepthwiseConv2d, INT8, INT8, INT32);
DEF_INSTANTIATE_TWO_TYPE_ONE_ACCUM(OpDepthwiseConv2d, INT16, INT8, INT48);

DEF_INSTANTIATE_TWO_TYPE_ONE_ACCUM(OpFullyConnected, FP16, FP16, FP16);
DEF_INSTANTIATE_TWO_TYPE_ONE_ACCUM(OpFullyConnected, FP16, FP16, FLOAT);
DEF_INSTANTIATE_TWO_TYPE_ONE_ACCUM(OpFullyConnected, FLOAT, FLOAT, FLOAT);
DEF_INSTANTIATE_TWO_TYPE_ONE_ACCUM(OpFullyConnected, INT8, INT4, INT32);
DEF_INSTANTIATE_TWO_TYPE_ONE_ACCUM(OpFullyConnected, INT8, INT8, INT32);
DEF_INSTANTIATE_TWO_TYPE_ONE_ACCUM(OpFullyConnected, INT16, INT8, INT48);

DEF_INSTANTIATE_ONE_TYPE_ONE_ACCUM(OpMatMul, INT8, INT32);
DEF_INSTANTIATE_ONE_TYPE_ONE_ACCUM(OpMatMul, INT16, INT48);
DEF_INSTANTIATE_ONE_TYPE_ONE_ACCUM(OpMatMul, FP16, FP16);
DEF_INSTANTIATE_ONE_TYPE_ONE_ACCUM(OpMatMul, FP16, FLOAT);
DEF_INSTANTIATE_ONE_TYPE_ONE_ACCUM(OpMatMul, FLOAT, FLOAT);

DEF_INSTANTIATE_ONE_TYPE(OpMaxPool2d, FP16);
DEF_INSTANTIATE_ONE_TYPE(OpMaxPool2d, FLOAT);
DEF_INSTANTIATE_ONE_TYPE(OpMaxPool2d, INT8);
DEF_INSTANTIATE_ONE_TYPE(OpMaxPool2d, INT16);

DEF_INSTANTIATE_TWO_TYPE_ONE_ACCUM(OpTransposeConv2d, FP16, FP16, FP16);
DEF_INSTANTIATE_TWO_TYPE_ONE_ACCUM(OpTransposeConv2d, FP16, FP16, FLOAT);
DEF_INSTANTIATE_TWO_TYPE_ONE_ACCUM(OpTransposeConv2d, FLOAT, FLOAT, FLOAT);
DEF_INSTANTIATE_TWO_TYPE_ONE_ACCUM(OpTransposeConv2d, INT8, INT4, INT32);
DEF_INSTANTIATE_TWO_TYPE_ONE_ACCUM(OpTransposeConv2d, INT8, INT8, INT32);
DEF_INSTANTIATE_TWO_TYPE_ONE_ACCUM(OpTransposeConv2d, INT16, INT8, INT48);