blob: 03cb9fb779d2898ba297d1beea29cc6b4b2c77dc [file] [log] [blame]
Eric Kunzee5e26762020-10-13 16:11:07 -07001
Kevin Cheng3a478572021-01-22 17:21:02 -08002// Copyright (c) 2020-2021, ARM Limited.
Eric Kunzee5e26762020-10-13 16:11:07 -07003//
4// Licensed under the Apache License, Version 2.0 (the "License");
5// you may not use this file except in compliance with the License.
6// You may obtain a copy of the License at
7//
8// http://www.apache.org/licenses/LICENSE-2.0
9//
10// Unless required by applicable law or agreed to in writing, software
11// distributed under the License is distributed on an "AS IS" BASIS,
12// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13// See the License for the specific language governing permissions and
14// limitations under the License.
15
16#include "tensor_ops.h"
17#include "quant_util.h"
18#include "template_types.h"
19
20using namespace TosaReference;
21using namespace Eigen;
22using namespace tosa;
23
Kevin Cheng9fe17242021-11-10 01:04:39 +000024int check_pool2d_attribute(tosa::TosaPoolAttribute* attribute,
25 std::vector<int32_t> input_shape,
26 std::vector<int32_t> output_shape,
27 std::string& msg)
Kevin Cheng7eb93d72021-10-09 01:26:08 +000028{
TatWai Chong86c403b2022-06-06 20:46:01 -070029 if (attribute->pad().size() != 4)
Kevin Cheng7eb93d72021-10-09 01:26:08 +000030 {
31 msg = "illegal size for attribute padding";
32 return 1;
33 }
34
35 if (attribute->kernel().size() != 2)
36 {
37 msg = "illegal size for attribute kernel";
38 return 1;
39 }
40
41 if (attribute->stride().size() != 2)
42 {
43 msg = "illegal size for attribute stride";
44 return 1;
45 }
46
TatWai Chong86c403b2022-06-06 20:46:01 -070047 for (int32_t i : attribute->pad())
Kevin Cheng7eb93d72021-10-09 01:26:08 +000048 {
49 if (i < 0)
50 {
51 msg = "At least one pad is smaller than zero";
52 return 1;
53 }
54 }
55
56 for (int32_t i : attribute->kernel())
57 {
58 if (i < 1)
59 {
Kevin Cheng9fe17242021-11-10 01:04:39 +000060 msg = "At least one kernel dimension is smaller than one";
Kevin Cheng7eb93d72021-10-09 01:26:08 +000061 return 1;
62 }
63 }
64
65 for (int32_t i : attribute->stride())
66 {
67 if (i < 1)
68 {
Kevin Cheng9fe17242021-11-10 01:04:39 +000069 msg = "At least one stride dimension is smaller than one";
Kevin Cheng7eb93d72021-10-09 01:26:08 +000070 return 1;
71 }
72 }
73
74 int32_t IH = input_shape[1];
75 int32_t IW = input_shape[2];
76 int32_t OH = output_shape[1];
77 int32_t OW = output_shape[2];
78
TatWai Chong86c403b2022-06-06 20:46:01 -070079 int32_t pad_top = attribute->pad()[0];
80 int32_t pad_bottom = attribute->pad()[1];
81 int32_t pad_left = attribute->pad()[2];
82 int32_t pad_right = attribute->pad()[3];
Kevin Cheng7eb93d72021-10-09 01:26:08 +000083
84 int32_t stride_y = attribute->stride()[0];
85 int32_t stride_x = attribute->stride()[1];
86 int32_t kernel_y = attribute->kernel()[0];
87 int32_t kernel_x = attribute->kernel()[1];
88
89 if (pad_top >= kernel_y || pad_bottom >= kernel_y || pad_left >= kernel_x || pad_right >= kernel_x)
90 {
91 msg = "At least one pad is >= kernel dimension";
92 return 1;
93 }
94
Jeremy Johnson4a6fb9b2022-04-26 15:47:21 +010095 int32_t full_H = IH + pad_top + pad_bottom - kernel_y;
96 int32_t full_W = IW + pad_left + pad_right - kernel_x;
97
98 if ((full_H % stride_y != 0) ||
99 (full_W % stride_x != 0))
Kevin Cheng7eb93d72021-10-09 01:26:08 +0000100 {
Jeremy Johnson4a6fb9b2022-04-26 15:47:21 +0100101 msg = "Parameters must yield exact integer output dimensions";
102 return 1;
103 }
104
105 if ((OH != (full_H / stride_y) + 1) ||
106 (OW != (full_W / stride_x) + 1))
107 {
108 msg = "Mismatch between output shape provided and expected output shape (" +
109 std::to_string((full_H / stride_y) + 1) + "," +
110 std::to_string((full_W / stride_x) + 1) + ")";
Kevin Cheng7eb93d72021-10-09 01:26:08 +0000111 return 1;
112 }
113
114 return 0;
115}
116
Eric Kunzeb5fabec2022-06-07 05:20:44 +0000117int check_conv_attribute(tosa::TosaConvAttribute* attribute,
Kevin Cheng9fe17242021-11-10 01:04:39 +0000118 uint32_t conv_dimension,
119 std::vector<int32_t> input_shape,
120 std::vector<int32_t> output_shape,
Jeremy Johnson4a6fb9b2022-04-26 15:47:21 +0100121 std::vector<int32_t> weights,
122 uint32_t offset_kernel,
Kevin Cheng9fe17242021-11-10 01:04:39 +0000123 DType InDtype,
124 DType WeightDtype,
125 std::string& msg)
126{
TatWai Chong86c403b2022-06-06 20:46:01 -0700127 if (attribute->pad().size() != (2 * conv_dimension))
Kevin Cheng9fe17242021-11-10 01:04:39 +0000128 {
TatWai Chong86c403b2022-06-06 20:46:01 -0700129 msg = "Illegal size for attribute pad";
Kevin Cheng9fe17242021-11-10 01:04:39 +0000130 return 1;
131 }
132
133 if (attribute->stride().size() != conv_dimension)
134 {
135 msg = "Illegal size for attribute stride";
136 return 1;
137 }
138
139 if (attribute->dilation().size() != conv_dimension)
140 {
141 msg = "Illegal size for attribute dilation";
142 return 1;
143 }
144
TatWai Chong86c403b2022-06-06 20:46:01 -0700145 for (int32_t i : attribute->pad())
Kevin Cheng9fe17242021-11-10 01:04:39 +0000146 {
147 if (i < 0)
148 {
149 msg = "At least one pad is smaller than zero";
150 return 1;
151 }
152 }
153
154 for (int32_t i : attribute->stride())
155 {
156 if (i < 1)
157 {
158 msg = "At least one stride dimension is smaller than one";
159 return 1;
160 }
161 }
162
163 for (int32_t i : attribute->dilation())
164 {
165 if (i < 1)
166 {
167 msg = "At least one dilation dimension is smaller than one";
168 return 1;
169 }
170 }
171
Jeremy Johnson4a6fb9b2022-04-26 15:47:21 +0100172 ASSERT_MSG(conv_dimension == 2 || conv_dimension == 3, "Unsupported convolution dimension")
173
174 int32_t offset_d = 1 ? conv_dimension == 3 : 0;
175 int32_t ID = conv_dimension == 3 ? input_shape[1] : 1;
176 int32_t IH = input_shape[1 + offset_d];
177 int32_t IW = input_shape[2 + offset_d];
178 int32_t OD = conv_dimension == 3 ? output_shape[1] : 1;
179 int32_t OH = output_shape[1 + offset_d];
180 int32_t OW = output_shape[2 + offset_d];
181
182 int32_t stride_d = conv_dimension == 3 ? attribute->stride()[0] : 1;
183 int32_t stride_y = attribute->stride()[0 + offset_d];
184 int32_t stride_x = attribute->stride()[1 + offset_d];
185 int32_t kernel_d = conv_dimension == 3 ? weights[offset_kernel] : 1;
186 int32_t kernel_h = weights[offset_kernel + offset_d];
187 int32_t kernel_w = weights[offset_kernel + 1 + offset_d];
188 int32_t dilation_d = conv_dimension == 3 ? attribute->dilation()[0] : 1;
189 int32_t dilation_y = attribute->dilation()[0 + offset_d];
190 int32_t dilation_x = attribute->dilation()[1 + offset_d];
191
192 offset_d *= 2;
TatWai Chong86c403b2022-06-06 20:46:01 -0700193 int32_t pad_d0 = conv_dimension == 3 ? attribute->pad()[0] : 0;
194 int32_t pad_d1 = conv_dimension == 3 ? attribute->pad()[1] : 0;
195 int32_t pad_top = attribute->pad()[0 + offset_d];
196 int32_t pad_bottom = attribute->pad()[1 + offset_d];
197 int32_t pad_left = attribute->pad()[2 + offset_d];
198 int32_t pad_right = attribute->pad()[3 + offset_d];
Jeremy Johnson4a6fb9b2022-04-26 15:47:21 +0100199
200 int32_t full_D = ID - 1 + pad_d0 + pad_d1 - (kernel_d - 1) * dilation_d;
201 int32_t full_H = IH - 1 + pad_top + pad_bottom - (kernel_h - 1) * dilation_y;
202 int32_t full_W = IW - 1 + pad_left + pad_right - (kernel_w - 1) * dilation_x;
203
204 if ((full_H % stride_y != 0) ||
205 (full_W % stride_x != 0) ||
206 (full_D % stride_d != 0))
207 {
208 msg = "Parameters must yield exact integer output dimensions";
209 return 1;
210 }
211
212 if ((OH != (full_H / stride_y) + 1) ||
213 (OW != (full_W / stride_x) + 1) ||
214 (OD != (full_D / stride_d) + 1))
215 {
216 std::string msg_d = "";
217 if (conv_dimension == 3)
218 {
219 msg_d += std::to_string((full_D / stride_d) + 1) + ",";
220 }
221 msg = "Mismatch between output shape provided and expected output shape (" +
222 msg_d +
223 std::to_string((full_H / stride_y) + 1) + "," +
224 std::to_string((full_W / stride_x) + 1) + ")";
225 return 1;
226 }
227
Eric Kunzeb5fabec2022-06-07 05:20:44 +0000228 if (InDtype != DType_INT8 && attribute->input_zp() != 0) {
229 msg = "Input zero point must be zero for non-int8 data";
230 return 1;
231 }
232 if (WeightDtype != DType_INT8 && attribute->weight_zp() != 0) {
233 msg = "Weight zero point must be zero for non-int8 data";
234 return 1;
Kevin Cheng9fe17242021-11-10 01:04:39 +0000235 }
236
237 return 0;
238}
239
// ARGMAX operator node: records operand/rank requirements and reads the
// Axis attribute. Validation happens later in checkTensorAttributes().
template <int Rank, DType Dtype>
OpArgMax<Rank, Dtype>::OpArgMax(SubgraphTraverser* sgt_,
                                TosaAttributeBase* attribute_,
                                uint64_t id_)
    : GraphNode(sgt_, Op_ARGMAX, id_)
{
    setRequiredOperands(1, 1);  // one input, one output
    setRequiredRank(1, 4);      // input rank restricted to [1, 4]

    // Populates this->attribute from attribute_ (macro defined elsewhere).
    INIT_ATTRIBUTE(Axis);
}
251
252template <int Rank, DType Dtype>
253OpArgMax<Rank, Dtype>::~OpArgMax()
254{
255 if (attribute)
256 delete attribute;
257}
258
259template <int Rank, DType Dtype>
260int OpArgMax<Rank, Dtype>::checkTensorAttributes()
261{
262 if (validateRequiredOperands())
263 return 1;
264
Kevin Chengcc61be32021-10-14 17:09:57 -0700265 if (validateRequiredRank(inputs[0]))
Eric Kunzee5e26762020-10-13 16:11:07 -0700266 {
267 return 1;
268 }
269
Kevin Chengcc61be32021-10-14 17:09:57 -0700270 int32_t output_rank = inputs[0]->getRank() - 1;
271 if (output_rank != outputs[0]->getRank())
272 {
273 printNodeValidationError("OpArgMax: Output rank needs to be rank(input) - 1");
274 return 1;
275 }
276
277 if (outputs[0]->getDtype() != DType_INT32)
278 {
279 printNodeValidationError("OpArgMax: Output data type not supported for this configuration of operator");
280 return 1;
281 }
282
Eric Kunzee5e26762020-10-13 16:11:07 -0700283 input = dynamic_cast<TosaReference::TensorTemplate<TIn>*>(inputs[0]);
284 output = dynamic_cast<TosaReference::TensorTemplate<TOut>*>(outputs[0]);
285
Kevin Chengcc61be32021-10-14 17:09:57 -0700286 if (attribute->axis() < 0 || attribute->axis() >= input->getRank())
287 {
288 printNodeValidationError("OpArgMax: Axis needs to be within [0, rank(input)]");
289 return 1;
290 }
291
292 bool shape_check = true;
293 for (int32_t i = 0; i < input->getRank(); i++)
294 {
295 if (i < attribute->axis())
296 {
297 if (input->getShape()[i] != output->getShape()[i])
298 {
299 shape_check = false;
300 break;
301 }
302 }
303 else if (i > attribute->axis())
304 {
305 if (input->getShape()[i] != output->getShape()[i - 1])
306 {
307 shape_check = false;
308 break;
309 }
310 }
311 // No need to check i == axis
312 }
313 if (!shape_check)
314 {
315 printNodeValidationError("OpArgMax: Mismatch between output shape provided and expected output shape");
316 return 1;
317 }
318
Eric Kunzee5e26762020-10-13 16:11:07 -0700319 return 0;
320}
321
322template <int Rank, DType Dtype>
323int OpArgMax<Rank, Dtype>::eval()
324{
325 Eigen::Tensor<DenseIndex, Rank - 1> index = this->input->getTensor().argmax(attribute->axis());
326
327 this->output->getTensor() = index.unaryExpr([](DenseIndex in) -> OutEigenType { return (OutEigenType)in; });
328
329 return GraphNode::eval();
330}
331
// AVG_POOL2D operator node: records operand/rank requirements and reads the
// Pool attribute (pad/kernel/stride, zero points).
template <DType Dtype>
OpAvgPool2d<Dtype>::OpAvgPool2d(SubgraphTraverser* sgt_,
                                TosaAttributeBase* attribute_,
                                uint64_t id_)
    : GraphNode(sgt_, Op_AVG_POOL2D, id_)
{
    setRequiredOperands(1, 1);  // one input, one output
    setRequiredRank(4);         // NHWC tensors only

    // Populates this->attribute from attribute_ (macro defined elsewhere).
    INIT_ATTRIBUTE(Pool);
}
343
344template <DType Dtype>
345OpAvgPool2d<Dtype>::~OpAvgPool2d()
346{
347 if (attribute)
348 delete attribute;
349}
350
351template <DType Dtype>
352int OpAvgPool2d<Dtype>::checkTensorAttributes()
353{
354 if (validateRequiredOperands())
355 return 1;
356
357 if (validateRequiredRank(inputs[0]) || validateRequiredRank(outputs[0]))
358 {
359 return 1;
360 }
361
362 if (inputs[0]->matchType(*outputs[0]))
363 {
364 printNodeValidationError("OpAvgPool2d: input and output tensor type mismatch");
365 return 1;
366 }
367
368 in = dynamic_cast<TosaReference::TensorTemplate<TIn>*>(inputs[0]);
369 out = dynamic_cast<TosaReference::TensorTemplate<TOut>*>(outputs[0]);
370
Eric Kunzeb5fabec2022-06-07 05:20:44 +0000371 ERROR_IF(Dtype != DType_INT8 && attribute->input_zp() != 0, "OpAvgPool2d: Input zeropoint must be zero for non int8_t data");
372 ERROR_IF(Dtype != DType_INT8 && attribute->output_zp() != 0, "OpAvgPool2d: Output zeropoint must be zero for non int8_t data");
Eric Kunzee5e26762020-10-13 16:11:07 -0700373
Kevin Cheng7eb93d72021-10-09 01:26:08 +0000374 std::string msg;
Kevin Cheng9fe17242021-11-10 01:04:39 +0000375 if (check_pool2d_attribute(attribute, in->getShape(), out->getShape(), msg))
Eric Kunzee5e26762020-10-13 16:11:07 -0700376 {
Kevin Cheng7eb93d72021-10-09 01:26:08 +0000377 msg = "OpAvgPool2d: " + msg;
378 printNodeValidationError(msg.c_str());
Eric Kunzee5e26762020-10-13 16:11:07 -0700379 return 1;
380 }
381
382 return 0;
383}
384
Eric Kunze830add42022-01-25 22:56:46 -0800385// This calculates the number of padding elements used for each location along an axis
386// Average pooling only divides by the number of elements used, not including padding.
387// This function uses left/right, but is also used for vertical padding with top/bottom
Eric Kunzee5e26762020-10-13 16:11:07 -0700388template <DType Dtype>
Eric Kunze830add42022-01-25 22:56:46 -0800389ETensor1<int32_t> OpAvgPool2d<Dtype>::calculate_div_map_1d(int in_size, int out_size, int kernel_size, int stride, int32_t pad_left, int32_t pad_right)
Eric Kunzee5e26762020-10-13 16:11:07 -0700390{
391 ETensor1<int32_t> result(out_size);
392
Eric Kunzee5e26762020-10-13 16:11:07 -0700393 result.setConstant(kernel_size);
394
Eric Kunze830add42022-01-25 22:56:46 -0800395 // adjust divisors on the left side for padding
396 // We start at the leftmost output element, and remove pad_left - (index * stride) elements
397 // until we have no more padding being used
Eric Kunze67a91552022-02-02 11:27:21 -0800398 for(int index = 0; (index <= pad_left / stride) && (index < out_size); index++) {
Eric Kunze830add42022-01-25 22:56:46 -0800399 int32_t adjust = pad_left - (index * stride);
400 result(index) -= adjust;
Eric Kunzee5e26762020-10-13 16:11:07 -0700401 }
402
Eric Kunze830add42022-01-25 22:56:46 -0800403 // The process repeats on the right side. Padding starts taking effect as we
404 // near the rightmost input element. The first output element which touches
405 // padding is defined in the initialization of index below. Then we keep moving
406 // to the right, increasing padding until we get to the last output element.
407 int index = std::max(0, ((pad_left + in_size - kernel_size) / stride) + 1);
408 for (; index < out_size; index++) {
409 int32_t adjust = ((index * stride) + kernel_size) - (pad_left + in_size);
410 result(index) -= adjust;
Eric Kunzee5e26762020-10-13 16:11:07 -0700411 }
Eric Kunzee5e26762020-10-13 16:11:07 -0700412 return result;
413}
414
// assuming input and output tensor have same scales like tflite reference
// so no need to scale input and output
//
// Evaluate AVG_POOL2D via im2col: pad the input, gather each kernel window
// into a column, sum the columns, then divide each output element by the
// number of non-padding input elements its window covered.
template <DType Dtype>
int OpAvgPool2d<Dtype>::eval()
{
    int in_batch    = this->in->getShape()[0];
    int in_height   = this->in->getShape()[1];
    int in_width    = this->in->getShape()[2];
    int in_channels = this->in->getShape()[3];

    int out_batch    = this->out->getShape()[0];
    int out_height   = this->out->getShape()[1];
    int out_width    = this->out->getShape()[2];
    int out_channels = this->out->getShape()[3];

    ERROR_IF(in_batch != out_batch, "OpAvgPool2d: tensor batch mismatch %d != %d", in_batch, out_batch);
    ERROR_IF(in_channels != out_channels, "OpAvgPool2d: tensor channel mismatch %d != %d", in_channels, out_channels);

    int pad_top    = this->attribute->pad()[0];
    int pad_bottom = this->attribute->pad()[1];
    int pad_left   = this->attribute->pad()[2];
    int pad_right  = this->attribute->pad()[3];
    int kernel_h   = this->attribute->kernel()[0];
    int kernel_w   = this->attribute->kernel()[1];
    int stride_h   = this->attribute->stride()[0];
    int stride_w   = this->attribute->stride()[1];

    DEBUG_INFO(OP,
               "perform AvgPool2d, input.shape=[%d,%d,%d,%d], output.shape=[%d,%d,%d,%d], kernel=[%d,%d], "
               "stride=[%d,%d], pad=[%d,%d,%d,%d]",
               in_batch, in_height, in_width, in_channels, out_batch, out_height, out_width, out_channels, kernel_h,
               kernel_w, stride_h, stride_w, pad_top, pad_bottom, pad_left, pad_right);

    // im2col layout: one column of kernel_h*kernel_w elements per output element.
    Eigen::array<Eigen::Index, 2> im2col_input_dims;
    im2col_input_dims[0] = kernel_h * kernel_w;
    im2col_input_dims[1] = out_batch * out_height * out_width * out_channels;

    Eigen::array<Eigen::Index, 4> col2im_output_dims;
    col2im_output_dims[0] = out_batch;
    col2im_output_dims[1] = out_height;
    col2im_output_dims[2] = out_width;
    col2im_output_dims[3] = out_channels;

    // Pad only the spatial (H, W) dimensions.
    Eigen::array<std::pair<int32_t, int32_t>, 4> pad;
    pad[0] = std::make_pair(0, 0);
    pad[1] = std::make_pair(pad_top, pad_bottom);
    pad[2] = std::make_pair(pad_left, pad_right);
    pad[3] = std::make_pair(0, 0);

    ETensor4<InEigenType> input_val = this->in->getTensor();
    if (Dtype == DType_INT8)
    {
        // Remove the input zero point before summing so padding contributes 0.
        input_val = input_val - (InEigenType)attribute->input_zp();
    }

    ETensor4<InEigenType> input_padded = input_val.pad(pad);

    // assuming input and output have same scales
    // so input and output scaling is not required
    // TODO: check if this assumption TOSA made

    // extract_image_patches() output [N, KH, KW, H * W, C]
    // transpose to [KH, KW, N, H * W, C]
    // reshape to [KH * KW, N * H * W * C]
    ETensor2<InEigenType> input_extract_patches =
        input_padded.extract_image_patches(kernel_h, kernel_w, stride_h, stride_w, 1, 1, Eigen::PADDING_VALID)
            .shuffle(Eigen::array<Eigen::Index, 5>{ 1, 2, 0, 3, 4 })
            .reshape(im2col_input_dims);

    // 1D result with [N * H * W * C]
    ETensor1<AccEigenType> out_1d(this->out->getElementCount());
    out_1d.setZero();

    // sum pool: accumulate each column (one kernel window) in the wider
    // accumulator type to avoid overflow.
    for (size_t i = 0; i < this->out->getElementCount(); i++)
    {
        for (int32_t j = 0; j < kernel_h * kernel_w; j++)
        {
            out_1d(i) += (AccEigenType)input_extract_patches(j, i);
        }
    }

    // reshape result to [N, H, W, C] and divide with div_map
    ETensor4<AccEigenType> sum = out_1d.reshape(col2im_output_dims);

    // calculate 1d height/width div_map (number of elements this pooling window covers)
    // and outer product to get 2d div_map, then reshape/broadcast to [N, H, W, C]
    ETensor1<int32_t> div_map_h = calculate_div_map_1d(in_height, out_height, kernel_h, stride_h, pad_top, pad_bottom);
    ETensor1<int32_t> div_map_w = calculate_div_map_1d(in_width, out_width, kernel_w, stride_w, pad_left, pad_right);
    Eigen::array<Eigen::IndexPair<Eigen::Index>, 1> contract_dims = { Eigen::IndexPair<Eigen::Index>(1, 0) };
    Eigen::array<Eigen::Index, 4> bcast{ out_batch, 1, 1, out_channels };

    // Outer product of the per-row and per-column divisor vectors gives the
    // per-(h, w) element count, broadcast across batch and channel.
    ETensor4<int32_t> div_map =
        div_map_h.reshape(Eigen::array<Eigen::Index, 2>{ out_height, 1 })
            .contract(div_map_w.reshape(Eigen::array<Eigen::Index, 2>{ 1, out_width }), contract_dims)
            .reshape(Eigen::array<Eigen::Index, 4>{ 1, out_height, out_width, 1 })
            .broadcast(bcast);

    if (Dtype != DType_FLOAT)
    {
        // Integer path: divide via fixed-point reciprocal scaling, then apply
        // the output zero point and clamp to the output type's range.
        try
        {
            this->out->getTensor() = sum.binaryExpr(div_map, [](AccEigenType value, int32_t div) -> OutEigenType {
                int32_t multiplier, shift;
                TosaReference::QuantUtil::reciprocal_scale(div, multiplier, shift);

                return (OutEigenType)TosaReference::QuantUtil::apply_scale_32(value, multiplier, shift, false);
            });
        }
        catch (std::string desc)
        {
            REQUIRE(false, "OpAvgPool2d apply_scale_32() fails: %s.", desc.c_str());
        }
        this->out->getTensor() = this->out->getTensor() + (OutEigenType)(attribute->output_zp());
        this->out->getTensor() = this->out->getTensor().cwiseMax((OutEigenType)QMin);
        this->out->getTensor() = this->out->getTensor().cwiseMin((OutEigenType)QMax);
    }
    else
    {
        // Float path: plain element-wise division by the element counts.
        this->out->getTensor() = (sum / div_map.template cast<AccEigenType>()).template cast<OutEigenType>();
    }

    return GraphNode::eval();
}
539
// CONV2D operator node: records operand/rank requirements and reads the
// Conv attribute (pad/stride/dilation, zero points).
template <DType InDtype, DType WeightDtype>
OpConv2d<InDtype, WeightDtype>::OpConv2d(SubgraphTraverser* sgt_,
                                         TosaAttributeBase* attribute_,
                                         uint64_t id_)
    : GraphNode(sgt_, Op_CONV2D, id_)
{
    setRequiredOperands(3, 1);  // input, weight, bias -> output
    setRequiredRank(4);         // NHWC input / OHWI weight

    // Populates this->attribute from attribute_ (macro defined elsewhere).
    INIT_ATTRIBUTE(Conv);
}
551
552template <DType InDtype, DType WeightDtype>
553OpConv2d<InDtype, WeightDtype>::~OpConv2d()
554{
555 if (attribute)
556 delete attribute;
Eric Kunzee5e26762020-10-13 16:11:07 -0700557}
558
559template <DType InDtype, DType WeightDtype>
560int OpConv2d<InDtype, WeightDtype>::checkTensorAttributes()
561{
562 if (validateRequiredOperands())
563 return 1;
564
565 if (validateRequiredRank(inputs[0]) || validateRequiredRank(inputs[1]) || validateRequiredRank(outputs[0]))
566 {
567 return 1;
568 }
569
570 // 'bias' checked separatedly since it doens't make sense to make required rank ranging from 1 to 4
571 if (inputs[2]->getRank() != 1)
572 {
573 printNodeValidationError("OpConv2d: bias tensor must be rank 1");
574 }
575
Kevin Chengcc61be32021-10-14 17:09:57 -0700576 ERROR_IF(outputs[0]->getDtype() != AccDtype,
Kevin Cheng80794802021-11-01 11:14:13 -0700577 "OpConv2d: Output data type not supported for this configuration of operator");
Kevin Chengcc61be32021-10-14 17:09:57 -0700578
Eric Kunzee5e26762020-10-13 16:11:07 -0700579 input = dynamic_cast<TosaReference::TensorTemplate<TIn>*>(inputs[0]);
580 weight = dynamic_cast<TosaReference::TensorTemplate<TWeight>*>(inputs[1]);
581 bias = dynamic_cast<TosaReference::TensorTemplate<TBias>*>(inputs[2]);
582 output = dynamic_cast<TosaReference::TensorTemplate<TAcc>*>(outputs[0]);
583
Kevin Cheng9fe17242021-11-10 01:04:39 +0000584 std::string msg;
Eric Kunzeb5fabec2022-06-07 05:20:44 +0000585 if (check_conv_attribute(attribute, 2 /* conv_dimension */, input->getShape(), output->getShape(),
Jeremy Johnson4a6fb9b2022-04-26 15:47:21 +0100586 weight->getShape(), 1 /* offset_kernel */, InDtype, WeightDtype, msg))
Eric Kunzee5e26762020-10-13 16:11:07 -0700587 {
Kevin Cheng9fe17242021-11-10 01:04:39 +0000588 msg = "OpConv2d: " + msg;
589 printNodeValidationError(msg.c_str());
Eric Kunzee5e26762020-10-13 16:11:07 -0700590 return 1;
591 }
592
Eric Kunzee5e26762020-10-13 16:11:07 -0700593 return 0;
594}
595
596template <DType InDtype, DType WeightDtype>
597int OpConv2d<InDtype, WeightDtype>::eval()
598{
599 int in_batch = this->input->getShape()[0];
600 int in_height = this->input->getShape()[1];
601 int in_width = this->input->getShape()[2];
602 int in_channels = this->input->getShape()[3];
603
604 int f_out_channels = this->weight->getShape()[0];
605 int f_height = this->weight->getShape()[1];
606 int f_width = this->weight->getShape()[2];
607 int f_in_channels = this->weight->getShape()[3];
608
609 int b_out_channels = this->bias->getShape()[0];
610
611 int out_batch = this->output->getShape()[0];
612 int out_height = this->output->getShape()[1];
613 int out_width = this->output->getShape()[2];
614 int out_channels = this->output->getShape()[3];
615
Kevin Chengacb550f2021-06-29 15:32:19 -0700616 ERROR_IF(in_batch != out_batch, "OpConv2d: tensor batch mismatch %d != %d", in_batch, out_batch);
617 ERROR_IF(f_in_channels != in_channels, "OpConv2d: tensor input channel mismatch %d != %d", f_in_channels,
618 in_channels);
619 ERROR_IF(f_out_channels != out_channels, "OpConv2d: tensor output channel mismatch %d != %d", f_out_channels,
620 out_channels);
621 ERROR_IF(b_out_channels != out_channels, "OpConv2d: bias channel mismatch %d != %d", b_out_channels, out_channels);
Eric Kunzee5e26762020-10-13 16:11:07 -0700622
TatWai Chong86c403b2022-06-06 20:46:01 -0700623 int pad_top = this->attribute->pad()[0];
624 int pad_bottom = this->attribute->pad()[1];
625 int pad_left = this->attribute->pad()[2];
626 int pad_right = this->attribute->pad()[3];
627
Eric Kunzee5e26762020-10-13 16:11:07 -0700628 int stride_h = this->attribute->stride()[0];
629 int stride_w = this->attribute->stride()[1];
630 int dilation_h = this->attribute->dilation()[0];
631 int dilation_w = this->attribute->dilation()[1];
632
633 DEBUG_INFO(OP,
634 "perform OpConv2d, input.shape=[%d,%d,%d,%d], weight.shape=[%d,%d,%d,%d], output.shape=[%d,%d,%d,%d], "
TatWai Chong86c403b2022-06-06 20:46:01 -0700635 "stride=[%d,%d], dilation=[%d,%d], pad=[%d,%d,%d,%d]",
Eric Kunzee5e26762020-10-13 16:11:07 -0700636 in_batch, in_height, in_width, in_channels, f_height, f_width, f_in_channels, f_out_channels, out_batch,
TatWai Chong86c403b2022-06-06 20:46:01 -0700637 out_height, out_width, out_channels, stride_h, stride_w, dilation_h, dilation_w, pad_top,
638 pad_bottom, pad_left, pad_right);
Eric Kunzee5e26762020-10-13 16:11:07 -0700639
640 // GEMM-conv2d, left matrix is input, right matrix is weight
641 Eigen::array<Eigen::Index, 2> im2col_input_dims;
642 im2col_input_dims[0] = out_batch * out_height * out_width;
643 im2col_input_dims[1] = f_height * f_width * f_in_channels;
644
645 Eigen::array<Eigen::Index, 2> im2col_weight_dims;
646 im2col_weight_dims[0] = f_height * f_width * f_in_channels;
647 im2col_weight_dims[1] = f_out_channels;
648
649 Eigen::array<Eigen::Index, 2> bias_reshaped_dims;
650 bias_reshaped_dims[0] = 1;
651 bias_reshaped_dims[1] = b_out_channels;
652
653 Eigen::array<Eigen::Index, 4> weight_zp_bcast_dims;
654 weight_zp_bcast_dims[0] = f_height;
655 weight_zp_bcast_dims[1] = f_width;
656 weight_zp_bcast_dims[2] = f_in_channels;
657
658 Eigen::array<Eigen::Index, 2> bias_bcast_dims;
659 bias_bcast_dims[0] = out_batch * out_height * out_width;
660 bias_bcast_dims[1] = 1;
661
662 Eigen::array<Eigen::Index, 4> col2im_output_dims;
663 col2im_output_dims[0] = out_batch;
664 col2im_output_dims[1] = out_height;
665 col2im_output_dims[2] = out_width;
666 col2im_output_dims[3] = out_channels;
667
668 Eigen::array<Eigen::IndexPair<Eigen::Index>, 1> contract_dims = { Eigen::IndexPair<Eigen::Index>(1, 0) };
669
TatWai Chong86c403b2022-06-06 20:46:01 -0700670 Eigen::array<std::pair<int32_t, int32_t>, 4> pad;
671 pad[0] = std::make_pair(0, 0);
672 pad[1] = std::make_pair(pad_top, pad_bottom);
673 pad[2] = std::make_pair(pad_left, pad_right);
674 pad[3] = std::make_pair(0, 0);
Eric Kunzee5e26762020-10-13 16:11:07 -0700675
676 TIn input_val = this->input->getTensor();
677 TWeight weight_val = this->weight->getTensor();
Eric Kunzef7337832022-06-17 08:19:12 -0700678 if (InDtype == DType_INT8 || WeightDtype == DType_INT8)
Eric Kunzee5e26762020-10-13 16:11:07 -0700679 {
Eric Kunzeb5fabec2022-06-07 05:20:44 +0000680 input_val = input_val - (InEigenType)attribute->input_zp();
681 weight_val = weight_val - (WeightEigenType)attribute->weight_zp();
Eric Kunzee5e26762020-10-13 16:11:07 -0700682 }
683
TatWai Chong86c403b2022-06-06 20:46:01 -0700684 ETensor4<InEigenType> input_padded = input_val.pad(pad);
Eric Kunzee5e26762020-10-13 16:11:07 -0700685
686 // extract_image_patches() output [N, KH, KW, H * W, C]
687 // need to transpose to [N, H * W, KH, KW, C]
688 ETensor5<InEigenType> input_extract_patches =
689 input_padded
690 .extract_image_patches(f_height, f_width, stride_h, stride_w, dilation_h, dilation_w, Eigen::PADDING_VALID)
691 .shuffle(Eigen::array<Eigen::Index, 5>{ 0, 3, 1, 2, 4 });
692
693 // reshape input to [N * H * W, KH * KW * C]
694 ETensor2<InEigenType> im2col_input = input_extract_patches.reshape(im2col_input_dims);
695
696 // transpose and reshape weight from [OC, H, W, IC] to [H * W * IC, OC]
697 ETensor2<WeightEigenType> im2col_weight =
698 weight_val.shuffle(Eigen::array<Eigen::Index, 4>({ 1, 2, 3, 0 })).reshape(im2col_weight_dims);
699
700 // don't need to apply bias_multiplier ( * bias_scale and >> bias_shift) since tflite already scale it
701 // and reshaped from [C] to [1, C], and broadcast to [N * H * W, C]
702 ETensor2<AccEigenType> bias_2d = this->bias->getTensor().reshape(bias_reshaped_dims).broadcast(bias_bcast_dims);
703
704 // output matrix is [N * H * W, C]
705 ETensor2<AccEigenType> contracted_result =
706 im2col_input.template cast<AccEigenType>().contract(im2col_weight.template cast<AccEigenType>(), contract_dims);
707
708 // adding bias
709 ETensor2<AccEigenType> biased_output = contracted_result + bias_2d.template cast<AccEigenType>();
710
711 // reshape back to [N, H, W, C]
712 this->output->getTensor() = biased_output.reshape(col2im_output_dims);
713
714 if (AccDtype == DType_INT48)
715 {
716 this->output->getTensor() = this->output->getTensor().cwiseMax((AccEigenType)AccQMin);
717 this->output->getTensor() = this->output->getTensor().cwiseMin((AccEigenType)AccQMax);
718 }
719
720 return GraphNode::eval();
721}
722
// CONV3D operator node: records operand/rank requirements and reads the
// Conv attribute (pad/stride/dilation, zero points).
template <DType InDtype, DType WeightDtype>
OpConv3d<InDtype, WeightDtype>::OpConv3d(SubgraphTraverser* sgt_,
                                         TosaAttributeBase* attribute_,
                                         uint64_t id_)
    : GraphNode(sgt_, Op_CONV3D, id_)
{
    setRequiredOperands(3, 1);  // input, weight, bias -> output
    setRequiredRank(5);         // NDHWC input / ODHWI weight

    // Populates this->attribute from attribute_ (macro defined elsewhere).
    INIT_ATTRIBUTE(Conv);
}
734
735template <DType InDtype, DType WeightDtype>
736OpConv3d<InDtype, WeightDtype>::~OpConv3d()
737{
738 if (attribute)
739 delete attribute;
Kevin Cheng1533b852021-09-01 12:51:58 -0700740}
741
742template <DType InDtype, DType WeightDtype>
743int OpConv3d<InDtype, WeightDtype>::checkTensorAttributes()
744{
745 if (validateRequiredOperands())
746 return 1;
747
748 if (validateRequiredRank(inputs[0]) || validateRequiredRank(inputs[1]) || validateRequiredRank(outputs[0]))
749 {
750 return 1;
751 }
752
753 // 'bias' checked separatedly since it doens't make sense to make required rank ranging from 1 to 4
754 if (inputs[2]->getRank() != 1)
755 {
756 printNodeValidationError("OpConv3d: bias tensor must be rank 1");
757 }
758
Kevin Chengcc61be32021-10-14 17:09:57 -0700759 ERROR_IF(outputs[0]->getDtype() != AccDtype,
Kevin Cheng80794802021-11-01 11:14:13 -0700760 "OpConv3d: Output data type not supported for this configuration of operator");
Kevin Chengcc61be32021-10-14 17:09:57 -0700761
Kevin Cheng1533b852021-09-01 12:51:58 -0700762 input = dynamic_cast<TosaReference::TensorTemplate<TIn>*>(inputs[0]);
763 weight = dynamic_cast<TosaReference::TensorTemplate<TWeight>*>(inputs[1]);
764 bias = dynamic_cast<TosaReference::TensorTemplate<TBias>*>(inputs[2]);
765 output = dynamic_cast<TosaReference::TensorTemplate<TAcc>*>(outputs[0]);
766
Kevin Cheng9fe17242021-11-10 01:04:39 +0000767 std::string msg;
Eric Kunzeb5fabec2022-06-07 05:20:44 +0000768 if (check_conv_attribute(attribute, 3 /* conv_dimension */, input->getShape(), output->getShape(),
Jeremy Johnson4a6fb9b2022-04-26 15:47:21 +0100769 weight->getShape(), 1 /* offset_kernel */, InDtype, WeightDtype, msg))
Kevin Cheng1533b852021-09-01 12:51:58 -0700770 {
Kevin Cheng9fe17242021-11-10 01:04:39 +0000771 msg = "OpConv3d: " + msg;
772 printNodeValidationError(msg.c_str());
Kevin Cheng1533b852021-09-01 12:51:58 -0700773 return 1;
774 }
775
Kevin Cheng1533b852021-09-01 12:51:58 -0700776 return 0;
777}
778
template <DType InDtype, DType WeightDtype>
int OpConv3d<InDtype, WeightDtype>::eval()
{
    // Direct (non-GEMM) 3D convolution over NDHWC input with OZHWC weights.
    // Output is initialized from the bias, then accumulated in AccEigenType.
    int in_batch    = this->input->getShape()[0];
    int in_depth    = this->input->getShape()[1];
    int in_height   = this->input->getShape()[2];
    int in_width    = this->input->getShape()[3];
    int in_channels = this->input->getShape()[4];

    int f_out_channels = this->weight->getShape()[0];
    int f_depth        = this->weight->getShape()[1];
    int f_height       = this->weight->getShape()[2];
    int f_width        = this->weight->getShape()[3];
    int f_in_channels  = this->weight->getShape()[4];

    int b_out_channels = this->bias->getShape()[0];

    int out_batch    = this->output->getShape()[0];
    int out_depth    = this->output->getShape()[1];
    int out_height   = this->output->getShape()[2];
    int out_width    = this->output->getShape()[3];
    int out_channels = this->output->getShape()[4];

    // Runtime shape-consistency checks between input, weight, bias and output.
    ERROR_IF(in_batch != out_batch, "OpConv3d: tensor batch mismatch %d != %d", in_batch, out_batch);
    ERROR_IF(f_in_channels != in_channels, "OpConv3d: tensor input channel mismatch %d != %d", f_in_channels,
             in_channels);
    ERROR_IF(f_out_channels != out_channels, "OpConv3d: tensor output channel mismatch %d != %d", f_out_channels,
             out_channels);
    ERROR_IF(b_out_channels != out_channels, "OpConv3d: bias channel mismatch %d != %d", b_out_channels, out_channels);

    // pad() layout: [d0, d1, top, bottom, left, right].
    int pad_d0     = this->attribute->pad()[0];
    int pad_d1     = this->attribute->pad()[1];
    int pad_top    = this->attribute->pad()[2];
    int pad_bottom = this->attribute->pad()[3];
    int pad_left   = this->attribute->pad()[4];
    int pad_right  = this->attribute->pad()[5];

    int stride_d = this->attribute->stride()[0];
    int stride_h = this->attribute->stride()[1];
    int stride_w = this->attribute->stride()[2];

    int dilation_d = this->attribute->dilation()[0];
    int dilation_h = this->attribute->dilation()[1];
    int dilation_w = this->attribute->dilation()[2];

    DEBUG_INFO(
        OP,
        "perform OpConv3d, input.shape=[%d,%d,%d,%d,%d], weight.shape=[%d,%d,%d,%d,%d], output.shape=[%d,%d,%d,%d,%d], "
        "stride=[%d,%d,%d], dilation=[%d,%d,%d], pad=[%d,%d,%d,%d,%d,%d]",
        in_batch, in_depth, in_height, in_width, in_channels, f_out_channels, f_depth, f_height, f_width, f_in_channels,
        out_batch, out_depth, out_height, out_width, out_channels, stride_d, stride_h, stride_w, dilation_d, dilation_h,
        dilation_w, pad_d0, pad_d1, pad_top, pad_bottom, pad_left, pad_right);

    // Zero-pad only the spatial D/H/W dimensions; batch and channel get no padding.
    Eigen::array<std::pair<int32_t, int32_t>, 5> pad;
    pad[0] = std::make_pair(0, 0);
    pad[1] = std::make_pair(pad_d0, pad_d1);
    pad[2] = std::make_pair(pad_top, pad_bottom);
    pad[3] = std::make_pair(pad_left, pad_right);
    pad[4] = std::make_pair(0, 0);

    TIn input_val      = this->input->getTensor();
    TWeight weight_val = this->weight->getTensor();
    // For int8 operands, subtract zero points before accumulation (TOSA requires
    // zero points to be 0 for other dtypes).
    if (InDtype == DType_INT8 || WeightDtype == DType_INT8)
    {
        input_val  = input_val - (InEigenType)attribute->input_zp();
        weight_val = weight_val - (WeightEigenType)attribute->weight_zp();
    }

    ETensor5<InEigenType> input_padded = input_val.pad(pad);

    // 1. initialize with bias, broadcast across batch and the three spatial dims
    Eigen::array<Eigen::Index, 5> reshape_dim;
    reshape_dim.fill(1);
    reshape_dim[4] = b_out_channels;

    Eigen::array<Eigen::Index, 5> bcast;
    bcast[0] = out_batch;
    bcast[1] = out_depth;
    bcast[2] = out_height;
    bcast[3] = out_width;
    bcast[4] = 1;
    this->output->getTensor() = this->bias->getTensor().reshape(reshape_dim).broadcast(bcast);

    // 2. direct convolution: 8-deep loop nest over output element x filter tap.
    AccEigenType acc = 0;
    int d_idx, h_idx, w_idx;

    for (int ob = 0; ob < out_batch; ob++)
    {
        for (int od = 0; od < out_depth; od++)
        {
            for (int oh = 0; oh < out_height; oh++)
            {
                for (int ow = 0; ow < out_width; ow++)
                {
                    for (int oc = 0; oc < out_channels; oc++)
                    {
                        // Initialize accumulator with bias value
                        acc = this->output->getTensor()(ob, od, oh, ow, oc);
                        for (int fd = 0; fd < f_depth; fd++)
                        {
                            // Indices are into the padded input, so no bounds/offset
                            // correction for padding is needed here.
                            d_idx = od * stride_d + fd * dilation_d;
                            for (int fh = 0; fh < f_height; fh++)
                            {
                                h_idx = oh * stride_h + fh * dilation_h;
                                for (int fw = 0; fw < f_width; fw++)
                                {
                                    w_idx = ow * stride_w + fw * dilation_w;
                                    for (int ic = 0; ic < in_channels; ic++)
                                    {
                                        acc += ((AccEigenType)input_padded(ob, d_idx, h_idx, w_idx, ic) *
                                                (AccEigenType)weight_val(oc, fd, fh, fw, ic));
                                    }
                                }
                            }
                        }
                        this->output->getTensor()(ob, od, oh, ow, oc) = acc;
                    }
                }
            }
        }
    }

    // Saturate the INT48 accumulator to its representable range.
    if (AccDtype == DType_INT48)
    {
        this->output->getTensor() = this->output->getTensor().cwiseMax((AccEigenType)AccQMin);
        this->output->getTensor() = this->output->getTensor().cwiseMin((AccEigenType)AccQMax);
    }

    return GraphNode::eval();
}
910
template <DType InDtype, DType WeightDtype>
OpDepthwiseConv2d<InDtype, WeightDtype>::OpDepthwiseConv2d(SubgraphTraverser* sgt_,
                                                           TosaAttributeBase* attribute_,
                                                           uint64_t id_)
    : GraphNode(sgt_, Op_DEPTHWISE_CONV2D, id_)
{
    // DEPTHWISE_CONV2D consumes input, weight and bias tensors, one output.
    setRequiredOperands(3, 1);
    // Input/weight/output are rank-4 tensors (bias rank is checked separately).
    setRequiredRank(4);

    // NOTE(review): shares the Conv attribute with CONV2D/CONV3D — presumably
    // cloned into the 'attribute' member freed by the destructor.
    INIT_ATTRIBUTE(Conv);
}
922
923template <DType InDtype, DType WeightDtype>
924OpDepthwiseConv2d<InDtype, WeightDtype>::~OpDepthwiseConv2d()
925{
926 if (attribute)
927 delete attribute;
Eric Kunzee5e26762020-10-13 16:11:07 -0700928}
929
930template <DType InDtype, DType WeightDtype>
931int OpDepthwiseConv2d<InDtype, WeightDtype>::checkTensorAttributes()
932{
933 if (validateRequiredOperands())
934 return 1;
935
936 if (validateRequiredRank(inputs[0]) || validateRequiredRank(inputs[1]) || validateRequiredRank(outputs[0]))
937 {
938 return 1;
939 }
940
941 // 'bias' checked separatedly since it doens't make sense to make required rank ranging from 1 to 4
942 if (inputs[2]->getRank() != 1)
943 {
944 printNodeValidationError("OpDepthwiseConv2d: bias tensor must be rank 1");
945 }
946
Kevin Chengcc61be32021-10-14 17:09:57 -0700947 ERROR_IF(outputs[0]->getDtype() != AccDtype,
Kevin Cheng80794802021-11-01 11:14:13 -0700948 "OpDepthwiseConv2d: Output data type not supported for this configuration of operator");
Kevin Chengcc61be32021-10-14 17:09:57 -0700949
Eric Kunzee5e26762020-10-13 16:11:07 -0700950 input = dynamic_cast<TosaReference::TensorTemplate<TIn>*>(inputs[0]);
951 weight = dynamic_cast<TosaReference::TensorTemplate<TWeight>*>(inputs[1]);
952 bias = dynamic_cast<TosaReference::TensorTemplate<TBias>*>(inputs[2]);
953 output = dynamic_cast<TosaReference::TensorTemplate<TAcc>*>(outputs[0]);
954
Kevin Cheng9fe17242021-11-10 01:04:39 +0000955 std::string msg;
Eric Kunzeb5fabec2022-06-07 05:20:44 +0000956 if (check_conv_attribute(attribute, 2 /* conv_dimension */, input->getShape(), output->getShape(),
Jeremy Johnson4a6fb9b2022-04-26 15:47:21 +0100957 weight->getShape(), 0 /* offset_kernel */, InDtype, WeightDtype, msg))
Eric Kunzee5e26762020-10-13 16:11:07 -0700958 {
Kevin Cheng9fe17242021-11-10 01:04:39 +0000959 msg = "OpDepthwiseConv2d: " + msg;
960 printNodeValidationError(msg.c_str());
Eric Kunzee5e26762020-10-13 16:11:07 -0700961 return 1;
962 }
963
Eric Kunzee5e26762020-10-13 16:11:07 -0700964 return 0;
965}
966
template <DType InDtype, DType WeightDtype>
int OpDepthwiseConv2d<InDtype, WeightDtype>::eval()
{
    // Depthwise 2D convolution over NHWC input with HWCM weights
    // (M = channel multiplier). Output channel = ic * f_multiplier + cm.
    int in_batch    = this->input->getShape()[0];
    int in_height   = this->input->getShape()[1];
    int in_width    = this->input->getShape()[2];
    int in_channels = this->input->getShape()[3];

    int f_height      = this->weight->getShape()[0];
    int f_width       = this->weight->getShape()[1];
    int f_in_channels = this->weight->getShape()[2];
    int f_multiplier  = this->weight->getShape()[3];

    int b_out_channels = this->bias->getShape()[0];

    int out_batch    = this->output->getShape()[0];
    int out_height   = this->output->getShape()[1];
    int out_width    = this->output->getShape()[2];
    int out_channels = this->output->getShape()[3];

    // Runtime shape-consistency checks between input, weight, bias and output.
    ERROR_IF(in_batch != out_batch, "OpDepthwiseConv2d: tensor batch mismatch %d != %d", in_batch, out_batch);
    ERROR_IF(f_in_channels != in_channels, "OpDepthwiseConv2d: tensor input channel mismatch %d != %d", f_in_channels,
             in_channels);
    ERROR_IF(in_channels * f_multiplier != out_channels, "OpDepthwiseConv2d: tensor output channel mismatch %d != %d",
             in_channels * f_multiplier, out_channels);
    ERROR_IF(b_out_channels != out_channels, "OpDepthwiseConv2d: bias channels mismatch %d != %d", b_out_channels,
             out_channels);

    // pad() layout: [top, bottom, left, right].
    int pad_top    = this->attribute->pad()[0];
    int pad_bottom = this->attribute->pad()[1];
    int pad_left   = this->attribute->pad()[2];
    int pad_right  = this->attribute->pad()[3];

    int stride_h   = this->attribute->stride()[0];
    int stride_w   = this->attribute->stride()[1];
    int dilation_h = this->attribute->dilation()[0];
    int dilation_w = this->attribute->dilation()[1];

    DEBUG_INFO(OP,
               "perform OpDepthwiseConv2d, input.shape=[%d,%d,%d,%d], weight.shape=[%d,%d,%d,%d], "
               "output.shape=[%d,%d,%d,%d], stride=[%d,%d], dilation=[%d,%d], pad=[%d,%d,%d,%d]",
               in_batch, in_height, in_width, in_channels, f_height, f_width, f_in_channels, f_multiplier, out_batch,
               out_height, out_width, out_channels, stride_h, stride_w, dilation_h, dilation_w, pad_top,
               pad_bottom, pad_left, pad_right);

    // Zero-pad only the spatial H/W dimensions.
    Eigen::array<std::pair<int32_t, int32_t>, 4> pad;
    pad[0] = std::make_pair(0, 0);
    pad[1] = std::make_pair(pad_top, pad_bottom);
    pad[2] = std::make_pair(pad_left, pad_right);
    pad[3] = std::make_pair(0, 0);

    TIn input_val      = this->input->getTensor();
    TWeight weight_val = this->weight->getTensor();
    // For int8 operands, subtract zero points before accumulation.
    if (InDtype == DType_INT8 || WeightDtype == DType_INT8)
    {
        input_val  = input_val - (InEigenType)attribute->input_zp();
        weight_val = weight_val - (WeightEigenType)attribute->weight_zp();
    }

    ETensor4<InEigenType> input_padded = input_val.pad(pad);

    // GEMM doesn't fit well with DepthwiseConv2d
    // 1. use extract_image_patches() to handle stride/dilation/pad
    // 2. perform direct convolution

    // 1. extract_image_patches() output [N, KH, KW, OH * OW, IC]
    ETensor5<InEigenType> input_extract_patches = input_padded.extract_image_patches(
        f_height, f_width, stride_h, stride_w, dilation_h, dilation_w, Eigen::PADDING_VALID);

    Eigen::array<Eigen::Index, 4> reshape_dim;
    reshape_dim.fill(1);
    reshape_dim[3] = b_out_channels;

    Eigen::array<Eigen::Index, 4> bcast;
    bcast[0] = out_batch;
    bcast[1] = out_height;
    bcast[2] = out_width;
    bcast[3] = 1;

    // initialize with bias
    this->output->getTensor() = this->bias->getTensor().reshape(reshape_dim).broadcast(bcast);

    // 2. direct depthwise convolution: accumulate one filter tap at a time
    // directly into the output tensor (which already holds the bias).
    for (int ob = 0; ob < out_batch; ob++)
    {
        for (int oh = 0; oh < out_height; oh++)
        {
            for (int ow = 0; ow < out_width; ow++)
            {
                for (int ic = 0; ic < in_channels; ic++)
                {
                    for (int cm = 0; cm < f_multiplier; cm++)
                    {
                        for (int fh = 0; fh < f_height; fh++)
                        {
                            for (int fw = 0; fw < f_width; fw++)
                            {
                                // NOTE(review): the patch index 'ow * out_height + oh'
                                // relies on Eigen's (column-major) patch ordering —
                                // confirm against extract_image_patches docs before changing.
                                this->output->getTensor()(ob, oh, ow, ic * f_multiplier + cm) +=
                                    ((AccEigenType)input_extract_patches(ob, fh, fw, ow * out_height + oh, ic) *
                                     (AccEigenType)weight_val(fh, fw, ic, cm));
                            }
                        }
                    }
                }
            }
        }
    }

    // Saturate the INT48 accumulator to its representable range.
    if (AccDtype == DType_INT48)
    {
        this->output->getTensor() = this->output->getTensor().cwiseMax((AccEigenType)AccQMin);
        this->output->getTensor() = this->output->getTensor().cwiseMin((AccEigenType)AccQMax);
    }

    return GraphNode::eval();
}
1083
template <DType InDtype, DType WeightDtype>
OpFullyConnected<InDtype, WeightDtype>::OpFullyConnected(SubgraphTraverser* sgt_,
                                                         TosaAttributeBase* attribute_,
                                                         uint64_t id_)
    : GraphNode(sgt_, Op_FULLY_CONNECTED, id_)
{
    // FULLY_CONNECTED consumes input, weight and bias tensors, one output.
    setRequiredOperands(3, 1);
    // Input/weight/output are rank-2 matrices.
    setRequiredRank(2);

    // NOTE(review): presumably clones attribute_ into the 'attribute' member
    // freed by the destructor — macro defined elsewhere.
    INIT_ATTRIBUTE(FullyConnected);
}
1095
1096template <DType InDtype, DType WeightDtype>
1097OpFullyConnected<InDtype, WeightDtype>::~OpFullyConnected()
1098{
Eric Kunzeb5fabec2022-06-07 05:20:44 +00001099 if (attribute)
1100 delete attribute;
Eric Kunzee5e26762020-10-13 16:11:07 -07001101}
1102
template <DType InDtype, DType WeightDtype>
int OpFullyConnected<InDtype, WeightDtype>::checkTensorAttributes()
{
    // Validates operand/result counts, ranks, matrix-shape compatibility and
    // zero-point constraints. Returns 0 on success, 1 on failure.
    if (validateRequiredOperands())
        return 1;

    if (validateRequiredRank(inputs[0]) || validateRequiredRank(inputs[1]) || validateRequiredRank(outputs[0]))
    {
        return 1;
    }

    input  = dynamic_cast<TosaReference::TensorTemplate<TIn>*>(inputs[0]);
    weight = dynamic_cast<TosaReference::TensorTemplate<TWeight>*>(inputs[1]);
    bias   = dynamic_cast<TosaReference::TensorTemplate<TBias>*>(inputs[2]);

    // weight is [OC, IC] and is transposed at eval time, so the contraction
    // dimension of input ([N, IC]) must match weight.shape[1].
    if (input->getShape()[1] != weight->getShape()[1])
    {
        printNodeValidationError("OpFullyConnected operator input.shape[1] should match weight.shape[1]");
        return 1;
    }

    if (weight->getShape()[0] != bias->getShape()[0])
    {
        printNodeValidationError("OpFullyConnected operator bias.shape[0] should match weight.shape[0]");
        return 1;
    }

    ERROR_IF(outputs[0]->getDtype() != AccDtype,
             "OpFullyConnected: Output data type not supported for this configuration of operator");

    output = dynamic_cast<TosaReference::TensorTemplate<TAcc>*>(outputs[0]);

    // TOSA requires zero points to be 0 for all dtypes except int8.
    ERROR_IF(InDtype != DType_INT8 && attribute->input_zp() != 0, "OpFullyConnected: Input zeropoint must be zero for non int8_t data");
    ERROR_IF(WeightDtype != DType_INT8 && attribute->weight_zp() != 0, "OpFullyConnected: Weight zeropoint must be zero for non int8_t data");

    return 0;
}
1140
template <DType InDtype, DType WeightDtype>
int OpFullyConnected<InDtype, WeightDtype>::eval()
{
    // output[N, OC] = input[N, IC] x weight^T[IC, OC] + bias[OC], accumulated
    // in AccEigenType via an Eigen tensor contraction.
    typedef Eigen::Tensor<int, 1>::DimensionPair DimPair;
    // Contract input dim 1 (IC) against shuffled-weight dim 0 (IC).
    Eigen::array<DimPair, 1> dims{ { DimPair(1, 0) } };

    // Transpose weight from [OC, IC] to [IC, OC].
    Eigen::array<Eigen::Index, 2> weight_shuffle{ 1, 0 };

    // Reshape bias [OC] -> [1, OC] then broadcast over the batch dimension.
    Eigen::array<Eigen::Index, 2> bias_reshape;
    bias_reshape[0] = 1;
    bias_reshape[1] = this->bias->getShape()[0];

    Eigen::array<Eigen::Index, 2> bias_bcast;
    bias_bcast[0] = this->input->getShape()[0];
    bias_bcast[1] = 1;

    TIn input_val      = this->input->getTensor();
    TWeight weight_val = this->weight->getTensor().shuffle(weight_shuffle);
    // For int8 operands, subtract zero points before the contraction.
    if (InDtype == DType_INT8 || WeightDtype == DType_INT8)
    {
        input_val  = input_val - (InEigenType)attribute->input_zp();
        weight_val = weight_val - (WeightEigenType)attribute->weight_zp();
    }

    this->output->getTensor() =
        input_val.template cast<AccEigenType>().contract(weight_val.template cast<AccEigenType>(), dims) +
        this->bias->getTensor().reshape(bias_reshape).broadcast(bias_bcast);

    // Saturate the INT48 accumulator to its representable range.
    if (AccDtype == DType_INT48)
    {
        this->output->getTensor() = this->output->getTensor().cwiseMax((AccEigenType)AccQMin);
        this->output->getTensor() = this->output->getTensor().cwiseMin((AccEigenType)AccQMax);
    }
    return GraphNode::eval();
}
1176
template <DType Dtype>
OpMatMul<Dtype>::OpMatMul(SubgraphTraverser* sgt_,
                          TosaAttributeBase* attribute_,
                          uint64_t id_)
    : GraphNode(sgt_, Op_MATMUL, id_)
{
    // MATMUL consumes two input tensors (a, b), produces one output.
    setRequiredOperands(2, 1);
    // Batched matmul: all tensors are rank 3 ([N, H, C] x [N, C, W] -> [N, H, W]).
    setRequiredRank(3);

    // NOTE(review): presumably clones attribute_ into the 'attribute' member
    // freed by the destructor — macro defined elsewhere.
    INIT_ATTRIBUTE(MatMul);
}
1188
1189template <DType Dtype>
1190OpMatMul<Dtype>::~OpMatMul()
1191{
Eric Kunzeb5fabec2022-06-07 05:20:44 +00001192 if (attribute)
1193 delete attribute;
Eric Kunzee5e26762020-10-13 16:11:07 -07001194}
1195
1196template <DType Dtype>
1197int OpMatMul<Dtype>::checkTensorAttributes()
1198{
1199 if (validateRequiredOperands())
1200 return 1;
1201
1202 if (validateRequiredRank(inputs[0]) || validateRequiredRank(inputs[1]) || validateRequiredRank(outputs[0]))
1203 {
1204 return 1;
1205 }
1206
Kevin Chengcc61be32021-10-14 17:09:57 -07001207 ERROR_IF(outputs[0]->getDtype() != AccDtype,
Kevin Cheng80794802021-11-01 11:14:13 -07001208 "OpMatMul: Output data type not supported for this configuration of operator");
Kevin Chengcc61be32021-10-14 17:09:57 -07001209
Kevin Cheng2d60f002021-06-09 14:18:32 -07001210 a = dynamic_cast<TosaReference::TensorTemplate<TIn>*>(inputs[0]);
1211 b = dynamic_cast<TosaReference::TensorTemplate<TIn>*>(inputs[1]);
1212 output = dynamic_cast<TosaReference::TensorTemplate<TAcc>*>(outputs[0]);
Eric Kunzee5e26762020-10-13 16:11:07 -07001213
Kevin Cheng2d60f002021-06-09 14:18:32 -07001214 ASSERT_MEM(a && b && output);
1215
1216 // a: [N, H, C]
1217 // b: [N, C, W]
1218 // c: [N, H, W]
1219
1220 // Check N
1221 if (a->getShape()[0] != b->getShape()[0] || a->getShape()[0] != output->getShape()[0])
Eric Kunzee5e26762020-10-13 16:11:07 -07001222 {
Kevin Cheng2d60f002021-06-09 14:18:32 -07001223 printNodeValidationError("OpMatMul operator a.shape[0], b.shape[0] and output.shape[0] should match");
Eric Kunzee5e26762020-10-13 16:11:07 -07001224 return 1;
1225 }
Kevin Cheng2d60f002021-06-09 14:18:32 -07001226 N = a->getShape()[0];
Eric Kunzee5e26762020-10-13 16:11:07 -07001227
Kevin Cheng2d60f002021-06-09 14:18:32 -07001228 // Check C
1229 if (a->getShape()[2] != b->getShape()[1])
1230 {
1231 printNodeValidationError("OpMatMul operator a.shape[2] should match b.shape[1]");
1232 return 1;
1233 }
1234 C = a->getShape()[2];
1235
1236 // Check H
1237 if (a->getShape()[1] != output->getShape()[1])
1238 {
1239 printNodeValidationError("OpMatMul operator a.shape[1] should match output.shape[1]");
1240 return 1;
1241 }
1242 H = a->getShape()[1];
1243
1244 // Check W
1245 if (b->getShape()[2] != output->getShape()[2])
1246 {
1247 printNodeValidationError("OpMatMul operator output.shape[2] should match output.shape[2]");
1248 return 1;
1249 }
1250 W = b->getShape()[2];
Eric Kunzee5e26762020-10-13 16:11:07 -07001251
Eric Kunzeb5fabec2022-06-07 05:20:44 +00001252 ERROR_IF(Dtype != DType_INT8 && attribute->a_zp() != 0, "OpMatMul: A zeropoint must be zero for non int8_t data");
1253 ERROR_IF(Dtype != DType_INT8 && attribute->b_zp() != 0, "OpMatMul: B zeropoint must be zero for non int8_t data");
Kevin Chengcc61be32021-10-14 17:09:57 -07001254
Eric Kunzee5e26762020-10-13 16:11:07 -07001255 return 0;
1256}
1257
template <DType Dtype>
int OpMatMul<Dtype>::eval()
{
    // Batched matmul: for each batch i, output[i] = a[i] ([H, C]) x b[i] ([C, W]),
    // accumulated in AccEigenType. N/H/C/W were cached by checkTensorAttributes().
    typedef Eigen::Tensor<int, 1>::DimensionPair DimPair;
    // Contract a's dim 1 (C) against b's dim 0 (C).
    Eigen::array<DimPair, 1> dims{ { DimPair(1, 0) } };

    TIn a_val = this->a->getTensor();
    TIn b_val = this->b->getTensor();
    // For int8 operands, subtract zero points before the contraction.
    if (Dtype == DType_INT8)
    {
        a_val = a_val - (InEigenType)attribute->a_zp();
        b_val = b_val - (InEigenType)attribute->b_zp();
    }

    Eigen::array<Eigen::Index, 2> a_rank2_shape({ H, C });
    Eigen::array<Eigen::Index, 2> b_rank2_shape({ C, W });
    Eigen::array<Eigen::Index, 3> output_rank3_shape({ 1, H, W });

    Eigen::array<Eigen::Index, 3> a_size_array({ 1, H, C });
    Eigen::array<Eigen::Index, 3> b_size_array({ 1, C, W });

    Eigen::array<Eigen::Index, 3> a_begin_array({ 0, 0, 0 });
    Eigen::array<Eigen::Index, 3> b_begin_array({ 0, 0, 0 });

    // Iterate N dimension.
    for (int i = 0; i < N; i++)
    {
        // Slice out batch i of each operand and drop the batch dimension.
        a_begin_array[0] = i;
        b_begin_array[0] = i;

        TInRank2 a_rank2_val = a_val.slice(a_begin_array, a_size_array).reshape(a_rank2_shape);
        TInRank2 b_rank2_val = b_val.slice(b_begin_array, b_size_array).reshape(b_rank2_shape);
        TAccRank2 output_rank2_val =
            a_rank2_val.template cast<AccEigenType>().contract(b_rank2_val.template cast<AccEigenType>(), dims);
        TAcc output_rank3_val = output_rank2_val.reshape(output_rank3_shape);
        // NOTE(review): growing the output via concatenate() each iteration is
        // O(N^2) in copied data; correct, but a preallocated slice-assign would
        // be cheaper for large N.
        if (i == 0)
        {
            this->output->getTensor() = output_rank3_val;
        }
        else
        {
            TAcc temp = this->output->getTensor().concatenate(output_rank3_val, 0);
            this->output->getTensor() = temp;
        }
    }

    // Saturate the INT48 accumulator to its representable range.
    if (AccDtype == DType_INT48)
    {
        this->output->getTensor() = this->output->getTensor().cwiseMax((AccEigenType)AccQMin);
        this->output->getTensor() = this->output->getTensor().cwiseMin((AccEigenType)AccQMax);
    }

    return GraphNode::eval();
}
1312
template <DType Dtype>
OpMaxPool2d<Dtype>::OpMaxPool2d(SubgraphTraverser* sgt_,
                                TosaAttributeBase* attribute_,
                                uint64_t id_)
    : GraphNode(sgt_, Op_MAX_POOL2D, id_)
{
    // MAX_POOL2D consumes one input tensor and produces one output.
    setRequiredOperands(1, 1);
    // Input and output are rank-4 NHWC tensors.
    setRequiredRank(4);

    // NOTE(review): presumably clones attribute_ into the 'attribute' member
    // freed by the destructor — macro defined elsewhere.
    INIT_ATTRIBUTE(Pool);
}
1324
1325template <DType Dtype>
1326OpMaxPool2d<Dtype>::~OpMaxPool2d()
1327{
1328 if (attribute)
1329 delete attribute;
1330}
1331
template <DType Dtype>
int OpMaxPool2d<Dtype>::checkTensorAttributes()
{
    // Validates operand/result counts, ranks, type equality and the Pool
    // attribute. Returns 0 on success, 1 on failure.
    if (validateRequiredOperands())
        return 1;

    if (validateRequiredRank(inputs[0]) || validateRequiredRank(outputs[0]))
    {
        return 1;
    }

    // matchType() is nonzero on mismatch; max pooling preserves the element type.
    if (inputs[0]->matchType(*outputs[0]))
    {
        printNodeValidationError("OpMaxPool2d: input and output tensor type mismatch");
        return 1;
    }

    in  = dynamic_cast<TosaReference::TensorTemplate<TIn>*>(inputs[0]);
    out = dynamic_cast<TosaReference::TensorTemplate<TOut>*>(outputs[0]);

    // Shared pool attribute validation (pad/kernel/stride sizes and ranges).
    std::string msg;
    if (check_pool2d_attribute(attribute, in->getShape(), out->getShape(), msg))
    {
        msg = "OpMaxPool2d: " + msg;
        printNodeValidationError(msg.c_str());
        return 1;
    }

    return 0;
}
1362
template <DType Dtype>
int OpMaxPool2d<Dtype>::eval()
{
    // Max pooling over NHWC input via im2col: extract KHxKW patches, take the
    // argmax along the patch axis, then reshape back to [N, H, W, C].
    int in_batch    = this->in->getShape()[0];
    int in_height   = this->in->getShape()[1];
    int in_width    = this->in->getShape()[2];
    int in_channels = this->in->getShape()[3];

    int out_batch    = this->out->getShape()[0];
    int out_height   = this->out->getShape()[1];
    int out_width    = this->out->getShape()[2];
    int out_channels = this->out->getShape()[3];

    ERROR_IF(in_batch != out_batch, "OpMaxPool2d: tensor batch mismatch %d != %d", in_batch, out_batch);
    ERROR_IF(in_channels != out_channels, "OpMaxPool2d: tensor channel mismatch %d != %d", in_channels, out_channels);

    // pad() layout: [top, bottom, left, right].
    int pad_top    = this->attribute->pad()[0];
    int pad_bottom = this->attribute->pad()[1];
    int pad_left   = this->attribute->pad()[2];
    int pad_right  = this->attribute->pad()[3];

    int kernel_h = this->attribute->kernel()[0];
    int kernel_w = this->attribute->kernel()[1];
    int stride_h = this->attribute->stride()[0];
    int stride_w = this->attribute->stride()[1];

    DEBUG_INFO(OP,
               "perform MaxPool2d, input.shape=[%d,%d,%d,%d], output.shape=[%d,%d,%d,%d], kernel=[%d,%d], "
               "stride=[%d,%d], pad=[%d,%d,%d,%d]",
               in_batch, in_height, in_width, in_channels, out_batch, out_height, out_width, out_channels, kernel_h,
               kernel_w, stride_h, stride_w, pad_top, pad_bottom, pad_left, pad_right);

    // im2col shape: one column per output element, one row per kernel position.
    Eigen::array<Eigen::Index, 2> im2col_input_dims;
    im2col_input_dims[0] = kernel_h * kernel_w;
    im2col_input_dims[1] = out_batch * out_height * out_width * out_channels;

    Eigen::array<Eigen::Index, 4> col2im_output_dims;
    col2im_output_dims[0] = out_batch;
    col2im_output_dims[1] = out_height;
    col2im_output_dims[2] = out_width;
    col2im_output_dims[3] = out_channels;

    // Pad only the spatial H/W dimensions.
    Eigen::array<std::pair<int32_t, int32_t>, 4> pad;
    pad[0] = std::make_pair(0, 0);
    pad[1] = std::make_pair(pad_top, pad_bottom);
    pad[2] = std::make_pair(pad_left, pad_right);
    pad[3] = std::make_pair(0, 0);

    // Pad with the dtype's lowest value so padding never wins the max.
    ETensor4<InEigenType> input_padded = this->in->getTensor().pad(pad, std::numeric_limits<InEigenType>::lowest());

    // extract_image_patches() output [N, KH, KW, H * W, C]
    // transpose to [KH, KW, N, H * W, C]
    // reshape to [KH * KW, N * H * W * C]
    //
    // Set the padding value to be the most negative value that can be
    // represented by the datatype to ensure that any padding values will be equal
    // to or smaller than the actual maximum in the KH x KW patch.
    ETensor2<InEigenType> input_extract_patches =
        input_padded
            .extract_image_patches(kernel_h, kernel_w, stride_h, stride_w, 1, 1, Eigen::PADDING_VALID,
                                   std::numeric_limits<InEigenType>::lowest())
            .shuffle(Eigen::array<Eigen::Index, 5>{ 1, 2, 0, 3, 4 })
            .reshape(im2col_input_dims);

    // Get the maximum of the KHxHW patches along axis 0
    Eigen::Tensor<DenseIndex, 1> tensor_argmax = input_extract_patches.argmax(0);

    // 1D result with [N * H * W * C]
    ETensor1<OutEigenType> out_1d(this->out->getElementCount());

    // index input_patches with argmax array should give the result
    for (size_t i = 0; i < this->out->getElementCount(); i++)
    {
        out_1d(i) = (OutEigenType)input_extract_patches(tensor_argmax(i), i);
    }

    // reshape result to [N, H, W, C]
    this->out->getTensor() = out_1d.reshape(col2im_output_dims);

    return GraphNode::eval();
}
1444
Kevin Chengcc61be32021-10-14 17:09:57 -07001445template <DType InDtype, DType WeightDtype>
1446OpTransposeConv2d<InDtype, WeightDtype>::OpTransposeConv2d(SubgraphTraverser* sgt_,
1447 TosaAttributeBase* attribute_,
Kevin Chengcc61be32021-10-14 17:09:57 -07001448 uint64_t id_)
Kevin Chengacb550f2021-06-29 15:32:19 -07001449 : GraphNode(sgt_, Op_TRANSPOSE_CONV2D, id_)
Eric Kunzee5e26762020-10-13 16:11:07 -07001450{
1451 setRequiredOperands(3, 1);
1452 setRequiredRank(4);
1453
Kevin Cheng93a16282021-08-31 16:14:03 -07001454 INIT_ATTRIBUTE(TransposeConv);
Eric Kunzee5e26762020-10-13 16:11:07 -07001455}
1456
Kevin Chengcc61be32021-10-14 17:09:57 -07001457template <DType InDtype, DType WeightDtype>
1458OpTransposeConv2d<InDtype, WeightDtype>::~OpTransposeConv2d()
Eric Kunzee5e26762020-10-13 16:11:07 -07001459{
1460 if (attribute)
1461 delete attribute;
Eric Kunzee5e26762020-10-13 16:11:07 -07001462}
1463
Kevin Chengcc61be32021-10-14 17:09:57 -07001464template <DType InDtype, DType WeightDtype>
1465int OpTransposeConv2d<InDtype, WeightDtype>::checkTensorAttributes()
Eric Kunzee5e26762020-10-13 16:11:07 -07001466{
1467 if (validateRequiredOperands())
1468 return 1;
1469
1470 if (validateRequiredRank(inputs[0]) || validateRequiredRank(inputs[1]) || validateRequiredRank(outputs[0]))
1471 {
1472 return 1;
1473 }
1474
Kevin Chengcc61be32021-10-14 17:09:57 -07001475 ERROR_IF(outputs[0]->getDtype() != AccDtype,
Kevin Cheng80794802021-11-01 11:14:13 -07001476 "OpTransposeConv2d: Output data type not supported for this configuration of operator");
Kevin Chengcc61be32021-10-14 17:09:57 -07001477
Eric Kunzee5e26762020-10-13 16:11:07 -07001478 input = dynamic_cast<TosaReference::TensorTemplate<TIn>*>(inputs[0]);
1479 weight = dynamic_cast<TosaReference::TensorTemplate<TWeight>*>(inputs[1]);
1480 bias = dynamic_cast<TosaReference::TensorTemplate<TBias>*>(inputs[2]);
1481 output = dynamic_cast<TosaReference::TensorTemplate<TAcc>*>(outputs[0]);
1482
TatWai Chong24594f52022-06-08 00:48:04 -07001483 if (attribute->out_pad().size() != 4)
Eric Kunzee5e26762020-10-13 16:11:07 -07001484 {
TatWai Chong24594f52022-06-08 00:48:04 -07001485 printNodeValidationError("OpTransposeConv2d: illegal size for attribute out_pad");
Eric Kunzee5e26762020-10-13 16:11:07 -07001486 return 1;
1487 }
1488
1489 if (attribute->stride().size() != 2)
1490 {
1491 printNodeValidationError("OpTransposeConv2d: illegal size for attribute stride");
1492 return 1;
1493 }
1494
Eric Kunzee5e26762020-10-13 16:11:07 -07001495 if (attribute->output_shape().size() != 4)
1496 {
1497 printNodeValidationError("OpTransposeConv2d: illegal size for attribute output_shape");
1498 return 1;
1499 }
1500
TatWai Chong24594f52022-06-08 00:48:04 -07001501 for (int32_t i : attribute->out_pad())
Kevin Cheng9fe17242021-11-10 01:04:39 +00001502 {
1503 if (i < 0)
1504 {
1505 printNodeValidationError("OpTransposeConv2d: At least one pad is smaller than zero");
1506 return 1;
1507 }
1508 }
1509
1510 for (int32_t i : attribute->stride())
1511 {
1512 if (i < 1)
1513 {
1514 printNodeValidationError("OpTransposeConv2d: At least one stride is smaller than one");
1515 return 1;
1516 }
1517 }
1518
Eric Kunzee5e26762020-10-13 16:11:07 -07001519 for (int d = 0; d < 4; d++)
1520 {
1521 if (attribute->output_shape()[d] != this->output->getShape()[d])
1522 {
1523 printNodeValidationError("OpTransposeConv2d: illegal size for attribute output_shape");
1524 return 1;
1525 }
1526 }
1527
Jeremy Johnson4a6fb9b2022-04-26 15:47:21 +01001528 int32_t IH = input->getShape()[1];
1529 int32_t IW = input->getShape()[2];
1530 int32_t OH = output->getShape()[1];
1531 int32_t OW = output->getShape()[2];
1532
1533 int32_t stride_y = attribute->stride()[0];
1534 int32_t stride_x = attribute->stride()[1];
1535 int32_t kernel_h = weight->getShape()[1];
1536 int32_t kernel_w = weight->getShape()[2];
1537
TatWai Chong24594f52022-06-08 00:48:04 -07001538 int32_t out_pad_top = attribute->out_pad()[0];
1539 int32_t out_pad_bottom = attribute->out_pad()[1];
1540 int32_t out_pad_left = attribute->out_pad()[2];
1541 int32_t out_pad_right = attribute->out_pad()[3];
Jeremy Johnson4a6fb9b2022-04-26 15:47:21 +01001542
TatWai Chong24594f52022-06-08 00:48:04 -07001543 int32_t H = (IH - 1) * stride_y - out_pad_top - out_pad_bottom + kernel_h;
1544 int32_t W = (IW - 1) * stride_x - out_pad_left - out_pad_right + kernel_w;
Jeremy Johnson4a6fb9b2022-04-26 15:47:21 +01001545
1546 if ((OH != H) || (OW != W))
1547 {
1548 std::string msg = "OpTransposeConv2d: Mismatch between output shape provided and expected output shape (" +
1549 std::to_string(H) + "," +
1550 std::to_string(W) + ")";
1551 printNodeValidationError(msg.c_str());
1552 return 1;
1553 }
1554
Eric Kunzeb5fabec2022-06-07 05:20:44 +00001555 ERROR_IF(InDtype != DType_INT8 && attribute->input_zp() != 0, "OpTransposeConv2d: Input zeropoint must be zero for non int8_t data");
1556 ERROR_IF(WeightDtype != DType_INT8 && attribute->weight_zp() != 0, "OpTransposeConv2d: Weight zeropoint must be zero for non int8_t data");
Kevin Chengcc61be32021-10-14 17:09:57 -07001557
Eric Kunzee5e26762020-10-13 16:11:07 -07001558 return 0;
1559}
1560
Kevin Chengcc61be32021-10-14 17:09:57 -07001561template <DType InDtype, DType WeightDtype>
1562int OpTransposeConv2d<InDtype, WeightDtype>::eval()
Eric Kunzee5e26762020-10-13 16:11:07 -07001563{
1564 int in_batch = this->input->getShape()[0];
1565 int in_height = this->input->getShape()[1];
1566 int in_width = this->input->getShape()[2];
1567 int in_channels = this->input->getShape()[3];
1568
1569 int f_out_channels = this->weight->getShape()[0];
1570 int f_height = this->weight->getShape()[1];
1571 int f_width = this->weight->getShape()[2];
1572 int f_in_channels = this->weight->getShape()[3];
1573
1574 int b_out_channels = this->bias->getShape()[0];
1575
1576 int out_batch = this->output->getShape()[0];
1577 int out_height = this->output->getShape()[1];
1578 int out_width = this->output->getShape()[2];
1579 int out_channels = this->output->getShape()[3];
1580
TatWai Chong24594f52022-06-08 00:48:04 -07001581 int out_pad_top = this->attribute->out_pad()[0];
1582 int out_pad_bottom = this->attribute->out_pad()[1];
1583 int out_pad_left = this->attribute->out_pad()[2];
1584 int out_pad_right = this->attribute->out_pad()[3];
Jeremy Johnson4a6fb9b2022-04-26 15:47:21 +01001585
1586 int stride_h = this->attribute->stride()[0];
1587 int stride_w = this->attribute->stride()[1];
Eric Kunzee5e26762020-10-13 16:11:07 -07001588
Kevin Chengacb550f2021-06-29 15:32:19 -07001589 ERROR_IF(in_batch != out_batch, "OpTransposeConv2d: tensor batch mismatch %d != %d", in_batch, out_batch);
1590 ERROR_IF(f_in_channels != in_channels, "OpTransposeConv2d: tensor input channel mismatch %d != %d", f_in_channels,
1591 in_channels);
1592 ERROR_IF(f_out_channels != out_channels, "OpTransposeConv2d: tensor output channel mismatch %d != %d",
1593 f_out_channels, out_channels);
1594 ERROR_IF(b_out_channels != out_channels, "OpDepthwiseConv2d: bias channels mismatch %d != %d", b_out_channels,
1595 out_channels);
Eric Kunzee5e26762020-10-13 16:11:07 -07001596
1597 DEBUG_INFO(OP,
1598 "perform OpTransposeConv2d, input.shape=[%d,%d,%d,%d], weight.shape=[%d,%d,%d,%d], "
TatWai Chong24594f52022-06-08 00:48:04 -07001599 "output.shape=[%d,%d,%d,%d], stride=[%d,%d], out_pad=[%d,%d,%d,%d]",
Jeremy Johnson4a6fb9b2022-04-26 15:47:21 +01001600 in_batch, in_height, in_width, in_channels, f_height, f_width, f_out_channels, f_in_channels,
TatWai Chong24594f52022-06-08 00:48:04 -07001601 out_batch, out_height, out_width, out_channels, stride_h, stride_w, out_pad_top,
1602 out_pad_bottom, out_pad_left, out_pad_right);
Eric Kunzee5e26762020-10-13 16:11:07 -07001603
1604 TIn input_val = this->input->getTensor();
1605 TWeight weight_val = this->weight->getTensor();
Eric Kunzef7337832022-06-17 08:19:12 -07001606 if (InDtype == DType_INT8 || WeightDtype == DType_INT8)
Eric Kunzee5e26762020-10-13 16:11:07 -07001607 {
Eric Kunzeb5fabec2022-06-07 05:20:44 +00001608 input_val = input_val - (InEigenType)attribute->input_zp();
1609 weight_val = weight_val - (WeightEigenType)attribute->weight_zp();
Eric Kunzee5e26762020-10-13 16:11:07 -07001610 }
1611
1612 Eigen::array<Eigen::Index, 4> reshape_dim;
1613 reshape_dim.fill(1);
1614 reshape_dim[3] = b_out_channels;
1615
1616 Eigen::array<Eigen::Index, 4> bcast;
1617 bcast[0] = out_batch;
1618 bcast[1] = out_height;
1619 bcast[2] = out_width;
1620 bcast[3] = 1;
1621
1622 // initialize with bias
1623 this->output->getTensor() = this->bias->getTensor().reshape(reshape_dim).broadcast(bcast);
1624
1625 int out_x_origin, out_y_origin;
1626 int out_x, out_y;
1627
1628 // reference implementation from: tensorflow/tensorflow/lite/kernels/internal/reference/reference_ops.h
1629 for (int ob = 0; ob < out_batch; ob++)
1630 {
1631 for (int ih = 0; ih < in_height; ih++)
1632 {
1633 for (int iw = 0; iw < in_width; iw++)
1634 {
TatWai Chong24594f52022-06-08 00:48:04 -07001635 out_x_origin = iw * stride_w - out_pad_left;
1636 out_y_origin = ih * stride_h - out_pad_top;
Eric Kunzee5e26762020-10-13 16:11:07 -07001637 for (int ic = 0; ic < in_channels; ic++)
1638 {
1639 for (int fh = 0; fh < f_height; fh++)
1640 {
1641 for (int fw = 0; fw < f_width; fw++)
1642 {
Jeremy Johnson4a6fb9b2022-04-26 15:47:21 +01001643 out_x = out_x_origin + fw;
1644 out_y = out_y_origin + fh;
Eric Kunzee5e26762020-10-13 16:11:07 -07001645 for (int oc = 0; oc < out_channels; oc++)
1646 {
1647 if ((out_x >= 0 && out_x < out_width) && (out_y >= 0 && out_y < out_height))
1648 {
1649 this->output->getTensor()(ob, out_y, out_x, oc) +=
1650 ((AccEigenType)input_val(ob, ih, iw, ic) *
1651 (AccEigenType)weight_val(oc, fh, fw, ic));
1652 }
1653 }
1654 }
1655 }
1656 }
1657 }
1658 }
1659 }
1660
1661 if (AccDtype == DType_INT48)
1662 {
1663 this->output->getTensor() = this->output->getTensor().cwiseMax((AccEigenType)AccQMin);
1664 this->output->getTensor() = this->output->getTensor().cwiseMin((AccEigenType)AccQMax);
1665 }
1666
1667 return GraphNode::eval();
1668}
1669
// template explicit instantiation
// Each DEF_INSTANTIATE_* macro invocation emits the explicit template
// instantiation(s) of the named operator for one supported dtype combination
// (single-type ops take one dtype; conv-style ops take input and weight
// dtypes). The operator implementations above are only compiled for the
// combinations listed here.
DEF_INSTANTIATE_RANK1_6_ONE_RANK_ONE_TYPE(OpArgMax, FLOAT);
DEF_INSTANTIATE_RANK1_6_ONE_RANK_ONE_TYPE(OpArgMax, INT8);
DEF_INSTANTIATE_RANK1_6_ONE_RANK_ONE_TYPE(OpArgMax, INT16);

DEF_INSTANTIATE_ONE_TYPE(OpAvgPool2d, FLOAT)
DEF_INSTANTIATE_ONE_TYPE(OpAvgPool2d, INT8)
DEF_INSTANTIATE_ONE_TYPE(OpAvgPool2d, INT16)

DEF_INSTANTIATE_TWO_TYPE(OpConv2d, FLOAT, FLOAT);
DEF_INSTANTIATE_TWO_TYPE(OpConv2d, INT8, INT4);
DEF_INSTANTIATE_TWO_TYPE(OpConv2d, INT8, INT8);
DEF_INSTANTIATE_TWO_TYPE(OpConv2d, INT16, INT8);

DEF_INSTANTIATE_TWO_TYPE(OpConv3d, FLOAT, FLOAT);
DEF_INSTANTIATE_TWO_TYPE(OpConv3d, INT8, INT4);
DEF_INSTANTIATE_TWO_TYPE(OpConv3d, INT8, INT8);
DEF_INSTANTIATE_TWO_TYPE(OpConv3d, INT16, INT8);

DEF_INSTANTIATE_TWO_TYPE(OpDepthwiseConv2d, FLOAT, FLOAT);
DEF_INSTANTIATE_TWO_TYPE(OpDepthwiseConv2d, INT8, INT4);
DEF_INSTANTIATE_TWO_TYPE(OpDepthwiseConv2d, INT8, INT8);
DEF_INSTANTIATE_TWO_TYPE(OpDepthwiseConv2d, INT16, INT8);

DEF_INSTANTIATE_TWO_TYPE(OpFullyConnected, FLOAT, FLOAT);
DEF_INSTANTIATE_TWO_TYPE(OpFullyConnected, INT8, INT4);
DEF_INSTANTIATE_TWO_TYPE(OpFullyConnected, INT8, INT8);
DEF_INSTANTIATE_TWO_TYPE(OpFullyConnected, INT16, INT8);

DEF_INSTANTIATE_ONE_TYPE(OpMatMul, INT8);
DEF_INSTANTIATE_ONE_TYPE(OpMatMul, INT16);
DEF_INSTANTIATE_ONE_TYPE(OpMatMul, FLOAT);

DEF_INSTANTIATE_ONE_TYPE(OpMaxPool2d, FLOAT);
DEF_INSTANTIATE_ONE_TYPE(OpMaxPool2d, INT8);
DEF_INSTANTIATE_ONE_TYPE(OpMaxPool2d, INT16);

DEF_INSTANTIATE_TWO_TYPE(OpTransposeConv2d, FLOAT, FLOAT);
DEF_INSTANTIATE_TWO_TYPE(OpTransposeConv2d, INT8, INT4);
DEF_INSTANTIATE_TWO_TYPE(OpTransposeConv2d, INT8, INT8);
DEF_INSTANTIATE_TWO_TYPE(OpTransposeConv2d, INT16, INT8);