Blame - reference_model/src/ops/tensor_ops.cc - tosa/reference_model

2020-10-13 16:11:07 -0700

[diff] [blame]

471

{

472

ETensor1<int32_t> result(out_size);

473

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

474

result.setConstant(kernel_size);

475

Eric Kunze

830add4

2022-01-25 22:56:46 -0800

[diff] [blame]

476

// adjust divisors on the left side for padding

477

// We start at the leftmost output element, and remove pad_left - (index * stride) elements

478

// until we have no more padding being used

Eric Kunze

67a9155

2022-02-02 11:27:21 -0800

[diff] [blame]

479

for(int index = 0; (index <= pad_left / stride) && (index < out_size); index++) {

Eric Kunze

830add4

2022-01-25 22:56:46 -0800

[diff] [blame]

480

int32_t adjust = pad_left - (index * stride);

481

result(index) -= adjust;

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

482

}

483

Eric Kunze

830add4

2022-01-25 22:56:46 -0800

[diff] [blame]

484

// The process repeats on the right side. Padding starts taking effect as we

485

// near the rightmost input element. The first output element which touches

486

// padding is defined in the initialization of index below. Then we keep moving

487

// to the right, increasing padding until we get to the last output element.

488

int index = std::max(0, ((pad_left + in_size - kernel_size) / stride) + 1);

489

for (; index < out_size; index++) {

490

int32_t adjust = ((index * stride) + kernel_size) - (pad_left + in_size);

491

result(index) -= adjust;

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

492

}

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

return result;

}

// assuming input and output tensor have same scales like tflite reference

497

// so no need to scale input and output

James Ward

2022-08-12 20:48:56 +0100

[diff] [blame]

498

template <DType Dtype, DType AccDtype>

499

int OpAvgPool2d<Dtype, AccDtype>::eval()

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

500

{

501

int in_batch = this->in->getShape()[0];

502

int in_height = this->in->getShape()[1];

503

int in_width = this->in->getShape()[2];

504

int in_channels = this->in->getShape()[3];

505

506

int out_batch = this->out->getShape()[0];

507

int out_height = this->out->getShape()[1];

508

int out_width = this->out->getShape()[2];

509

int out_channels = this->out->getShape()[3];

510

Kevin Cheng

2021-06-29 15:32:19 -0700

[diff] [blame]

511

ERROR_IF(in_batch != out_batch, "OpAvgPool2d: tensor batch mismatch %d != %d", in_batch, out_batch);

512

ERROR_IF(in_channels != out_channels, "OpAvgPool2d: tensor channel mismatch %d != %d", in_channels, out_channels);

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

513

TatWai Chong

2022-06-06 20:46:01 -0700

[diff] [blame]

514

int pad_top = this->attribute->pad()[0];

515

int pad_bottom = this->attribute->pad()[1];

516

int pad_left = this->attribute->pad()[2];

517

int pad_right = this->attribute->pad()[3];

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

518

int kernel_h = this->attribute->kernel()[0];

519

int kernel_w = this->attribute->kernel()[1];

520

int stride_h = this->attribute->stride()[0];

521

int stride_w = this->attribute->stride()[1];

522

James Ward

2022-08-12 20:48:56 +0100

[diff] [blame]

523

tosa::DType accum_dtype = (tosa::DType)this->attribute->accum_dtype();

524

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

525

DEBUG_INFO(OP,

526

"perform AvgPool2d, input.shape=[%d,%d,%d,%d], output.shape=[%d,%d,%d,%d], kernel=[%d,%d], "

James Ward

2022-08-12 20:48:56 +0100

[diff] [blame]

527

"stride=[%d,%d], pad=[%d,%d,%d,%d], accum_dtype=%s",

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

528

in_batch, in_height, in_width, in_channels, out_batch, out_height, out_width, out_channels, kernel_h,

James Ward

2022-08-12 20:48:56 +0100

[diff] [blame]

529

kernel_w, stride_h, stride_w, pad_top, pad_bottom, pad_left, pad_right, EnumNamesDType()[accum_dtype]);

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

530

531

Eigen::array<Eigen::Index, 2> im2col_input_dims;

532

im2col_input_dims[0] = kernel_h * kernel_w;

533

im2col_input_dims[1] = out_batch * out_height * out_width * out_channels;

534

535

Eigen::array<Eigen::Index, 4> col2im_output_dims;

536

col2im_output_dims[0] = out_batch;

537

col2im_output_dims[1] = out_height;

538

col2im_output_dims[2] = out_width;

539

col2im_output_dims[3] = out_channels;

540

TatWai Chong

2022-06-06 20:46:01 -0700

[diff] [blame]

541

Eigen::array<std::pair<int32_t, int32_t>, 4> pad;

542

pad[0] = std::make_pair(0, 0);

543

pad[1] = std::make_pair(pad_top, pad_bottom);

544

pad[2] = std::make_pair(pad_left, pad_right);

545

pad[3] = std::make_pair(0, 0);

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

546

547

ETensor4<InEigenType> input_val = this->in->getTensor();

Eric Kunze

2022-06-07 05:20:44 +0000

[diff] [blame]

548

if (Dtype == DType_INT8)

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

549

{

Eric Kunze

2022-06-07 05:20:44 +0000

[diff] [blame]

550

input_val = input_val - (InEigenType)attribute->input_zp();

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

551

}

552

TatWai Chong

2022-06-06 20:46:01 -0700

[diff] [blame]

553

ETensor4<InEigenType> input_padded = input_val.pad(pad);

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

554

555

// assuming input and output have same scales

556

// so input and output scaling is not required

557

// TODO: check if this assumption TOSA made

558

559

// extract_image_patches() output [N, KH, KW, H * W, C]

560

// transpose to [KH, KW, N, H * W, C]

561

// reshape to [KH * KW, N * H * W * C]

562

ETensor2<InEigenType> input_extract_patches =

563

input_padded.extract_image_patches(kernel_h, kernel_w, stride_h, stride_w, 1, 1, Eigen::PADDING_VALID)

564

.shuffle(Eigen::array<Eigen::Index, 5>{ 1, 2, 0, 3, 4 })

565

.reshape(im2col_input_dims);

566

567

// 1D result with [N * H * W * C]

568

ETensor1<AccEigenType> out_1d(this->out->getElementCount());

out_1d.setZero();

// sum pool

for (size_t i = 0; i < this->out->getElementCount(); i++)

573

{

574

for (int32_t j = 0; j < kernel_h * kernel_w; j++)

575

{

576

out_1d(i) += (AccEigenType)input_extract_patches(j, i);

}

}

// reshape result to [N, H, W, C] and divide with div_map

581

ETensor4<AccEigenType> sum = out_1d.reshape(col2im_output_dims);

582

583

// calculate 1d height/width div_map (number of elements this pooling window covers)

584

// and outer product to get 2d div_map, then reshape/broadcast to [N, H, W, C]

TatWai Chong

2022-06-06 20:46:01 -0700

[diff] [blame]

585

ETensor1<int32_t> div_map_h = calculate_div_map_1d(in_height, out_height, kernel_h, stride_h, pad_top, pad_bottom);

586

ETensor1<int32_t> div_map_w = calculate_div_map_1d(in_width, out_width, kernel_w, stride_w, pad_left, pad_right);

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

587

Eigen::array<Eigen::IndexPair<Eigen::Index>, 1> contract_dims = { Eigen::IndexPair<Eigen::Index>(1, 0) };

588

Eigen::array<Eigen::Index, 4> bcast{ out_batch, 1, 1, out_channels };

589

James Ward

2022-10-19 12:20:31 +0100

[diff] [blame]

590

ETensor2<int32_t> dm2_w = div_map_w.reshape(Eigen::array<Eigen::Index, 2>{ 1, out_width });

591

ETensor2<int32_t> dm2_h = div_map_h.reshape(Eigen::array<Eigen::Index, 2>{ out_height, 1 });

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

592

ETensor4<int32_t> div_map =

James Ward

2022-10-19 12:20:31 +0100

[diff] [blame]

593

dm2_h.contract(dm2_w, contract_dims)

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

594

.reshape(Eigen::array<Eigen::Index, 4>{ 1, out_height, out_width, 1 })

595

.broadcast(bcast);

James Ward

2022-10-19 12:20:31 +0100

[diff] [blame]

596

if (Dtype != DType_FP32 && Dtype != DType_FP16 && Dtype != DType_BF16)

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

597

{

Kevin Cheng

2021-06-29 15:32:19 -0700

[diff] [blame]

598

try

599

{

600

this->out->getTensor() = sum.binaryExpr(div_map, [](AccEigenType value, int32_t div) -> OutEigenType {

601

int32_t multiplier, shift;

602

TosaReference::QuantUtil::reciprocal_scale(div, multiplier, shift);

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

603

Kevin Cheng

2021-06-29 15:32:19 -0700

[diff] [blame]

604

return (OutEigenType)TosaReference::QuantUtil::apply_scale_32(value, multiplier, shift, false);

605

});

606

}

607

catch (std::string desc)

608

{

609

REQUIRE(false, "OpAvgPool2d apply_scale_32() fails: %s.", desc.c_str());

610

}

Eric Kunze

2022-06-07 05:20:44 +0000

[diff] [blame]

611

this->out->getTensor() = this->out->getTensor() + (OutEigenType)(attribute->output_zp());

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

612

this->out->getTensor() = this->out->getTensor().cwiseMax((OutEigenType)QMin);

613

this->out->getTensor() = this->out->getTensor().cwiseMin((OutEigenType)QMax);

614

}

615

else

616

{

James Ward

2022-10-19 12:20:31 +0100

[diff] [blame]

617

// Case for float-types

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

618

this->out->getTensor() = (sum / div_map.template cast<AccEigenType>()).template cast<OutEigenType>();

619

}

620

621

return GraphNode::eval();

622

}

623

James Ward

2023-01-18 14:51:25 +0000

[diff] [blame]

624

template <DType InDtype, DType WeightDtype, DType OutDtype>

625

OpConv2d<InDtype, WeightDtype, OutDtype>::OpConv2d(SubgraphTraverser* sgt_,

Kevin Cheng

2021-06-29 15:32:19 -0700

[diff] [blame]

626

TosaAttributeBase* attribute_,

Kevin Cheng

2021-06-29 15:32:19 -0700

[diff] [blame]

627

uint64_t id_)

628

: GraphNode(sgt_, Op_CONV2D, id_)

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

629

{

630

setRequiredOperands(3, 1);

631

setRequiredRank(4);

632

Kevin Cheng

2021-08-31 16:14:03 -0700

[diff] [blame]

633

INIT_ATTRIBUTE(Conv);

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

634

}

635

James Ward

2023-01-18 14:51:25 +0000

[diff] [blame]

636

template <DType InDtype, DType WeightDtype, DType OutDtype>

637

OpConv2d<InDtype, WeightDtype, OutDtype>::~OpConv2d()

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

638

{

639

if (attribute)

640

delete attribute;

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

641

}

642

James Ward

2023-01-18 14:51:25 +0000

[diff] [blame]

643

template <DType InDtype, DType WeightDtype, DType OutDtype>

644

int OpConv2d<InDtype, WeightDtype, OutDtype>::checkTensorAttributes()

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

645

{

646

if (validateRequiredOperands())

647

return 1;

648

649

if (validateRequiredRank(inputs[0]) || validateRequiredRank(inputs[1]) || validateRequiredRank(outputs[0]))

{

return 1;

}

// 'bias' checked separatedly since it doens't make sense to make required rank ranging from 1 to 4

655

if (inputs[2]->getRank() != 1)

656

{

657

printNodeValidationError("OpConv2d: bias tensor must be rank 1");

658

}

659

James Ward

2023-01-18 14:51:25 +0000

[diff] [blame]

660

ERROR_IF(outputs[0]->getDtype() != OutDtype,

James Ward

2022-08-12 20:48:56 +0100

[diff] [blame]

661

"OpConv2d: Output data type not supported for this configuration of operator");

Kevin Cheng

2021-10-14 17:09:57 -0700

[diff] [blame]

662

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

663

input = dynamic_cast<TosaReference::TensorTemplate<TIn>*>(inputs[0]);

664

weight = dynamic_cast<TosaReference::TensorTemplate<TWeight>*>(inputs[1]);

665

bias = dynamic_cast<TosaReference::TensorTemplate<TBias>*>(inputs[2]);

James Ward

2022-08-12 20:48:56 +0100

[diff] [blame]

666

output = dynamic_cast<TosaReference::TensorTemplate<TOut>*>(outputs[0]);

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

667

Kevin Cheng

2021-11-10 01:04:39 +0000

[diff] [blame]

668

std::string msg;

Eric Kunze

2022-06-07 05:20:44 +0000

[diff] [blame]

669

if (check_conv_attribute(attribute, 2 /* conv_dimension */, input->getShape(), output->getShape(),

Jeremy Johnson

2022-04-26 15:47:21 +0100

[diff] [blame]

670

weight->getShape(), 1 /* offset_kernel */, InDtype, WeightDtype, msg))

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

671

{

Kevin Cheng

2021-11-10 01:04:39 +0000

[diff] [blame]

672

msg = "OpConv2d: " + msg;

673

printNodeValidationError(msg.c_str());

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

return 1;

}

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

return 0;

}

James Ward

2023-01-18 14:51:25 +0000

[diff] [blame]

680

template <DType InDtype, DType WeightDtype, DType OutDtype>

681

int OpConv2d<InDtype, WeightDtype, OutDtype>::eval()

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

682

{

683

int in_batch = this->input->getShape()[0];

684

int in_height = this->input->getShape()[1];

685

int in_width = this->input->getShape()[2];

686

int in_channels = this->input->getShape()[3];

687

688

int f_out_channels = this->weight->getShape()[0];

689

int f_height = this->weight->getShape()[1];

690

int f_width = this->weight->getShape()[2];

691

int f_in_channels = this->weight->getShape()[3];

692

693

int b_out_channels = this->bias->getShape()[0];

694

695

int out_batch = this->output->getShape()[0];

696

int out_height = this->output->getShape()[1];

697

int out_width = this->output->getShape()[2];

698

int out_channels = this->output->getShape()[3];

699

Kevin Cheng

2021-06-29 15:32:19 -0700

[diff] [blame]

700

ERROR_IF(in_batch != out_batch, "OpConv2d: tensor batch mismatch %d != %d", in_batch, out_batch);

701

ERROR_IF(f_in_channels != in_channels, "OpConv2d: tensor input channel mismatch %d != %d", f_in_channels,

702

in_channels);

703

ERROR_IF(f_out_channels != out_channels, "OpConv2d: tensor output channel mismatch %d != %d", f_out_channels,

704

out_channels);

705

ERROR_IF(b_out_channels != out_channels, "OpConv2d: bias channel mismatch %d != %d", b_out_channels, out_channels);

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

706

TatWai Chong

2022-06-06 20:46:01 -0700

[diff] [blame]

707

int pad_top = this->attribute->pad()[0];

708

int pad_bottom = this->attribute->pad()[1];

709

int pad_left = this->attribute->pad()[2];

710

int pad_right = this->attribute->pad()[3];

711

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

712

int stride_h = this->attribute->stride()[0];

713

int stride_w = this->attribute->stride()[1];

714

int dilation_h = this->attribute->dilation()[0];

715

int dilation_w = this->attribute->dilation()[1];

716

717

DEBUG_INFO(OP,

718

"perform OpConv2d, input.shape=[%d,%d,%d,%d], weight.shape=[%d,%d,%d,%d], output.shape=[%d,%d,%d,%d], "

James Ward

2023-01-18 14:51:25 +0000

[diff] [blame]

719

"stride=[%d,%d], dilation=[%d,%d], pad=[%d,%d,%d,%d]",

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

720

in_batch, in_height, in_width, in_channels, f_height, f_width, f_in_channels, f_out_channels, out_batch,

TatWai Chong

2022-06-06 20:46:01 -0700

[diff] [blame]

721

out_height, out_width, out_channels, stride_h, stride_w, dilation_h, dilation_w, pad_top,

James Ward

2023-01-18 14:51:25 +0000

[diff] [blame]

722

pad_bottom, pad_left, pad_right);

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

723

724

// GEMM-conv2d, left matrix is input, right matrix is weight

725

Eigen::array<Eigen::Index, 2> im2col_input_dims;

726

im2col_input_dims[0] = out_batch * out_height * out_width;

727

im2col_input_dims[1] = f_height * f_width * f_in_channels;

728

729

Eigen::array<Eigen::Index, 2> im2col_weight_dims;

730

im2col_weight_dims[0] = f_height * f_width * f_in_channels;

731

im2col_weight_dims[1] = f_out_channels;

732

733

Eigen::array<Eigen::Index, 2> bias_reshaped_dims;

734

bias_reshaped_dims[0] = 1;

735

bias_reshaped_dims[1] = b_out_channels;

736

737

Eigen::array<Eigen::Index, 4> weight_zp_bcast_dims;

738

weight_zp_bcast_dims[0] = f_height;

739

weight_zp_bcast_dims[1] = f_width;

740

weight_zp_bcast_dims[2] = f_in_channels;

741

742

Eigen::array<Eigen::Index, 2> bias_bcast_dims;

743

bias_bcast_dims[0] = out_batch * out_height * out_width;

744

bias_bcast_dims[1] = 1;

745

746

Eigen::array<Eigen::Index, 4> col2im_output_dims;

747

col2im_output_dims[0] = out_batch;

748

col2im_output_dims[1] = out_height;

749

col2im_output_dims[2] = out_width;

750

col2im_output_dims[3] = out_channels;

751

752

Eigen::array<Eigen::IndexPair<Eigen::Index>, 1> contract_dims = { Eigen::IndexPair<Eigen::Index>(1, 0) };

753

TatWai Chong

2022-06-06 20:46:01 -0700

[diff] [blame]

754

Eigen::array<std::pair<int32_t, int32_t>, 4> pad;

755

pad[0] = std::make_pair(0, 0);

756

pad[1] = std::make_pair(pad_top, pad_bottom);

757

pad[2] = std::make_pair(pad_left, pad_right);

758

pad[3] = std::make_pair(0, 0);

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

759

760

TIn input_val = this->input->getTensor();

761

TWeight weight_val = this->weight->getTensor();

Eric Kunze

2022-06-17 08:19:12 -0700

[diff] [blame]

762

if (InDtype == DType_INT8 || WeightDtype == DType_INT8)

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

763

{

Eric Kunze

2022-06-07 05:20:44 +0000

[diff] [blame]

764

input_val = input_val - (InEigenType)attribute->input_zp();

765

weight_val = weight_val - (WeightEigenType)attribute->weight_zp();

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

766

}

767

TatWai Chong

2022-06-06 20:46:01 -0700

[diff] [blame]

768

ETensor4<InEigenType> input_padded = input_val.pad(pad);

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

769

770

// extract_image_patches() output [N, KH, KW, H * W, C]

771

// need to transpose to [N, H * W, KH, KW, C]

772

ETensor5<InEigenType> input_extract_patches =

773

input_padded

774

.extract_image_patches(f_height, f_width, stride_h, stride_w, dilation_h, dilation_w, Eigen::PADDING_VALID)

775

.shuffle(Eigen::array<Eigen::Index, 5>{ 0, 3, 1, 2, 4 });

776

777

// reshape input to [N * H * W, KH * KW * C]

778

ETensor2<InEigenType> im2col_input = input_extract_patches.reshape(im2col_input_dims);

779

780

// transpose and reshape weight from [OC, H, W, IC] to [H * W * IC, OC]

781

ETensor2<WeightEigenType> im2col_weight =

James Ward

2022-08-12 20:48:56 +0100

[diff] [blame]

782

weight_val.shuffle(Eigen::array<Eigen::Index, 4>({ 1, 2, 3, 0 })).reshape(im2col_weight_dims);

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

783

784

// don't need to apply bias_multiplier ( * bias_scale and >> bias_shift) since tflite already scale it

785

// and reshaped from [C] to [1, C], and broadcast to [N * H * W, C]

James Ward

2022-08-12 20:48:56 +0100

[diff] [blame]

786

ETensor2<OutEigenType> bias_2d = (this->bias->getTensor().reshape(bias_reshaped_dims).broadcast(bias_bcast_dims)).template cast<OutEigenType>();

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

787

788

// output matrix is [N * H * W, C]

James Ward

2022-08-12 20:48:56 +0100

[diff] [blame]

789

ETensor2<OutEigenType> contracted_result =

790

(im2col_input.template cast<AccEigenType>().contract(im2col_weight.template cast<AccEigenType>(), contract_dims)).template cast<OutEigenType>();

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

791

792

// adding bias

James Ward

2022-08-12 20:48:56 +0100

[diff] [blame]

793

ETensor2<OutEigenType> biased_output = contracted_result + bias_2d;

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

794

795

// reshape back to [N, H, W, C]

796

this->output->getTensor() = biased_output.reshape(col2im_output_dims);

797

James Ward

2023-01-18 14:51:25 +0000

[diff] [blame]

798

if (OutDtype == DType_INT48)

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

799

{

James Ward

2022-08-12 20:48:56 +0100

[diff] [blame]

800

this->output->getTensor() = this->output->getTensor().cwiseMax((OutEigenType)AccQMin);

801

this->output->getTensor() = this->output->getTensor().cwiseMin((OutEigenType)AccQMax);

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

802

}

803

804

return GraphNode::eval();

805

}

806

James Ward

2023-01-18 14:51:25 +0000

[diff] [blame]

807

template <DType InDtype, DType WeightDtype, DType OutDtype>

808

OpConv3d<InDtype, WeightDtype, OutDtype>::OpConv3d(SubgraphTraverser* sgt_,

Kevin Cheng

2021-09-01 12:51:58 -0700

[diff] [blame]

809

TosaAttributeBase* attribute_,

Kevin Cheng

2021-09-01 12:51:58 -0700

[diff] [blame]

810

uint64_t id_)

811

: GraphNode(sgt_, Op_CONV3D, id_)

812

{

813

setRequiredOperands(3, 1);

814

setRequiredRank(5);

815

816

INIT_ATTRIBUTE(Conv);

Kevin Cheng

2021-09-01 12:51:58 -0700

[diff] [blame]

817

}

818

James Ward

2023-01-18 14:51:25 +0000

[diff] [blame]

819

template <DType InDtype, DType WeightDtype, DType OutDtype>

820

OpConv3d<InDtype, WeightDtype, OutDtype>::~OpConv3d()

Kevin Cheng

2021-09-01 12:51:58 -0700

[diff] [blame]

821

{

822

if (attribute)

823

delete attribute;

Kevin Cheng

2021-09-01 12:51:58 -0700

[diff] [blame]

824

}

825

James Ward

2023-01-18 14:51:25 +0000

[diff] [blame]

826

template <DType InDtype, DType WeightDtype, DType OutDtype>

827

int OpConv3d<InDtype, WeightDtype, OutDtype>::checkTensorAttributes()

Kevin Cheng

2021-09-01 12:51:58 -0700

[diff] [blame]

828

{

829

if (validateRequiredOperands())

830

return 1;

831

832

if (validateRequiredRank(inputs[0]) || validateRequiredRank(inputs[1]) || validateRequiredRank(outputs[0]))

{

return 1;

}

// 'bias' checked separatedly since it doens't make sense to make required rank ranging from 1 to 4

838

if (inputs[2]->getRank() != 1)

839

{

840

printNodeValidationError("OpConv3d: bias tensor must be rank 1");

841

}

842

James Ward

2023-01-18 14:51:25 +0000

[diff] [blame]

843

ERROR_IF(outputs[0]->getDtype() != OutDtype,

James Ward

2022-08-12 20:48:56 +0100

[diff] [blame]

844

"OpConv3d: Output data type not supported for this configuration of operator");

Kevin Cheng

2021-10-14 17:09:57 -0700

[diff] [blame]

845

Kevin Cheng

2021-09-01 12:51:58 -0700

[diff] [blame]

846

input = dynamic_cast<TosaReference::TensorTemplate<TIn>*>(inputs[0]);

847

weight = dynamic_cast<TosaReference::TensorTemplate<TWeight>*>(inputs[1]);

848

bias = dynamic_cast<TosaReference::TensorTemplate<TBias>*>(inputs[2]);

James Ward

2022-08-12 20:48:56 +0100

[diff] [blame]

849

output = dynamic_cast<TosaReference::TensorTemplate<TOut>*>(outputs[0]);

Kevin Cheng

2021-09-01 12:51:58 -0700

[diff] [blame]

850

Kevin Cheng

2021-11-10 01:04:39 +0000

[diff] [blame]

851

std::string msg;

Eric Kunze

2022-06-07 05:20:44 +0000

[diff] [blame]

852

if (check_conv_attribute(attribute, 3 /* conv_dimension */, input->getShape(), output->getShape(),

Jeremy Johnson

2022-04-26 15:47:21 +0100

[diff] [blame]

853

weight->getShape(), 1 /* offset_kernel */, InDtype, WeightDtype, msg))

Kevin Cheng

2021-09-01 12:51:58 -0700

[diff] [blame]

854

{

Kevin Cheng

2021-11-10 01:04:39 +0000

[diff] [blame]

855

msg = "OpConv3d: " + msg;

856

printNodeValidationError(msg.c_str());

Kevin Cheng

2021-09-01 12:51:58 -0700

[diff] [blame]

return 1;

}

Kevin Cheng

2021-09-01 12:51:58 -0700

[diff] [blame]

return 0;

}

James Ward

2023-01-18 14:51:25 +0000

[diff] [blame]

863

template <DType InDtype, DType WeightDtype, DType OutDtype>

864

int OpConv3d<InDtype, WeightDtype, OutDtype>::eval()

Kevin Cheng

2021-09-01 12:51:58 -0700

[diff] [blame]

865

{

866

int in_batch = this->input->getShape()[0];

867

int in_depth = this->input->getShape()[1];

868

int in_height = this->input->getShape()[2];

869

int in_width = this->input->getShape()[3];

870

int in_channels = this->input->getShape()[4];

871

872

int f_out_channels = this->weight->getShape()[0];

873

int f_depth = this->weight->getShape()[1];

874

int f_height = this->weight->getShape()[2];

875

int f_width = this->weight->getShape()[3];

876

int f_in_channels = this->weight->getShape()[4];

877

878

int b_out_channels = this->bias->getShape()[0];

879

880

int out_batch = this->output->getShape()[0];

881

int out_depth = this->output->getShape()[1];

882

int out_height = this->output->getShape()[2];

883

int out_width = this->output->getShape()[3];

884

int out_channels = this->output->getShape()[4];

885

886

ERROR_IF(in_batch != out_batch, "OpConv3d: tensor batch mismatch %d != %d", in_batch, out_batch);

887

ERROR_IF(f_in_channels != in_channels, "OpConv3d: tensor input channel mismatch %d != %d", f_in_channels,

888

in_channels);

889

ERROR_IF(f_out_channels != out_channels, "OpConv3d: tensor output channel mismatch %d != %d", f_out_channels,

890

out_channels);

891

ERROR_IF(b_out_channels != out_channels, "OpConv3d: bias channel mismatch %d != %d", b_out_channels, out_channels);

892

TatWai Chong

2022-06-06 20:46:01 -0700

[diff] [blame]

893

int pad_d0 = this->attribute->pad()[0];

894

int pad_d1 = this->attribute->pad()[1];

895

int pad_top = this->attribute->pad()[2];

896

int pad_bottom = this->attribute->pad()[3];

897

int pad_left = this->attribute->pad()[4];

898

int pad_right = this->attribute->pad()[5];

899

Kevin Cheng

2021-09-01 12:51:58 -0700

[diff] [blame]

900

int stride_d = this->attribute->stride()[0];

901

int stride_h = this->attribute->stride()[1];

902

int stride_w = this->attribute->stride()[2];

TatWai Chong

2022-06-06 20:46:01 -0700

[diff] [blame]

903

Kevin Cheng

2021-09-01 12:51:58 -0700

[diff] [blame]

904

int dilation_d = this->attribute->dilation()[0];

905

int dilation_h = this->attribute->dilation()[1];

906

int dilation_w = this->attribute->dilation()[2];

DEBUG_INFO(

OP,

"perform OpConv3d, input.shape=[%d,%d,%d,%d,%d], weight.shape=[%d,%d,%d,%d,%d], output.shape=[%d,%d,%d,%d,%d], "

James Ward

2023-01-18 14:51:25 +0000

[diff] [blame]

911

"stride=[%d,%d,%d], dilation=[%d,%d,%d], pad=[%d,%d,%d,%d,%d,%d]",

Kevin Cheng

2021-09-01 12:51:58 -0700

[diff] [blame]

912

in_batch, in_depth, in_height, in_width, in_channels, f_out_channels, f_depth, f_height, f_width, f_in_channels,

913

out_batch, out_depth, out_height, out_width, out_channels, stride_d, stride_h, stride_w, dilation_d, dilation_h,

James Ward

2023-01-18 14:51:25 +0000

[diff] [blame]

914

dilation_w, pad_d0, pad_d1, pad_top, pad_bottom, pad_left, pad_right);

Kevin Cheng

2021-09-01 12:51:58 -0700

[diff] [blame]

915

TatWai Chong

2022-06-06 20:46:01 -0700

[diff] [blame]

916

Eigen::array<std::pair<int32_t, int32_t>, 5> pad;

917

pad[0] = std::make_pair(0, 0);

918

pad[1] = std::make_pair(pad_d0, pad_d1);

919

pad[2] = std::make_pair(pad_top, pad_bottom);

920

pad[3] = std::make_pair(pad_left, pad_right);

921

pad[4] = std::make_pair(0, 0);

Kevin Cheng

2021-09-01 12:51:58 -0700

[diff] [blame]

922

923

TIn input_val = this->input->getTensor();

924

TWeight weight_val = this->weight->getTensor();

Eric Kunze

2022-06-17 08:19:12 -0700

[diff] [blame]

925

if (InDtype == DType_INT8 || WeightDtype == DType_INT8)

Kevin Cheng

2021-09-01 12:51:58 -0700

[diff] [blame]

926

{

Eric Kunze

2022-06-07 05:20:44 +0000

[diff] [blame]

927

input_val = input_val - (InEigenType)attribute->input_zp();

928

weight_val = weight_val - (WeightEigenType)attribute->weight_zp();

Kevin Cheng

2021-09-01 12:51:58 -0700

[diff] [blame]

929

}

930

TatWai Chong

2022-06-06 20:46:01 -0700

[diff] [blame]

931

ETensor5<InEigenType> input_padded = input_val.pad(pad);

Kevin Cheng

2021-09-01 12:51:58 -0700

[diff] [blame]

932

933

// 1. initialize with bias

934

Eigen::array<Eigen::Index, 5> reshape_dim;

935

reshape_dim.fill(1);

936

reshape_dim[4] = b_out_channels;

937

938

Eigen::array<Eigen::Index, 5> bcast;

939

bcast[0] = out_batch;

940

bcast[1] = out_depth;

941

bcast[2] = out_height;

942

bcast[3] = out_width;

943

bcast[4] = 1;

944

this->output->getTensor() = this->bias->getTensor().reshape(reshape_dim).broadcast(bcast);

945

946

// 2. direct convolution

James Ward

2022-08-12 20:48:56 +0100

[diff] [blame]

947

AccEigenType acc(0.0);

Kevin Cheng

2021-09-01 12:51:58 -0700

[diff] [blame]

948

int d_idx, h_idx, w_idx;

949

950

for (int ob = 0; ob < out_batch; ob++)

951

{

952

for (int od = 0; od < out_depth; od++)

953

{

954

for (int oh = 0; oh < out_height; oh++)

955

{

956

for (int ow = 0; ow < out_width; ow++)

957

{

958

for (int oc = 0; oc < out_channels; oc++)

959

{

Eric Kunze

7edb34c

2022-05-16 17:34:40 -0700

[diff] [blame]

960

// Initialize accumulator with bias value

James Ward

2022-08-12 20:48:56 +0100

[diff] [blame]

961

acc = (AccEigenType)this->output->getTensor()(ob, od, oh, ow, oc);

Kevin Cheng

2021-09-01 12:51:58 -0700

[diff] [blame]

962

for (int fd = 0; fd < f_depth; fd++)

963

{

964

d_idx = od * stride_d + fd * dilation_d;

965

for (int fh = 0; fh < f_height; fh++)

966

{

967

h_idx = oh * stride_h + fh * dilation_h;

968

for (int fw = 0; fw < f_width; fw++)

969

{

970

w_idx = ow * stride_w + fw * dilation_w;

971

for (int ic = 0; ic < in_channels; ic++)

972

{

973

acc += ((AccEigenType)input_padded(ob, d_idx, h_idx, w_idx, ic) *

974

(AccEigenType)weight_val(oc, fd, fh, fw, ic));

}

}

}

}

James Ward

2022-08-12 20:48:56 +0100

[diff] [blame]

979

this->output->getTensor()(ob, od, oh, ow, oc) = (OutEigenType)acc;

Kevin Cheng

2021-09-01 12:51:58 -0700

[diff] [blame]

}

}

}

}

}

James Ward

2023-01-18 14:51:25 +0000

[diff] [blame]

986

if (OutDtype == DType_INT48)

Kevin Cheng

2021-09-01 12:51:58 -0700

[diff] [blame]

987

{

James Ward

2022-08-12 20:48:56 +0100

[diff] [blame]

988

this->output->getTensor() = this->output->getTensor().cwiseMax((OutEigenType)AccQMin);

989

this->output->getTensor() = this->output->getTensor().cwiseMin((OutEigenType)AccQMax);

Kevin Cheng

2021-09-01 12:51:58 -0700

[diff] [blame]

990

}

991

992

return GraphNode::eval();

993

}

994

James Ward

2023-01-18 14:51:25 +0000

[diff] [blame]

995

template <DType InDtype, DType WeightDtype, DType OutDtype>

996

OpDepthwiseConv2d<InDtype, WeightDtype, OutDtype>::OpDepthwiseConv2d(SubgraphTraverser* sgt_,

Kevin Cheng

2021-06-29 15:32:19 -0700

[diff] [blame]

997

TosaAttributeBase* attribute_,

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

998

uint64_t id_)

Kevin Cheng

2021-06-29 15:32:19 -0700

[diff] [blame]

999

: GraphNode(sgt_, Op_DEPTHWISE_CONV2D, id_)

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

1000

{

1001

setRequiredOperands(3, 1);

1002

setRequiredRank(4);

1003

Kevin Cheng

2021-08-31 16:14:03 -0700

[diff] [blame]

1004

INIT_ATTRIBUTE(Conv);

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

1005

}

1006

James Ward

2023-01-18 14:51:25 +0000

[diff] [blame]

1007

template <DType InDtype, DType WeightDtype, DType OutDtype>

1008

OpDepthwiseConv2d<InDtype, WeightDtype, OutDtype>::~OpDepthwiseConv2d()

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

1009

{

1010

if (attribute)

1011

delete attribute;

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

1012

}

1013

James Ward

2023-01-18 14:51:25 +0000

[diff] [blame]

1014

template <DType InDtype, DType WeightDtype, DType OutDtype>

1015

int OpDepthwiseConv2d<InDtype, WeightDtype, OutDtype>::checkTensorAttributes()

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

1016

{

1017

if (validateRequiredOperands())

1018

return 1;

1019

1020

if (validateRequiredRank(inputs[0]) || validateRequiredRank(inputs[1]) || validateRequiredRank(outputs[0]))

{

return 1;

}

// 'bias' checked separatedly since it doens't make sense to make required rank ranging from 1 to 4

1026

if (inputs[2]->getRank() != 1)

1027

{

1028

printNodeValidationError("OpDepthwiseConv2d: bias tensor must be rank 1");

1029

}

1030

James Ward

2023-01-18 14:51:25 +0000

[diff] [blame]

1031

ERROR_IF(outputs[0]->getDtype() != OutDtype,

James Ward

2022-08-12 20:48:56 +0100

[diff] [blame]

1032

"OpDepthwiseConv2d: Output data type not supported for this configuration of operator");

Kevin Cheng

2021-10-14 17:09:57 -0700

[diff] [blame]

1033

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

1034

input = dynamic_cast<TosaReference::TensorTemplate<TIn>*>(inputs[0]);

1035

weight = dynamic_cast<TosaReference::TensorTemplate<TWeight>*>(inputs[1]);

1036

bias = dynamic_cast<TosaReference::TensorTemplate<TBias>*>(inputs[2]);

James Ward

2022-08-12 20:48:56 +0100

[diff] [blame]

1037

output = dynamic_cast<TosaReference::TensorTemplate<TOut>*>(outputs[0]);

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

1038

Kevin Cheng

2021-11-10 01:04:39 +0000

[diff] [blame]

1039

std::string msg;

Eric Kunze

2022-06-07 05:20:44 +0000

[diff] [blame]

1040

if (check_conv_attribute(attribute, 2 /* conv_dimension */, input->getShape(), output->getShape(),

Jeremy Johnson

2022-04-26 15:47:21 +0100

[diff] [blame]

1041

weight->getShape(), 0 /* offset_kernel */, InDtype, WeightDtype, msg))

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

1042

{

Kevin Cheng

2021-11-10 01:04:39 +0000

[diff] [blame]

1043

msg = "OpDepthwiseConv2d: " + msg;

1044

printNodeValidationError(msg.c_str());

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

return 1;

}

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

return 0;

}

James Ward

2023-01-18 14:51:25 +0000

[diff] [blame]

1051

template <DType InDtype, DType WeightDtype, DType OutDtype>

1052

int OpDepthwiseConv2d<InDtype, WeightDtype, OutDtype>::eval()

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

1053

{

1054

int in_batch = this->input->getShape()[0];

1055

int in_height = this->input->getShape()[1];

1056

int in_width = this->input->getShape()[2];

1057

int in_channels = this->input->getShape()[3];

1058

1059

int f_height = this->weight->getShape()[0];

1060

int f_width = this->weight->getShape()[1];

1061

int f_in_channels = this->weight->getShape()[2];

1062

int f_multiplier = this->weight->getShape()[3];

1063

1064

int b_out_channels = this->bias->getShape()[0];

1065

1066

int out_batch = this->output->getShape()[0];

1067

int out_height = this->output->getShape()[1];

1068

int out_width = this->output->getShape()[2];

1069

int out_channels = this->output->getShape()[3];

1070

Kevin Cheng

2021-06-29 15:32:19 -0700

[diff] [blame]

1071

ERROR_IF(in_batch != out_batch, "OpDepthwiseConv2d: tensor batch mismatch %d != %d", in_batch, out_batch);

1072

ERROR_IF(f_in_channels != in_channels, "OpDepthwiseConv2d: tensor input channel mismatch %d != %d", f_in_channels,

1073

in_channels);

1074

ERROR_IF(in_channels * f_multiplier != out_channels, "OpDepthwiseConv2d: tensor output channel mismatch %d != %d",

1075

in_channels * f_multiplier, out_channels);

1076

ERROR_IF(b_out_channels != out_channels, "OpDepthwiseConv2d: bias channels mismatch %d != %d", b_out_channels,

1077

out_channels);

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

1078

TatWai Chong

2022-06-06 20:46:01 -0700

[diff] [blame]

1079

int pad_top = this->attribute->pad()[0];

1080

int pad_bottom = this->attribute->pad()[1];

1081

int pad_left = this->attribute->pad()[2];

1082

int pad_right = this->attribute->pad()[3];

1083

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

1084

int stride_h = this->attribute->stride()[0];

1085

int stride_w = this->attribute->stride()[1];

1086

int dilation_h = this->attribute->dilation()[0];

1087

int dilation_w = this->attribute->dilation()[1];

1088

1089

DEBUG_INFO(OP,

1090

"perform OpDepthwiseConv2d, input.shape=[%d,%d,%d,%d], weight.shape=[%d,%d,%d,%d], "

James Ward

2023-01-18 14:51:25 +0000

[diff] [blame]

1091

"output.shape=[%d,%d,%d,%d], stride=[%d,%d], dilation=[%d,%d], pad=[%d,%d,%d,%d]",

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

1092

in_batch, in_height, in_width, in_channels, f_height, f_width, f_in_channels, f_multiplier, out_batch,

TatWai Chong

2022-06-06 20:46:01 -0700

[diff] [blame]

1093

out_height, out_width, out_channels, stride_h, stride_w, dilation_h, dilation_w, pad_top,

James Ward

2023-01-18 14:51:25 +0000

[diff] [blame]

1094

pad_bottom, pad_left, pad_right);

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

1095

TatWai Chong

2022-06-06 20:46:01 -0700

[diff] [blame]

1096

Eigen::array<std::pair<int32_t, int32_t>, 4> pad;

1097

pad[0] = std::make_pair(0, 0);

1098

pad[1] = std::make_pair(pad_top, pad_bottom);

1099

pad[2] = std::make_pair(pad_left, pad_right);

1100

pad[3] = std::make_pair(0, 0);

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

1101

1102

TIn input_val = this->input->getTensor();

1103

TWeight weight_val = this->weight->getTensor();

Eric Kunze

2022-06-17 08:19:12 -0700

[diff] [blame]

1104

if (InDtype == DType_INT8 || WeightDtype == DType_INT8)

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

1105

{

Eric Kunze

2022-06-07 05:20:44 +0000

[diff] [blame]

1106

input_val = input_val - (InEigenType)attribute->input_zp();

1107

weight_val = weight_val - (WeightEigenType)attribute->weight_zp();

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

1108

}

1109

TatWai Chong

2022-06-06 20:46:01 -0700

[diff] [blame]

1110

ETensor4<InEigenType> input_padded = input_val.pad(pad);

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

1111

1112

// GEMM doesn't fit well with DepthwiseConv2d

TatWai Chong

2022-06-06 20:46:01 -0700

[diff] [blame]

1113

// 1. use extract_image_patches() to handle stride/dilation/pad

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

1114

// 2. perform direct convolution

1115

1116

// 1. extract_image_patches() output [N, KH, KW, OH * OW, IC]

1117

ETensor5<InEigenType> input_extract_patches = input_padded.extract_image_patches(

1118

f_height, f_width, stride_h, stride_w, dilation_h, dilation_w, Eigen::PADDING_VALID);

1119

1120

Eigen::array<Eigen::Index, 4> reshape_dim;

1121

reshape_dim.fill(1);

1122

reshape_dim[3] = b_out_channels;

1123

1124

Eigen::array<Eigen::Index, 4> bcast;

1125

bcast[0] = out_batch;

1126

bcast[1] = out_height;

1127

bcast[2] = out_width;

1128

bcast[3] = 1;

1129

1130

// initialize with bias

1131

this->output->getTensor() = this->bias->getTensor().reshape(reshape_dim).broadcast(bcast);

1132

1133

// 2. direct depthwise convolution

1134

for (int ob = 0; ob < out_batch; ob++)

1135

{

1136

for (int oh = 0; oh < out_height; oh++)

1137

{

1138

for (int ow = 0; ow < out_width; ow++)

1139

{

1140

for (int ic = 0; ic < in_channels; ic++)

1141

{

1142

for (int cm = 0; cm < f_multiplier; cm++)

1143

{

1144

for (int fh = 0; fh < f_height; fh++)

1145

{

1146

for (int fw = 0; fw < f_width; fw++)

1147

{

James Ward

2022-08-12 20:48:56 +0100

[diff] [blame]

1148

// Perform multiplication in AccEigenType then cast to OutEigenType

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

1149

this->output->getTensor()(ob, oh, ow, ic * f_multiplier + cm) +=

James Ward

2022-08-12 20:48:56 +0100

[diff] [blame]

1150

(OutEigenType)((AccEigenType)input_extract_patches(ob, fh, fw, ow * out_height + oh, ic) *

1151

(AccEigenType)weight_val(fh, fw, ic, cm));

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

}

}

}

}

}

}

}

James Ward

2023-01-18 14:51:25 +0000

[diff] [blame]

1160

if (OutDtype == DType_INT48)

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

1161

{

James Ward

2022-08-12 20:48:56 +0100

[diff] [blame]

1162

this->output->getTensor() = this->output->getTensor().cwiseMax((OutEigenType)AccQMin);

1163

this->output->getTensor() = this->output->getTensor().cwiseMin((OutEigenType)AccQMax);

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

1164

}

1165

1166

return GraphNode::eval();

1167

}

1168

James Ward

2023-01-18 14:51:25 +0000

[diff] [blame]

1169

template <DType InDtype, DType WeightDtype, DType OutDtype>

1170

OpFullyConnected<InDtype, WeightDtype, OutDtype>::OpFullyConnected(SubgraphTraverser* sgt_,

Kevin Cheng

2021-06-29 15:32:19 -0700

[diff] [blame]

1171

TosaAttributeBase* attribute_,

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

1172

uint64_t id_)

Kevin Cheng

2021-06-29 15:32:19 -0700

[diff] [blame]

1173

: GraphNode(sgt_, Op_FULLY_CONNECTED, id_)

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

1174

{

1175

setRequiredOperands(3, 1);

1176

setRequiredRank(2);

1177

Eric Kunze

2022-06-07 05:20:44 +0000

[diff] [blame]

1178

INIT_ATTRIBUTE(FullyConnected);

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

1179

}

1180

James Ward

2023-01-18 14:51:25 +0000

[diff] [blame]

1181

template <DType InDtype, DType WeightDtype, DType OutDtype>

1182

OpFullyConnected<InDtype, WeightDtype, OutDtype>::~OpFullyConnected()

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

1183

{

Eric Kunze

2022-06-07 05:20:44 +0000

[diff] [blame]

1184

if (attribute)

1185

delete attribute;

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

1186

}

1187

James Ward

2023-01-18 14:51:25 +0000

[diff] [blame]

1188

template <DType InDtype, DType WeightDtype, DType OutDtype>

1189

int OpFullyConnected<InDtype, WeightDtype, OutDtype>::checkTensorAttributes()

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

1190

{

1191

if (validateRequiredOperands())

1192

return 1;

1193

1194

if (validateRequiredRank(inputs[0]) || validateRequiredRank(inputs[1]) || validateRequiredRank(outputs[0]))

{

return 1;

}

input = dynamic_cast<TosaReference::TensorTemplate<TIn>*>(inputs[0]);

1200

weight = dynamic_cast<TosaReference::TensorTemplate<TWeight>*>(inputs[1]);

1201

bias = dynamic_cast<TosaReference::TensorTemplate<TBias>*>(inputs[2]);

1202

1203

if (input->getShape()[1] != weight->getShape()[1])

1204

{

1205

printNodeValidationError("OpFullyConnected operator input.shape[1] should match weight.shape[1]");

return 1;

}

if (weight->getShape()[0] != bias->getShape()[0])

1210

{

1211

printNodeValidationError("OpFullyConnected operator bias.shape[0] should match weight.shape[0]");

return 1;

}

James Ward

2023-01-18 14:51:25 +0000

[diff] [blame]

1215

ERROR_IF(outputs[0]->getDtype() != OutDtype,

James Ward

2022-08-12 20:48:56 +0100

[diff] [blame]

1216

"OpFullyConnected: Output data type not supported for this configuration of operator");

Kevin Cheng

2021-10-14 17:09:57 -0700

[diff] [blame]

1217

James Ward

2022-08-12 20:48:56 +0100

[diff] [blame]

1218

output = dynamic_cast<TosaReference::TensorTemplate<TOut>*>(outputs[0]);

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

1219

Eric Kunze

2022-06-07 05:20:44 +0000

[diff] [blame]

1220

ERROR_IF(InDtype != DType_INT8 && attribute->input_zp() != 0, "OpFullyConnected: Input zeropoint must be zero for non int8_t data");

1221

ERROR_IF(WeightDtype != DType_INT8 && attribute->weight_zp() != 0, "OpFullyConnected: Weight zeropoint must be zero for non int8_t data");

Kevin Cheng

2021-10-14 17:09:57 -0700

[diff] [blame]

1222

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

return 0;

}

James Ward

2023-01-18 14:51:25 +0000

[diff] [blame]

1226

template <DType InDtype, DType WeightDtype, DType OutDtype>

1227

int OpFullyConnected<InDtype, WeightDtype, OutDtype>::eval()

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

1228

{

1229

typedef Eigen::Tensor<int, 1>::DimensionPair DimPair;

1230

Eigen::array<DimPair, 1> dims{ { DimPair(1, 0) } };

1231

1232

Eigen::array<Eigen::Index, 2> weight_shuffle{ 1, 0 };

1233

1234

Eigen::array<Eigen::Index, 2> bias_reshape;

1235

bias_reshape[0] = 1;

1236

bias_reshape[1] = this->bias->getShape()[0];

1237

1238

Eigen::array<Eigen::Index, 2> bias_bcast;

1239

bias_bcast[0] = this->input->getShape()[0];

1240

bias_bcast[1] = 1;

1241

1242

TIn input_val = this->input->getTensor();

1243

TWeight weight_val = this->weight->getTensor().shuffle(weight_shuffle);

Eric Kunze

2022-06-17 08:19:12 -0700

[diff] [blame]

1244

if (InDtype == DType_INT8 || WeightDtype == DType_INT8)

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

1245

{

Eric Kunze

2022-06-07 05:20:44 +0000

[diff] [blame]

1246

input_val = input_val - (InEigenType)attribute->input_zp();

1247

weight_val = weight_val - (WeightEigenType)attribute->weight_zp();

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

1248

}

1249

1250

this->output->getTensor() =

James Ward

2022-08-12 20:48:56 +0100

[diff] [blame]

1251

input_val.template cast<AccEigenType>().contract(weight_val.template cast<AccEigenType>(), dims).template cast<OutEigenType>() +

1252

this->bias->getTensor().reshape(bias_reshape).broadcast(bias_bcast);

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

1253

James Ward

2023-01-18 14:51:25 +0000

[diff] [blame]

1254

if (OutDtype == DType_INT48)

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

1255

{

James Ward

2022-08-12 20:48:56 +0100

[diff] [blame]

1256

this->output->getTensor() = this->output->getTensor().cwiseMax((OutEigenType)AccQMin);

1257

this->output->getTensor() = this->output->getTensor().cwiseMin((OutEigenType)AccQMax);

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

1258

}

1259

return GraphNode::eval();

1260

}

1261

James Ward

2023-01-18 14:51:25 +0000

[diff] [blame]

1262

template <DType Dtype, DType OutDtype>

1263

OpMatMul<Dtype, OutDtype>::OpMatMul(SubgraphTraverser* sgt_,

Kevin Cheng

2021-06-29 15:32:19 -0700

[diff] [blame]

1264

TosaAttributeBase* attribute_,

Kevin Cheng

2021-06-29 15:32:19 -0700

[diff] [blame]

1265

uint64_t id_)

1266

: GraphNode(sgt_, Op_MATMUL, id_)

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

1267

{

1268

setRequiredOperands(2, 1);

Kevin Cheng

2021-06-09 14:18:32 -0700

[diff] [blame]

1269

setRequiredRank(3);

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

1270

Eric Kunze

2022-06-07 05:20:44 +0000

[diff] [blame]

1271

INIT_ATTRIBUTE(MatMul);

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

1272

}

1273

James Ward

2023-01-18 14:51:25 +0000

[diff] [blame]

1274

template <DType Dtype, DType OutDtype>

1275

OpMatMul<Dtype, OutDtype>::~OpMatMul()

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

1276

{

Eric Kunze

2022-06-07 05:20:44 +0000

[diff] [blame]

1277

if (attribute)

1278

delete attribute;

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

1279

}

1280

James Ward

2023-01-18 14:51:25 +0000

[diff] [blame]

1281

template <DType Dtype, DType OutDtype>

1282

int OpMatMul<Dtype, OutDtype>::checkTensorAttributes()

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

1283

{

1284

if (validateRequiredOperands())

1285

return 1;

1286

1287

if (validateRequiredRank(inputs[0]) || validateRequiredRank(inputs[1]) || validateRequiredRank(outputs[0]))

{

return 1;

}

James Ward

2023-01-18 14:51:25 +0000

[diff] [blame]

1292

ERROR_IF(outputs[0]->getDtype() != OutDtype,

James Ward

2022-08-12 20:48:56 +0100

[diff] [blame]

1293

"OpMatMul: Output data type not supported for this configuration of operator");

Kevin Cheng

2021-10-14 17:09:57 -0700

[diff] [blame]

1294

Kevin Cheng

2021-06-09 14:18:32 -0700

[diff] [blame]

1295

a = dynamic_cast<TosaReference::TensorTemplate<TIn>*>(inputs[0]);

1296

b = dynamic_cast<TosaReference::TensorTemplate<TIn>*>(inputs[1]);

James Ward

2022-08-12 20:48:56 +0100

[diff] [blame]

1297

output = dynamic_cast<TosaReference::TensorTemplate<TOut>*>(outputs[0]);

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

1298

Kevin Cheng

2021-06-09 14:18:32 -0700

[diff] [blame]

1299

ASSERT_MEM(a && b && output);

// a: [N, H, C]

// b: [N, C, W]

// c: [N, H, W]

// Check N

if (a->getShape()[0] != b->getShape()[0] || a->getShape()[0] != output->getShape()[0])

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

1307

{

Kevin Cheng

2021-06-09 14:18:32 -0700

[diff] [blame]

1308

printNodeValidationError("OpMatMul operator a.shape[0], b.shape[0] and output.shape[0] should match");

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

1309

return 1;

1310

}

Kevin Cheng

2021-06-09 14:18:32 -0700

[diff] [blame]

1311

N = a->getShape()[0];

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

1312

Kevin Cheng

2021-06-09 14:18:32 -0700

[diff] [blame]

1313

// Check C

1314

if (a->getShape()[2] != b->getShape()[1])

1315

{

1316

printNodeValidationError("OpMatMul operator a.shape[2] should match b.shape[1]");

1317

return 1;

1318

}

1319

C = a->getShape()[2];

1320

1321

// Check H

1322

if (a->getShape()[1] != output->getShape()[1])

1323

{

1324

printNodeValidationError("OpMatMul operator a.shape[1] should match output.shape[1]");

1325

return 1;

1326

}

1327

H = a->getShape()[1];

1328

1329

// Check W

1330

if (b->getShape()[2] != output->getShape()[2])

1331

{

1332

printNodeValidationError("OpMatMul operator output.shape[2] should match output.shape[2]");

1333

return 1;

1334

}

1335

W = b->getShape()[2];

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

1336

Eric Kunze

2022-06-07 05:20:44 +0000

[diff] [blame]

1337

ERROR_IF(Dtype != DType_INT8 && attribute->a_zp() != 0, "OpMatMul: A zeropoint must be zero for non int8_t data");

1338

ERROR_IF(Dtype != DType_INT8 && attribute->b_zp() != 0, "OpMatMul: B zeropoint must be zero for non int8_t data");

Kevin Cheng

2021-10-14 17:09:57 -0700

[diff] [blame]

1339

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

return 0;

}

James Ward

2023-01-18 14:51:25 +0000

[diff] [blame]

1343

template <DType Dtype, DType OutDtype>

1344

int OpMatMul<Dtype, OutDtype>::eval()

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

1345

{

1346

typedef Eigen::Tensor<int, 1>::DimensionPair DimPair;

1347

Eigen::array<DimPair, 1> dims{ { DimPair(1, 0) } };

1348

1349

TIn a_val = this->a->getTensor();

1350

TIn b_val = this->b->getTensor();

Eric Kunze

2022-06-07 05:20:44 +0000

[diff] [blame]

1351

if (Dtype == DType_INT8)

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

1352

{

Eric Kunze

2022-06-07 05:20:44 +0000

[diff] [blame]

1353

a_val = a_val - (InEigenType)attribute->a_zp();

1354

b_val = b_val - (InEigenType)attribute->b_zp();

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

1355

}

1356

Kevin Cheng

2021-06-09 14:18:32 -0700

[diff] [blame]

1357

Eigen::array<Eigen::Index, 2> a_rank2_shape({ H, C });

1358

Eigen::array<Eigen::Index, 2> b_rank2_shape({ C, W });

1359

Eigen::array<Eigen::Index, 3> output_rank3_shape({ 1, H, W });

1360

1361

Eigen::array<Eigen::Index, 3> a_size_array({ 1, H, C });

1362

Eigen::array<Eigen::Index, 3> b_size_array({ 1, C, W });

1363

1364

Eigen::array<Eigen::Index, 3> a_begin_array({ 0, 0, 0 });

1365

Eigen::array<Eigen::Index, 3> b_begin_array({ 0, 0, 0 });

1366

1367

// Iterate N dimension.

1368

for (int i = 0; i < N; i++)

1369

{

1370

a_begin_array[0] = i;

1371

b_begin_array[0] = i;

1372

1373

TInRank2 a_rank2_val = a_val.slice(a_begin_array, a_size_array).reshape(a_rank2_shape);

1374

TInRank2 b_rank2_val = b_val.slice(b_begin_array, b_size_array).reshape(b_rank2_shape);

1375

TAccRank2 output_rank2_val =

1376

a_rank2_val.template cast<AccEigenType>().contract(b_rank2_val.template cast<AccEigenType>(), dims);

James Ward

2022-08-12 20:48:56 +0100

[diff] [blame]

1377

TOut output_rank3_val = output_rank2_val.reshape(output_rank3_shape).template cast<OutEigenType>();

Kevin Cheng

2021-06-09 14:18:32 -0700

[diff] [blame]

1378

if (i == 0)

1379

{

1380

this->output->getTensor() = output_rank3_val;

1381

}

1382

else

1383

{

James Ward

2022-08-12 20:48:56 +0100

[diff] [blame]

1384

TOut temp = this->output->getTensor().concatenate(output_rank3_val, 0);

Kevin Cheng

2021-06-09 14:18:32 -0700

[diff] [blame]

1385

this->output->getTensor() = temp;

1386

}

1387

}

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

1388

James Ward

2023-01-18 14:51:25 +0000

[diff] [blame]

1389

if (OutDtype == DType_INT48)

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

1390

{

James Ward

2022-08-12 20:48:56 +0100

[diff] [blame]

1391

this->output->getTensor() = this->output->getTensor().cwiseMax((OutEigenType)AccQMin);

1392

this->output->getTensor() = this->output->getTensor().cwiseMin((OutEigenType)AccQMax);

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

1393

}

1394

1395

return GraphNode::eval();

1396

}

1397

1398

template <DType Dtype>

Kevin Cheng

2021-06-29 15:32:19 -0700

[diff] [blame]

1399

OpMaxPool2d<Dtype>::OpMaxPool2d(SubgraphTraverser* sgt_,

1400

TosaAttributeBase* attribute_,

Kevin Cheng

2021-06-29 15:32:19 -0700

[diff] [blame]

1401

uint64_t id_)

1402

: GraphNode(sgt_, Op_MAX_POOL2D, id_)

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

1403

{

1404

setRequiredOperands(1, 1);

1405

setRequiredRank(4);

1406

Kevin Cheng

2021-08-31 16:14:03 -0700

[diff] [blame]

1407

INIT_ATTRIBUTE(Pool);

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

1408

}

1409

1410

template <DType Dtype>

1411

OpMaxPool2d<Dtype>::~OpMaxPool2d()

{

if (attribute)

delete attribute;

}

template <DType Dtype>

1418

int OpMaxPool2d<Dtype>::checkTensorAttributes()

1419

{

1420

if (validateRequiredOperands())

1421

return 1;

1422

1423

if (validateRequiredRank(inputs[0]) || validateRequiredRank(outputs[0]))

{

return 1;

}

if (inputs[0]->matchType(*outputs[0]))

1429

{

1430

printNodeValidationError("OpMaxPool2d: input and output tensor type mismatch");

return 1;

}

in = dynamic_cast<TosaReference::TensorTemplate<TIn>*>(inputs[0]);

1435

out = dynamic_cast<TosaReference::TensorTemplate<TOut>*>(outputs[0]);

1436

Kevin Cheng

7eb93d7

2021-10-09 01:26:08 +0000

[diff] [blame]

1437

std::string msg;

Kevin Cheng

2021-11-10 01:04:39 +0000

[diff] [blame]

1438

if (check_pool2d_attribute(attribute, in->getShape(), out->getShape(), msg))

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

1439

{

Kevin Cheng

7eb93d7

2021-10-09 01:26:08 +0000

[diff] [blame]

1440

msg = "OpMaxPool2d: " + msg;

1441

printNodeValidationError(msg.c_str());

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

return 1;

}

return 0;

}

template <DType Dtype>

1449

int OpMaxPool2d<Dtype>::eval()

1450

{

1451

int in_batch = this->in->getShape()[0];

1452

int in_height = this->in->getShape()[1];

1453

int in_width = this->in->getShape()[2];

1454

int in_channels = this->in->getShape()[3];

1455

1456

int out_batch = this->out->getShape()[0];

1457

int out_height = this->out->getShape()[1];

1458

int out_width = this->out->getShape()[2];

1459

int out_channels = this->out->getShape()[3];

1460

Kevin Cheng

2021-06-29 15:32:19 -0700

[diff] [blame]

1461

ERROR_IF(in_batch != out_batch, "OpMaxPool2d: tensor batch mismatch %d != %d", in_batch, out_batch);

1462

ERROR_IF(in_channels != out_channels, "OpMaxPool2d: tensor channel mismatch %d != %d", in_channels, out_channels);

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

1463

TatWai Chong

2022-06-06 20:46:01 -0700

[diff] [blame]

1464

int pad_top = this->attribute->pad()[0];

1465

int pad_bottom = this->attribute->pad()[1];

1466

int pad_left = this->attribute->pad()[2];

1467

int pad_right = this->attribute->pad()[3];

1468

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

1469

int kernel_h = this->attribute->kernel()[0];

1470

int kernel_w = this->attribute->kernel()[1];

1471

int stride_h = this->attribute->stride()[0];

1472

int stride_w = this->attribute->stride()[1];

1473

1474

DEBUG_INFO(OP,

1475

"perform MaxPool2d, input.shape=[%d,%d,%d,%d], output.shape=[%d,%d,%d,%d], kernel=[%d,%d], "

TatWai Chong

2022-06-06 20:46:01 -0700

[diff] [blame]

1476

"stride=[%d,%d], pad=[%d,%d,%d,%d]",

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

1477

in_batch, in_height, in_width, in_channels, out_batch, out_height, out_width, out_channels, kernel_h,

TatWai Chong

2022-06-06 20:46:01 -0700

[diff] [blame]

1478

kernel_w, stride_h, stride_w, pad_top, pad_bottom, pad_left, pad_right);

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

1479

1480

Eigen::array<Eigen::Index, 2> im2col_input_dims;

1481

im2col_input_dims[0] = kernel_h * kernel_w;

1482

im2col_input_dims[1] = out_batch * out_height * out_width * out_channels;

1483

1484

Eigen::array<Eigen::Index, 4> col2im_output_dims;

1485

col2im_output_dims[0] = out_batch;

1486

col2im_output_dims[1] = out_height;

1487

col2im_output_dims[2] = out_width;

1488

col2im_output_dims[3] = out_channels;

1489

TatWai Chong

2022-06-06 20:46:01 -0700

[diff] [blame]

1490

Eigen::array<std::pair<int32_t, int32_t>, 4> pad;

1491

pad[0] = std::make_pair(0, 0);

1492

pad[1] = std::make_pair(pad_top, pad_bottom);

1493

pad[2] = std::make_pair(pad_left, pad_right);

1494

pad[3] = std::make_pair(0, 0);

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

1495

TatWai Chong

2022-06-06 20:46:01 -0700

[diff] [blame]

1496

ETensor4<InEigenType> input_padded = this->in->getTensor().pad(pad, std::numeric_limits<InEigenType>::lowest());

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

1497

1498

// extract_image_patches() output [N, KH, KW, H * W, C]

1499

// transpose to [KH, KW, N, H * W, C]

1500

// reshape to [KH * KW, N * H * W * C]

1501

//

1502

// Set the padding value to be the most negative value that can be

1503

// represented by the datatype to ensure that any padding values will be equal

1504

// to or smaller than the actual maximum in the KH x KW patch.

1505

ETensor2<InEigenType> input_extract_patches =

1506

input_padded

1507

.extract_image_patches(kernel_h, kernel_w, stride_h, stride_w, 1, 1, Eigen::PADDING_VALID,

1508

std::numeric_limits<InEigenType>::lowest())

1509

.shuffle(Eigen::array<Eigen::Index, 5>{ 1, 2, 0, 3, 4 })

1510

.reshape(im2col_input_dims);

1511

1512

// Get the maximum of the KHxHW patches along axis 0

1513

Eigen::Tensor<DenseIndex, 1> tensor_argmax = input_extract_patches.argmax(0);

1514

1515

// 1D result with [N * H * W * C]

1516

ETensor1<OutEigenType> out_1d(this->out->getElementCount());

1517

1518

// index input_patches with argmax array should give the result

1519

for (size_t i = 0; i < this->out->getElementCount(); i++)

1520

{

1521

out_1d(i) = (OutEigenType)input_extract_patches(tensor_argmax(i), i);

1522

}

1523

1524

// reshape result to [N, H, W, C]

1525

this->out->getTensor() = out_1d.reshape(col2im_output_dims);

1526

1527

return GraphNode::eval();

1528

}

1529

Luke Hutton

2023-01-10 14:50:31 +0000

[diff] [blame]

1530

template <DType Dtype>

Luke Hutton

2023-02-06 14:54:18 +0000

[diff] [blame]

1531

OpFFT2d<Dtype>::OpFFT2d(SubgraphTraverser* sgt_,

1532

TosaAttributeBase* attribute_,

1533

uint64_t id_)

1534

: GraphNode(sgt_, Op_FFT2D, id_)

1535

{

1536

setRequiredOperands(2, 2);

setRequiredRank(3);

INIT_ATTRIBUTE(FFT);

}

template <DType Dtype>

1543

OpFFT2d<Dtype>::~OpFFT2d() {

if (attribute)

delete attribute;

}

template <DType Dtype>

1550

int OpFFT2d<Dtype>::checkTensorAttributes()

1551

{

1552

if (validateRequiredOperands())

1553

return 1;

1554

1555

if (validateRequiredRank(inputs[0]) || validateRequiredRank(inputs[1]) ||

1556

validateRequiredRank(outputs[0]) || validateRequiredRank(outputs[1]))

{

return 1;

}

if (inputs[0]->matchType(*outputs[0]) || inputs[1]->matchType(*outputs[1]) ||

1562

inputs[0]->matchType(*inputs[1]))

1563

{

1564

printNodeValidationError("OpFFT2d: input and output tensor type mismatch");

return 1;

}

in_real = dynamic_cast<TosaReference::TensorTemplate<TIn>*>(inputs[0]);

1569

in_imag = dynamic_cast<TosaReference::TensorTemplate<TIn>*>(inputs[1]);

1570

out_real = dynamic_cast<TosaReference::TensorTemplate<TOut>*>(outputs[0]);

1571

out_imag = dynamic_cast<TosaReference::TensorTemplate<TOut>*>(outputs[1]);

1572

1573

ASSERT_MEM(in_real && in_imag && out_real && out_imag);

1574

1575

std::string msg;

1576

if (check_fft_shape(in_real->getShape(), in_imag->getShape(),

1577

out_real->getShape(), out_imag->getShape(), msg))

1578

{

1579

msg = "OpFFT2d: " + msg;

1580

printNodeValidationError(msg.c_str());

return 1;

}

return 0;

}

template <DType Dtype>

1588

int OpFFT2d<Dtype>::eval()

1589

{

1590

int in_real_batch = this->in_real->getShape()[0];

1591

int in_real_height = this->in_real->getShape()[1];

1592

int in_real_width = this->in_real->getShape()[2];

1593

1594

int in_imag_batch = this->in_imag->getShape()[0];

1595

int in_imag_height = this->in_imag->getShape()[1];

1596

int in_imag_width = this->in_imag->getShape()[2];

1597

1598

int out_real_batch = this->out_real->getShape()[0];

1599

int out_real_height = this->out_real->getShape()[1];

1600

int out_real_width = this->out_real->getShape()[2];

1601

1602

int out_imag_batch = this->out_imag->getShape()[0];

1603

int out_imag_height = this->out_imag->getShape()[1];

1604

int out_imag_width = this->out_imag->getShape()[2];

1605

1606

DEBUG_INFO(OP,

1607

"perform OpFFT2d, input.shapes=[[%d,%d,%d],[%d,%d,%d]], output.shapes=[[%d,%d,%d],[%d,%d,%d]]",

1608

in_real_batch, in_real_height, in_real_width,

1609

in_imag_batch, in_imag_height, in_imag_width,

1610

out_real_batch, out_real_height, out_real_width,

1611

out_imag_batch, out_imag_height, out_imag_width);

1612

1613

OutEigenType sum_real, sum_imag, a, sign_val = 1.0;

1614

1615

if (attribute->inverse()) {

sign_val = -1.0;

}

for (int n = 0; n < in_real_batch; n++)

1620

{

1621

for (int oy = 0; oy < out_real_height; oy++)

1622

{

1623

for (int ox = 0; ox < out_real_width; ox++)

{

sum_real = 0.0;

sum_imag = 0.0;

for (int iy = 0; iy < in_real_height; iy++)

1628

{

1629

for (int ix = 0; ix < in_real_width; ix++)

1630

{

1631

OutEigenType val_real = this->in_real->getTensor()(n, iy, ix);

1632

OutEigenType val_imag = this->in_imag->getTensor()(n, iy, ix);

1633

// Use explicit cast to ensure intermmediate calculations are completed using OutEigenType

1634

a = sign_val * 2 * M_PI * ((iy * (OutEigenType)oy) / in_real_height + (ix * (OutEigenType)ox) / in_real_width);

1635

sum_real += val_real * cos(a) + val_imag * sin(a);

1636

sum_imag += -val_real * sin(a) + val_imag * cos(a);

1637

}

1638

}

1639

this->out_real->getTensor()(n, oy, ox) = sum_real;

1640

this->out_imag->getTensor()(n, oy, ox) = sum_imag;

}

}

}

return GraphNode::eval();

1646

}

1647

1648

template <DType Dtype>

Luke Hutton

2023-01-10 14:50:31 +0000

[diff] [blame]

1649

OpRFFT2d<Dtype>::OpRFFT2d(SubgraphTraverser* sgt_,

1650

TosaAttributeBase* attribute_,

1651

uint64_t id_)

1652

: GraphNode(sgt_, Op_RFFT2D, id_)

1653

{

1654

setRequiredOperands(1, 2);

setRequiredRank(3);

}

template <DType Dtype>

1659

OpRFFT2d<Dtype>::~OpRFFT2d() {}

1660

1661

1662

template <DType Dtype>

1663

int OpRFFT2d<Dtype>::checkTensorAttributes()

1664

{

1665

if (validateRequiredOperands())

1666

return 1;

1667

1668

if (validateRequiredRank(inputs[0]) || validateRequiredRank(outputs[0]) ||

1669

validateRequiredRank(outputs[1]))

{

return 1;

}

if (inputs[0]->matchType(*outputs[0]) || inputs[0]->matchType(*outputs[1]))

1675

{

1676

printNodeValidationError("OpRFFT2d: input and output tensor type mismatch");

return 1;

}

in = dynamic_cast<TosaReference::TensorTemplate<TIn>*>(inputs[0]);

1681

out_real = dynamic_cast<TosaReference::TensorTemplate<TOut>*>(outputs[0]);

1682

out_imag = dynamic_cast<TosaReference::TensorTemplate<TOut>*>(outputs[1]);

1683

1684

ASSERT_MEM(in && out_real && out_imag);

1685

Luke Hutton

2023-02-06 14:54:18 +0000

[diff] [blame]

1686

std::string msg;

1687

if (check_fft_shape(in->getShape(), {},

1688

out_real->getShape(), out_imag->getShape(), msg))

Luke Hutton

2023-01-10 14:50:31 +0000

[diff] [blame]

1689

{

Luke Hutton

2023-02-06 14:54:18 +0000

[diff] [blame]

1690

msg = "OpRFFT2d: " + msg;

1691

printNodeValidationError(msg.c_str());

Luke Hutton

2023-01-10 14:50:31 +0000

[diff] [blame]

return 1;

}

return 0;

}

template <DType Dtype>

1699

int OpRFFT2d<Dtype>::eval()

1700

{

1701

int32_t in_batch = in->getShape()[0];

1702

int32_t in_height = in->getShape()[1];

1703

int32_t in_width = in->getShape()[2];

1704

1705

int32_t out_real_batch = out_real->getShape()[0];

1706

int32_t out_real_height = out_real->getShape()[1];

1707

int32_t out_real_width = out_real->getShape()[2];

1708

1709

int32_t out_imag_batch = out_imag->getShape()[0];

1710

int32_t out_imag_height = out_imag->getShape()[1];

1711

int32_t out_imag_width = out_imag->getShape()[2];

1712

1713

DEBUG_INFO(OP,

1714

"perform OpRFFT2d, input.shape=[%d,%d,%d], output_real.shape=[%d,%d,%d], "

1715

"output_imag.shape=[%d,%d,%d]",

1716

in_batch, in_height, in_width,

1717

out_real_batch, out_real_height, out_real_width,

1718

out_imag_batch, out_imag_height, out_imag_width);

1719

1720

OutEigenType sum_real, sum_imag, a;

1721

1722

for (int n = 0; n < in_batch; n++)

1723

{

1724

for (int oy = 0; oy < out_real_height; oy++)

1725

{

1726

for (int ox = 0; ox < out_real_width; ox++)

{

sum_real = 0.0;

sum_imag = 0.0;

for (int iy = 0; iy < in_height; iy++)

1731

{

1732

for (int ix = 0; ix < in_width; ix++)

1733

{

1734

// Use explicit cast to ensure intermmediate calculations are completed using OutEigenType

1735

a = 2 * M_PI * ((iy * (OutEigenType)oy) / in_height + (ix * (OutEigenType)ox) / in_width);

1736

sum_real += this->in->getTensor()(n, iy, ix) * cos(a);

1737

sum_imag += -this->in->getTensor()(n, iy, ix) * sin(a);

1738

}

1739

}

1740

this->out_real->getTensor()(n, oy, ox) = sum_real;

1741

this->out_imag->getTensor()(n, oy, ox) = sum_imag;

}

}

}

return GraphNode::eval();

1747

}

1748

James Ward

2023-01-18 14:51:25 +0000

[diff] [blame]

1749

template <DType InDtype, DType WeightDtype, DType OutDtype>

1750

OpTransposeConv2d<InDtype, WeightDtype, OutDtype>::OpTransposeConv2d(SubgraphTraverser* sgt_,

Kevin Cheng

2021-10-14 17:09:57 -0700

[diff] [blame]

1751

TosaAttributeBase* attribute_,

Kevin Cheng

2021-10-14 17:09:57 -0700

[diff] [blame]

1752

uint64_t id_)

Kevin Cheng

2021-06-29 15:32:19 -0700

[diff] [blame]

1753

: GraphNode(sgt_, Op_TRANSPOSE_CONV2D, id_)

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

1754

{

1755

setRequiredOperands(3, 1);

1756

setRequiredRank(4);

1757

Kevin Cheng

2021-08-31 16:14:03 -0700

[diff] [blame]

1758

INIT_ATTRIBUTE(TransposeConv);

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

1759

}

1760

James Ward

2023-01-18 14:51:25 +0000

[diff] [blame]

1761

template <DType InDtype, DType WeightDtype, DType OutDtype>

1762

OpTransposeConv2d<InDtype, WeightDtype, OutDtype>::~OpTransposeConv2d()

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

1763

{

1764

if (attribute)

1765

delete attribute;

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

1766

}

1767

James Ward

2023-01-18 14:51:25 +0000

[diff] [blame]

1768

template <DType InDtype, DType WeightDtype, DType OutDtype>

1769

int OpTransposeConv2d<InDtype, WeightDtype, OutDtype>::checkTensorAttributes()

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

1770

{

1771

if (validateRequiredOperands())

1772

return 1;

1773

1774

if (validateRequiredRank(inputs[0]) || validateRequiredRank(inputs[1]) || validateRequiredRank(outputs[0]))

{

return 1;

}

James Ward

2023-01-18 14:51:25 +0000

[diff] [blame]

1779

ERROR_IF(outputs[0]->getDtype() != OutDtype,

James Ward

2022-08-12 20:48:56 +0100

[diff] [blame]

1780

"OpTransposeConv2d: Output data type not supported for this configuration of operator");

Kevin Cheng

2021-10-14 17:09:57 -0700

[diff] [blame]

1781

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

1782

input = dynamic_cast<TosaReference::TensorTemplate<TIn>*>(inputs[0]);

1783

weight = dynamic_cast<TosaReference::TensorTemplate<TWeight>*>(inputs[1]);

1784

bias = dynamic_cast<TosaReference::TensorTemplate<TBias>*>(inputs[2]);

James Ward

2022-08-12 20:48:56 +0100

[diff] [blame]

1785

output = dynamic_cast<TosaReference::TensorTemplate<TOut>*>(outputs[0]);

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

1786

TatWai Chong

2022-06-08 00:48:04 -0700

[diff] [blame]

1787

if (attribute->out_pad().size() != 4)

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

1788

{

TatWai Chong

2022-06-08 00:48:04 -0700

[diff] [blame]

1789

printNodeValidationError("OpTransposeConv2d: illegal size for attribute out_pad");

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

return 1;

}

if (attribute->stride().size() != 2)

1794

{

1795

printNodeValidationError("OpTransposeConv2d: illegal size for attribute stride");

return 1;

}

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

1799

if (attribute->output_shape().size() != 4)

1800

{

1801

printNodeValidationError("OpTransposeConv2d: illegal size for attribute output_shape");

return 1;

}

Eric Kunze

2022-07-01 16:56:09 -0700

[diff] [blame]

1805

Kevin Cheng

2021-11-10 01:04:39 +0000

[diff] [blame]

1806

1807

for (int32_t i : attribute->stride())

{

if (i < 1)

{

printNodeValidationError("OpTransposeConv2d: At least one stride is smaller than one");

return 1;

}

}

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

1816

for (int d = 0; d < 4; d++)

1817

{

1818

if (attribute->output_shape()[d] != this->output->getShape()[d])

1819

{

1820

printNodeValidationError("OpTransposeConv2d: illegal size for attribute output_shape");

return 1;

}

}

Jeremy Johnson

2022-04-26 15:47:21 +0100

[diff] [blame]

1825

int32_t IH = input->getShape()[1];

1826

int32_t IW = input->getShape()[2];

1827

int32_t OH = output->getShape()[1];

1828

int32_t OW = output->getShape()[2];

1829

1830

int32_t stride_y = attribute->stride()[0];

1831

int32_t stride_x = attribute->stride()[1];

1832

int32_t kernel_h = weight->getShape()[1];

1833

int32_t kernel_w = weight->getShape()[2];

1834

TatWai Chong

2022-06-08 00:48:04 -0700

[diff] [blame]

1835

int32_t out_pad_top = attribute->out_pad()[0];

1836

int32_t out_pad_bottom = attribute->out_pad()[1];

1837

int32_t out_pad_left = attribute->out_pad()[2];

1838

int32_t out_pad_right = attribute->out_pad()[3];

Jeremy Johnson

2022-04-26 15:47:21 +0100

[diff] [blame]

1839

Eric Kunze

c1a9783

2022-07-01 16:56:09 -0700

[diff] [blame]

1840

for (size_t i = 0; i < attribute->out_pad().size(); i++)

1841

{

1842

ERROR_IF(attribute->out_pad()[i] <= -(weight->getShape()[(i / 2) + 1]), "OpTransposeConv2d: At least one out_pad value is larger than kernel size");

1843

}

1844

1845

int32_t H = (IH - 1) * stride_y + out_pad_top + out_pad_bottom + kernel_h;

1846

int32_t W = (IW - 1) * stride_x + out_pad_left + out_pad_right + kernel_w;

Jeremy Johnson

2022-04-26 15:47:21 +0100

[diff] [blame]

1847

1848

if ((OH != H) || (OW != W))

1849

{

1850

std::string msg = "OpTransposeConv2d: Mismatch between output shape provided and expected output shape (" +

1851

std::to_string(H) + "," +

1852

std::to_string(W) + ")";

1853

printNodeValidationError(msg.c_str());

return 1;

}

Eric Kunze

2022-06-07 05:20:44 +0000

[diff] [blame]

1857

ERROR_IF(InDtype != DType_INT8 && attribute->input_zp() != 0, "OpTransposeConv2d: Input zeropoint must be zero for non int8_t data");

1858

ERROR_IF(WeightDtype != DType_INT8 && attribute->weight_zp() != 0, "OpTransposeConv2d: Weight zeropoint must be zero for non int8_t data");

Kevin Cheng

2021-10-14 17:09:57 -0700

[diff] [blame]

1859

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

return 0;

}

James Ward

2023-01-18 14:51:25 +0000

[diff] [blame]

1863

template <DType InDtype, DType WeightDtype, DType OutDtype>

1864

int OpTransposeConv2d<InDtype, WeightDtype, OutDtype>::eval()

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

1865

{

1866

int in_batch = this->input->getShape()[0];

1867

int in_height = this->input->getShape()[1];

1868

int in_width = this->input->getShape()[2];

1869

int in_channels = this->input->getShape()[3];

1870

1871

int f_out_channels = this->weight->getShape()[0];

1872

int f_height = this->weight->getShape()[1];

1873

int f_width = this->weight->getShape()[2];

1874

int f_in_channels = this->weight->getShape()[3];

1875

1876

int b_out_channels = this->bias->getShape()[0];

1877

1878

int out_batch = this->output->getShape()[0];

1879

int out_height = this->output->getShape()[1];

1880

int out_width = this->output->getShape()[2];

1881

int out_channels = this->output->getShape()[3];

1882

TatWai Chong

2022-06-08 00:48:04 -0700

[diff] [blame]

1883

int out_pad_top = this->attribute->out_pad()[0];

1884

int out_pad_bottom = this->attribute->out_pad()[1];

1885

int out_pad_left = this->attribute->out_pad()[2];

1886

int out_pad_right = this->attribute->out_pad()[3];

Jeremy Johnson

2022-04-26 15:47:21 +0100

[diff] [blame]

1887

1888

int stride_h = this->attribute->stride()[0];

1889

int stride_w = this->attribute->stride()[1];

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

1890

Kevin Cheng

2021-06-29 15:32:19 -0700

[diff] [blame]

1891

ERROR_IF(in_batch != out_batch, "OpTransposeConv2d: tensor batch mismatch %d != %d", in_batch, out_batch);

1892

ERROR_IF(f_in_channels != in_channels, "OpTransposeConv2d: tensor input channel mismatch %d != %d", f_in_channels,

1893

in_channels);

1894

ERROR_IF(f_out_channels != out_channels, "OpTransposeConv2d: tensor output channel mismatch %d != %d",

1895

f_out_channels, out_channels);

1896

ERROR_IF(b_out_channels != out_channels, "OpDepthwiseConv2d: bias channels mismatch %d != %d", b_out_channels,

1897

out_channels);

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

1898

1899

DEBUG_INFO(OP,

1900

"perform OpTransposeConv2d, input.shape=[%d,%d,%d,%d], weight.shape=[%d,%d,%d,%d], "

James Ward

2023-01-18 14:51:25 +0000

[diff] [blame]

1901

"output.shape=[%d,%d,%d,%d], stride=[%d,%d], out_pad=[%d,%d,%d,%d]",

Jeremy Johnson

2022-04-26 15:47:21 +0100

[diff] [blame]

1902

in_batch, in_height, in_width, in_channels, f_height, f_width, f_out_channels, f_in_channels,

TatWai Chong

2022-06-08 00:48:04 -0700

[diff] [blame]

1903

out_batch, out_height, out_width, out_channels, stride_h, stride_w, out_pad_top,

James Ward

2023-01-18 14:51:25 +0000

[diff] [blame]

1904

out_pad_bottom, out_pad_left, out_pad_right);

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

1905

1906

TIn input_val = this->input->getTensor();

1907

TWeight weight_val = this->weight->getTensor();

Eric Kunze

2022-06-17 08:19:12 -0700

[diff] [blame]

1908

if (InDtype == DType_INT8 || WeightDtype == DType_INT8)

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

1909

{

Eric Kunze

2022-06-07 05:20:44 +0000

[diff] [blame]

1910

input_val = input_val - (InEigenType)attribute->input_zp();

1911

weight_val = weight_val - (WeightEigenType)attribute->weight_zp();

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

1912

}

1913

1914

Eigen::array<Eigen::Index, 4> reshape_dim;

1915

reshape_dim.fill(1);

1916

reshape_dim[3] = b_out_channels;

1917

1918

Eigen::array<Eigen::Index, 4> bcast;

1919

bcast[0] = out_batch;

1920

bcast[1] = out_height;

1921

bcast[2] = out_width;

1922

bcast[3] = 1;

1923

1924

// initialize with bias

1925

this->output->getTensor() = this->bias->getTensor().reshape(reshape_dim).broadcast(bcast);

1926

1927

int out_x_origin, out_y_origin;

1928

int out_x, out_y;

1929

1930

// reference implementation from: tensorflow/tensorflow/lite/kernels/internal/reference/reference_ops.h

1931

for (int ob = 0; ob < out_batch; ob++)

1932

{

1933

for (int ih = 0; ih < in_height; ih++)

1934

{

1935

for (int iw = 0; iw < in_width; iw++)

1936

{

Eric Kunze

c1a9783

2022-07-01 16:56:09 -0700

[diff] [blame]

1937

out_x_origin = iw * stride_w + out_pad_left;

1938

out_y_origin = ih * stride_h + out_pad_top;

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

1939

for (int ic = 0; ic < in_channels; ic++)

1940

{

1941

for (int fh = 0; fh < f_height; fh++)

1942

{

1943

for (int fw = 0; fw < f_width; fw++)

1944

{

Jeremy Johnson

2022-04-26 15:47:21 +0100

[diff] [blame]

1945

out_x = out_x_origin + fw;

1946

out_y = out_y_origin + fh;

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

1947

for (int oc = 0; oc < out_channels; oc++)

1948

{

1949

if ((out_x >= 0 && out_x < out_width) && (out_y >= 0 && out_y < out_height))

1950

{

1951

this->output->getTensor()(ob, out_y, out_x, oc) +=

James Ward

2022-08-12 20:48:56 +0100

[diff] [blame]

1952

(OutEigenType) ((AccEigenType)input_val(ob, ih, iw, ic) *

1953

(AccEigenType)weight_val(oc, fh, fw, ic));

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

}

}

}

}

}

}

}

}

James Ward

2023-01-18 14:51:25 +0000

[diff] [blame]

1963

if (OutDtype == DType_INT48)

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

1964

{

James Ward

2022-08-12 20:48:56 +0100

[diff] [blame]

1965

this->output->getTensor() = this->output->getTensor().cwiseMax((OutEigenType)AccQMin);

1966

this->output->getTensor() = this->output->getTensor().cwiseMin((OutEigenType)AccQMax);

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

1967

}

1968

1969

return GraphNode::eval();

1970

}

1971

1972

// template explicit instantiation

James Ward

2022-08-12 20:48:56 +0100

[diff] [blame]

1973

DEF_INSTANTIATE_RANK1_6_ONE_RANK_ONE_TYPE(OpArgMax, FP16);

James Ward

2022-10-19 12:20:31 +0100

[diff] [blame]

1974

DEF_INSTANTIATE_RANK1_6_ONE_RANK_ONE_TYPE(OpArgMax, BF16);

Jeremy Johnson

bc2a3db

2022-09-27 13:50:00 +0100

[diff] [blame]

1975

DEF_INSTANTIATE_RANK1_6_ONE_RANK_ONE_TYPE(OpArgMax, FP32);

Kevin Cheng

3a47857

2021-01-22 17:21:02 -0800

[diff] [blame]

1976

DEF_INSTANTIATE_RANK1_6_ONE_RANK_ONE_TYPE(OpArgMax, INT8);

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

1977

DEF_INSTANTIATE_RANK1_6_ONE_RANK_ONE_TYPE(OpArgMax, INT16);

1978

James Ward

2023-01-18 14:51:25 +0000

[diff] [blame]

1979

DEF_INSTANTIATE_TWO_TYPE(OpAvgPool2d, FP16, FP16);

1980

DEF_INSTANTIATE_TWO_TYPE(OpAvgPool2d, FP16, FP32);

1981

DEF_INSTANTIATE_TWO_TYPE(OpAvgPool2d, BF16, FP32);

1982

DEF_INSTANTIATE_TWO_TYPE(OpAvgPool2d, FP32, FP32);

1983

DEF_INSTANTIATE_TWO_TYPE(OpAvgPool2d, INT8, INT32);

1984

DEF_INSTANTIATE_TWO_TYPE(OpAvgPool2d, INT16, INT32);

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

1985

James Ward

2023-01-18 14:51:25 +0000

[diff] [blame]

1986

// [in_t, weight_t, out_t]

1987

DEF_INSTANTIATE_THREE_TYPE(OpConv2d, FP16, FP16, FP16);

1988

DEF_INSTANTIATE_THREE_TYPE(OpConv2d, FP16, FP16, FP32);

1989

DEF_INSTANTIATE_THREE_TYPE(OpConv2d, BF16, BF16, FP32);

1990

DEF_INSTANTIATE_THREE_TYPE(OpConv2d, FP32, FP32, FP32);

1991

DEF_INSTANTIATE_THREE_TYPE(OpConv2d, INT8, INT4, INT32);

1992

DEF_INSTANTIATE_THREE_TYPE(OpConv2d, INT8, INT8, INT32);

1993

DEF_INSTANTIATE_THREE_TYPE(OpConv2d, INT16, INT8, INT48);

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

1994

James Ward

2023-01-18 14:51:25 +0000

[diff] [blame]

1995

DEF_INSTANTIATE_THREE_TYPE(OpConv3d, FP16, FP16, FP16);

1996

DEF_INSTANTIATE_THREE_TYPE(OpConv3d, FP16, FP16, FP32);

1997

DEF_INSTANTIATE_THREE_TYPE(OpConv3d, BF16, BF16, FP32);

1998

DEF_INSTANTIATE_THREE_TYPE(OpConv3d, FP32, FP32, FP32);

1999

DEF_INSTANTIATE_THREE_TYPE(OpConv3d, INT8, INT4, INT32);

2000

DEF_INSTANTIATE_THREE_TYPE(OpConv3d, INT8, INT8, INT32);

2001

DEF_INSTANTIATE_THREE_TYPE(OpConv3d, INT16, INT8, INT48);

Kevin Cheng

2021-09-01 12:51:58 -0700

[diff] [blame]

2002

James Ward

2023-01-18 14:51:25 +0000

[diff] [blame]

2003

DEF_INSTANTIATE_THREE_TYPE(OpDepthwiseConv2d, FP16, FP16, FP16);

2004

DEF_INSTANTIATE_THREE_TYPE(OpDepthwiseConv2d, FP16, FP16, FP32);

2005

DEF_INSTANTIATE_THREE_TYPE(OpDepthwiseConv2d, BF16, BF16, FP32);

2006

DEF_INSTANTIATE_THREE_TYPE(OpDepthwiseConv2d, FP32, FP32, FP32);

2007

DEF_INSTANTIATE_THREE_TYPE(OpDepthwiseConv2d, INT8, INT4, INT32);

2008

DEF_INSTANTIATE_THREE_TYPE(OpDepthwiseConv2d, INT8, INT8, INT32);

2009

DEF_INSTANTIATE_THREE_TYPE(OpDepthwiseConv2d, INT16, INT8, INT48);

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

2010

Luke Hutton

2023-02-06 14:54:18 +0000

[diff] [blame]

2011

DEF_INSTANTIATE_ONE_TYPE(OpFFT2d, FP32);

2012

James Ward

2023-01-18 14:51:25 +0000

[diff] [blame]

2013

DEF_INSTANTIATE_THREE_TYPE(OpFullyConnected, FP16, FP16, FP16);

2014

DEF_INSTANTIATE_THREE_TYPE(OpFullyConnected, FP16, FP16, FP32);

2015

DEF_INSTANTIATE_THREE_TYPE(OpFullyConnected, BF16, BF16, FP32);

2016

DEF_INSTANTIATE_THREE_TYPE(OpFullyConnected, FP32, FP32, FP32);

2017

DEF_INSTANTIATE_THREE_TYPE(OpFullyConnected, INT8, INT4, INT32);

2018

DEF_INSTANTIATE_THREE_TYPE(OpFullyConnected, INT8, INT8, INT32);

2019

DEF_INSTANTIATE_THREE_TYPE(OpFullyConnected, INT16, INT8, INT48);

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

2020

James Ward

2023-01-18 14:51:25 +0000

[diff] [blame]

2021

DEF_INSTANTIATE_TWO_TYPE(OpMatMul, INT8, INT32);

2022

DEF_INSTANTIATE_TWO_TYPE(OpMatMul, INT16, INT48);

2023

DEF_INSTANTIATE_TWO_TYPE(OpMatMul, FP16, FP16);

2024

DEF_INSTANTIATE_TWO_TYPE(OpMatMul, FP16, FP32);

2025

DEF_INSTANTIATE_TWO_TYPE(OpMatMul, BF16, FP32);

2026

DEF_INSTANTIATE_TWO_TYPE(OpMatMul, FP32, FP32);

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

2027

James Ward

2022-08-12 20:48:56 +0100

[diff] [blame]

2028

DEF_INSTANTIATE_ONE_TYPE(OpMaxPool2d, FP16);

James Ward

2022-10-19 12:20:31 +0100

[diff] [blame]

2029

DEF_INSTANTIATE_ONE_TYPE(OpMaxPool2d, BF16);

Jeremy Johnson

bc2a3db

2022-09-27 13:50:00 +0100

[diff] [blame]

2030

DEF_INSTANTIATE_ONE_TYPE(OpMaxPool2d, FP32);

Kevin Cheng

3a47857

2021-01-22 17:21:02 -0800

[diff] [blame]

2031

DEF_INSTANTIATE_ONE_TYPE(OpMaxPool2d, INT8);

Eric Kunze

2020-10-13 16:11:07 -0700

[diff] [blame]

2032

DEF_INSTANTIATE_ONE_TYPE(OpMaxPool2d, INT16);

2033

Luke Hutton

2023-01-10 14:50:31 +0000

[diff] [blame]

2034

DEF_INSTANTIATE_ONE_TYPE(OpRFFT2d, FP32);

2035

James Ward