blob: 2bbd9452f229945d003fe858cf500d712427ebef [file] [log] [blame]
Georgios Pinitasd9769582017-08-03 10:19:40 +01001/*
Sheri Zhangac6499a2021-02-10 15:32:38 +00002 * Copyright (c) 2017-2021 Arm Limited.
Georgios Pinitasd9769582017-08-03 10:19:40 +01003 *
4 * SPDX-License-Identifier: MIT
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a copy
7 * of this software and associated documentation files (the "Software"), to
8 * deal in the Software without restriction, including without limitation the
9 * rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
10 * sell copies of the Software, and to permit persons to whom the Software is
11 * furnished to do so, subject to the following conditions:
12 *
13 * The above copyright notice and this permission notice shall be included in all
14 * copies or substantial portions of the Software.
15 *
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
19 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
21 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
22 * SOFTWARE.
23 */
Michalis Spyrouebcebf12020-10-21 00:04:14 +010024#include "src/core/NEON/kernels/NEReductionOperationKernel.h"
Georgios Pinitasd9769582017-08-03 10:19:40 +010025
26#include "arm_compute/core/Coordinates.h"
27#include "arm_compute/core/Helpers.h"
Georgios Pinitasd9769582017-08-03 10:19:40 +010028#include "arm_compute/core/ITensor.h"
John Richardson73d4aef2018-05-08 14:34:33 +010029#include "arm_compute/core/TensorInfo.h"
Luca Foschianiee939fb2020-01-28 10:38:07 +000030#include "arm_compute/core/Utils.h"
Georgios Pinitasd9769582017-08-03 10:19:40 +010031#include "arm_compute/core/Validate.h"
Michalis Spyrouaea14c62019-01-03 11:10:25 +000032#include "arm_compute/core/utils/misc/ShapeCalculator.h"
Sang-Hoon Park68dd25f2020-10-19 16:00:11 +010033#include "src/core/CPP/Validate.h"
Michalis Spyrouebcebf12020-10-21 00:04:14 +010034#include "src/core/NEON/INEKernel.h"
Georgios Pinitasddb93bb2020-10-02 16:38:59 +010035#include "src/core/NEON/NEMath.h"
Sang-Hoon Park68dd25f2020-10-19 16:00:11 +010036#include "src/core/helpers/AutoConfiguration.h"
37#include "src/core/helpers/WindowHelpers.h"
38#include "support/SaturateCast.h"
Georgios Pinitasd9769582017-08-03 10:19:40 +010039
Georgios Pinitasddb93bb2020-10-02 16:38:59 +010040#include "src/core/NEON/wrapper/wrapper.h"
Georgios Pinitasd9769582017-08-03 10:19:40 +010041#include <arm_neon.h>
42
Michalis Spyroubcf8a962018-10-12 10:51:31 +010043namespace arm_compute
44{
Georgios Pinitasd9769582017-08-03 10:19:40 +010045namespace
46{
// Narrows two saturated 16-bit accumulators back to 8-bit lanes (unsigned or
// signed depending on T), combines them into one 16-lane vector and stores the
// result at the output iterator position (plus an optional byte offset).
// Allows RedOpYZW_quantized to be templated over uint8_t/int8_t.
template <typename T>
void combine_and_store(int16x8_t t1, int16x8_t t2, Iterator &output, int offset = 0)
{
    if(!std::is_same<T, uint8_t>::value)
    {
        // Signed path: saturate to int8 and store through a signed pointer.
        const auto narrowed = wrapper::vcombine(wrapper::vqmovn(t1), wrapper::vqmovn(t2));
        wrapper::vstore(reinterpret_cast<int8_t *>(output.ptr() + offset), narrowed);
        return;
    }
    // Unsigned path: saturate to uint8.
    const auto narrowed = wrapper::vcombine(wrapper::vqmovun(t1), wrapper::vqmovun(t2));
    wrapper::vstore(output.ptr() + offset, narrowed);
}
62
// Updates the tracked argmin/argmax indices for four 32-bit lanes.
// a: candidate winners, b: previous winners, c: previously tracked indices.
// Lanes where the candidate beats the previous winner take index idx+lane
// (or a broadcast idx when reducing along an axis other than 0).
template <typename T>
uint32x4x4_t calculate_index(uint32_t idx, T a, T b, uint32x4x4_t c, ReductionOperation op, int axis)
{
    // Per-lane mask: all-ones where `a` wins against `b` for the requested op.
    const uint32x4_t mask = (op == ReductionOperation::ARG_IDX_MIN) ? wrapper::vcgt(b, a) : wrapper::vclt(b, a);

    uint32x4_t vec_idx = { idx, idx + 1, idx + 2, idx + 3 };
    if(axis != 0)
    {
        // Along non-X axes every lane belongs to the same reduced position.
        vec_idx = wrapper::vdup_n(idx, wrapper::traits::vector_128_tag{});
    }

    // Only the first vector of indices is used for 32-bit lane types.
    uint32x4x4_t selected = { { wrapper::vbsl(mask, vec_idx, c.val[0]), 0, 0, 0 } };
    return selected;
}
85
// Quantized (8-bit lane) variant of calculate_index: compares 16 lanes at once,
// so candidate indices are tracked in four uint32x4_t vectors.
// a: candidate winners, b: previous winners, c: previously tracked indices.
template <typename T>
uint32x4x4_t calculate_index_quantized(uint32_t idx, T a, T b, uint32x4x4_t c, ReductionOperation op, int axis)
{
    uint32x4x4_t mask{ { 0 } };
    uint8x16_t   mask_u8{ 0 };
    // Per-lane 8-bit mask (0xFF where `a` wins against `b` for the requested op).
    if(op == ReductionOperation::ARG_IDX_MIN)
    {
        mask_u8 = wrapper::vcgt(b, a);
    }
    else
    {
        mask_u8 = wrapper::vclt(b, a);
    }
    // Widen the 8-bit mask to four 32-bit masks: (x << lane_width) | x replicates
    // a 0xFF / 0x00 lane into an all-ones / all-zeros wider lane at each step.
    auto wide_u16_1 = wrapper::vorr(vshll_n_u8(wrapper::vgetlow(mask_u8), 8), wrapper::vmovl(wrapper::vgetlow(mask_u8)));
    auto wide_u16_2 = wrapper::vorr(vshll_n_u8(wrapper::vgethigh(mask_u8), 8), wrapper::vmovl(wrapper::vgethigh(mask_u8)));
    mask.val[0]     = wrapper::vorr(vshll_n_u16(wrapper::vgetlow(wide_u16_1), 16), wrapper::vmovl(wrapper::vgetlow(wide_u16_1)));
    mask.val[1]     = wrapper::vorr(vshll_n_u16(wrapper::vgethigh(wide_u16_1), 16), wrapper::vmovl(wrapper::vgethigh(wide_u16_1)));
    mask.val[2]     = wrapper::vorr(vshll_n_u16(wrapper::vgetlow(wide_u16_2), 16), wrapper::vmovl(wrapper::vgetlow(wide_u16_2)));
    mask.val[3]     = wrapper::vorr(vshll_n_u16(wrapper::vgethigh(wide_u16_2), 16), wrapper::vmovl(wrapper::vgethigh(wide_u16_2)));

    // Candidate indices: consecutive along X, broadcast idx for any other axis.
    uint32x4x4_t vec_idx = { { { idx + 0, idx + 1, idx + 2, idx + 3 },
                               { idx + 4, idx + 5, idx + 6, idx + 7 },
                               { idx + 8, idx + 9, idx + 10, idx + 11 },
                               { idx + 12, idx + 13, idx + 14, idx + 15 }
                             }
    };
    if(axis != 0)
    {
        vec_idx.val[0] = wrapper::vdup_n(idx, wrapper::traits::vector_128_tag{});
        vec_idx.val[1] = wrapper::vdup_n(idx, wrapper::traits::vector_128_tag{});
        vec_idx.val[2] = wrapper::vdup_n(idx, wrapper::traits::vector_128_tag{});
        vec_idx.val[3] = wrapper::vdup_n(idx, wrapper::traits::vector_128_tag{});
    }
    // Bit-select: winning lanes take the candidate index, losing lanes keep c.
    uint32x4x4_t res =
    {
        {
            vbslq_u32(mask.val[0], vec_idx.val[0], c.val[0]),
            vbslq_u32(mask.val[1], vec_idx.val[1], c.val[1]),
            vbslq_u32(mask.val[2], vec_idx.val[2], c.val[2]),
            vbslq_u32(mask.val[3], vec_idx.val[3], c.val[3])
        }
    };

    return res;
}
Usama Arifa4a08ad2019-05-20 12:38:33 +0100131
// Helper function to calculate the minimum value of the input vector. All the elements in the output vector contain the min value.
// 32-bit lane variant (float32x4_t / int32x4_t): two pairwise folds reduce four lanes.
template <typename T>
inline typename std::enable_if < std::is_same<T, float32x4_t>::value || std::is_same<T, int32x4_t>::value,
       typename std::conditional<std::is_same<T, float32x4_t>::value, float32x2_t, int32x2_t>::type >::type
       calculate_min(T in)
{
    const auto half_min = wrapper::vpmin(wrapper::vgethigh(in), wrapper::vgetlow(in));
    return wrapper::vpmin(half_min, half_min);
}
141
// Helper function to calculate the minimum value of the input vector. All the elements in the output vector contain the min value.
// 8-bit lane variant (uint8x16_t / int8x16_t): sixteen lanes need four pairwise folds.
template <typename T>
inline typename std::enable_if < std::is_same<T, uint8x16_t>::value || std::is_same<T, int8x16_t>::value,
       typename std::conditional<std::is_same<T, uint8x16_t>::value, uint8x8_t, int8x8_t>::type >::type
       calculate_min(T in)
{
    auto folded = wrapper::vpmin(wrapper::vgethigh(in), wrapper::vgetlow(in));
    for(int i = 0; i < 2; ++i)
    {
        folded = wrapper::vpmin(folded, folded);
    }
    return wrapper::vpmin(folded, folded);
}
153
// Helper function to calculate the maximum value of the input vector. All the elements in the output vector contain the max value.
// 32-bit lane variant (float32x4_t / int32x4_t): two pairwise folds reduce four lanes.
template <typename T>
inline typename std::enable_if < std::is_same<T, float32x4_t>::value || std::is_same<T, int32x4_t>::value,
       typename std::conditional<std::is_same<T, float32x4_t>::value, float32x2_t, int32x2_t>::type >::type
       calculate_max(T in)
{
    const auto half_max = wrapper::vpmax(wrapper::vgethigh(in), wrapper::vgetlow(in));
    return wrapper::vpmax(half_max, half_max);
}
Usama Arifa4a08ad2019-05-20 12:38:33 +0100163
// Helper function to calculate the maximum value of the input vector. All the elements in the output vector contain the max value.
// 8-bit lane variant (uint8x16_t / int8x16_t): sixteen lanes need four pairwise folds.
template <typename T>
inline typename std::enable_if < std::is_same<T, uint8x16_t>::value || std::is_same<T, int8x16_t>::value,
       typename std::conditional<std::is_same<T, uint8x16_t>::value, uint8x8_t, int8x8_t>::type >::type
       calculate_max(T in)
{
    auto folded = wrapper::vpmax(wrapper::vgethigh(in), wrapper::vgetlow(in));
    for(int i = 0; i < 2; ++i)
    {
        folded = wrapper::vpmax(folded, folded);
    }
    return wrapper::vpmax(folded, folded);
}
175
// Reduces the per-lane winning values and their tracked indices to the single
// scalar index of the overall min/max. The lowest index wins on ties.
template <typename T>
uint32_t calculate_vector_index(uint32x4x4_t vec_res_idx, T vec_res_value, ReductionOperation op)
{
    uint32x4_t res_idx_mask{ 0 };
    uint32x4_t mask_ones = vdupq_n_u32(0xFFFFFFFF);

    if(op == ReductionOperation::ARG_IDX_MIN)
    {
        // Keep indices only in lanes equal to the global minimum.
        auto pmin    = calculate_min(vec_res_value);
        auto mask    = wrapper::vceq(vec_res_value, wrapper::vcombine(pmin, pmin));
        res_idx_mask = wrapper::vand(vec_res_idx.val[0], mask);
    }
    else
    {
        // Keep indices only in lanes equal to the global maximum.
        auto pmax    = calculate_max(vec_res_value);
        auto mask    = wrapper::vceq(vec_res_value, wrapper::vcombine(pmax, pmax));
        res_idx_mask = wrapper::vand(vec_res_idx.val[0], mask);
    }

    // Adding 0xFFFFFFFF maps losing lanes (0) to UINT32_MAX and winning lanes to
    // (index - 1), so a pairwise minimum selects the smallest winning index.
    res_idx_mask = wrapper::vadd(res_idx_mask, mask_ones);
    auto pmin    = wrapper::vpmin(wrapper::vgethigh(res_idx_mask), wrapper::vgetlow(res_idx_mask));
    pmin         = wrapper::vpmin(pmin, pmin);
    uint32_t res = wrapper::vgetlane(pmin, 0);

    // Undo the bias (subtracting 0xFFFFFFFF == adding 1 modulo 2^32).
    return (res - 0xFFFFFFFF);
}
202
// Quantized (8-bit lane) variant of calculate_vector_index: sixteen lanes and
// four index vectors are reduced to the single scalar index of the overall
// min/max. The lowest index wins on ties.
template <typename T>
uint32_t calculate_vector_index_quantized(uint32x4x4_t vec_res_idx, T vec_res_value, ReductionOperation op)
{
    uint32x4x4_t res_idx_mask{ { 0 } };
    uint32x4_t   mask_ones = vdupq_n_u32(0xFFFFFFFF);
    uint8x16_t   mask_u8{ 0 };
    // 8-bit mask: 0xFF in lanes equal to the global min/max.
    if(op == ReductionOperation::ARG_IDX_MIN)
    {
        auto pmin = calculate_min(vec_res_value);
        mask_u8   = wrapper::vceq(vec_res_value, wrapper::vcombine(pmin, pmin));
    }
    else
    {
        auto pmax = calculate_max(vec_res_value);
        mask_u8   = wrapper::vceq(vec_res_value, wrapper::vcombine(pmax, pmax));
    }

    // Widen vectors: (x << lane_width) | x turns each 0xFF / 0x00 lane into an
    // all-ones / all-zeros 32-bit mask lane.
    auto wide_u16_1     = wrapper::vorr(vshll_n_u8(wrapper::vgetlow(mask_u8), 8), wrapper::vmovl(wrapper::vgetlow(mask_u8)));
    auto wide_u16_2     = wrapper::vorr(vshll_n_u8(wrapper::vgethigh(mask_u8), 8), wrapper::vmovl(wrapper::vgethigh(mask_u8)));
    auto wide_u32_1     = wrapper::vorr(vshll_n_u16(wrapper::vgetlow(wide_u16_1), 16), wrapper::vmovl(wrapper::vgetlow(wide_u16_1)));
    auto wide_u32_2     = wrapper::vorr(vshll_n_u16(wrapper::vgethigh(wide_u16_1), 16), wrapper::vmovl(wrapper::vgethigh(wide_u16_1)));
    auto wide_u32_3     = wrapper::vorr(vshll_n_u16(wrapper::vgetlow(wide_u16_2), 16), wrapper::vmovl(wrapper::vgetlow(wide_u16_2)));
    auto wide_u32_4     = wrapper::vorr(vshll_n_u16(wrapper::vgethigh(wide_u16_2), 16), wrapper::vmovl(wrapper::vgethigh(wide_u16_2)));
    // Keep only the indices of winning lanes, then bias by 0xFFFFFFFF so losing
    // lanes become UINT32_MAX and winning lanes become (index - 1).
    res_idx_mask.val[0] = wrapper::vand(vec_res_idx.val[0], wide_u32_1);
    res_idx_mask.val[1] = wrapper::vand(vec_res_idx.val[1], wide_u32_2);
    res_idx_mask.val[2] = wrapper::vand(vec_res_idx.val[2], wide_u32_3);
    res_idx_mask.val[3] = wrapper::vand(vec_res_idx.val[3], wide_u32_4);
    res_idx_mask.val[0] = wrapper::vadd(res_idx_mask.val[0], mask_ones);
    res_idx_mask.val[1] = wrapper::vadd(res_idx_mask.val[1], mask_ones);
    res_idx_mask.val[2] = wrapper::vadd(res_idx_mask.val[2], mask_ones);
    res_idx_mask.val[3] = wrapper::vadd(res_idx_mask.val[3], mask_ones);

    // Pairwise-minimum across all four vectors selects the smallest biased index.
    uint32_t res  = 0xFFFFFFFF;
    int      iter = 0;
    do
    {
        auto pmin = wrapper::vpmin(wrapper::vgethigh(res_idx_mask.val[iter]), wrapper::vgetlow(res_idx_mask.val[iter]));
        pmin      = wrapper::vpmin(pmin, pmin);
        res       = std::min(wrapper::vgetlane(pmin, 0), res);
        iter++;
    }
    while(iter < 4);

    // Undo the bias (subtracting 0xFFFFFFFF == adding 1 modulo 2^32).
    return (res - 0xFFFFFFFF);
}
Luca Foschianiee939fb2020-01-28 10:38:07 +0000249
Michalis Spyrouaea14c62019-01-03 11:10:25 +0000250#ifdef __ARM_FEATURE_FP16_VECTOR_ARITHMETIC
// FP16 specialization of calculate_index: compares eight half-precision lanes
// at once, tracking candidate indices in two uint32x4_t vectors.
// a: candidate winners, b: previous winners, c: previously tracked indices.
template <>
uint32x4x4_t calculate_index(uint32_t idx, float16x8_t a, float16x8_t b, uint32x4x4_t c, ReductionOperation op, int axis)
{
    uint32x4x2_t mask{ 0 };
    uint16x8_t   mask_u16{ 0 };
    if(op == ReductionOperation::ARG_IDX_MIN)
    {
        mask_u16 = wrapper::vcgt(b, a);
    }
    else
    {
        mask_u16 = wrapper::vclt(b, a);
    }
    // Widen each 0xFFFF/0x0000 16-bit mask lane to a full 32-bit all-ones/zeros
    // mask via (x << 16) | x, matching calculate_index_quantized. A plain vmovl
    // would produce 0x0000FFFF, making the bit-select below keep only the low
    // 16 bits of the candidate index (wrong for reduced dimensions >= 65536).
    mask.val[0] = wrapper::vorr(vshll_n_u16(wrapper::vgetlow(mask_u16), 16), wrapper::vmovl(wrapper::vgetlow(mask_u16)));
    mask.val[1] = wrapper::vorr(vshll_n_u16(wrapper::vgethigh(mask_u16), 16), wrapper::vmovl(wrapper::vgethigh(mask_u16)));
    // Candidate indices: consecutive along X, broadcast idx for any other axis.
    uint32x4x2_t vec_idx = { { { idx + 0, idx + 1, idx + 2, idx + 3 },
                               { idx + 4, idx + 5, idx + 6, idx + 7 }
                             }
    };
    if(axis != 0)
    {
        vec_idx.val[0] = wrapper::vdup_n(idx, wrapper::traits::vector_128_tag{});
        vec_idx.val[1] = wrapper::vdup_n(idx, wrapper::traits::vector_128_tag{});
    }
    // Bit-select: winning lanes take the candidate index, losing lanes keep c.
    uint32x4x4_t res = { wrapper::vbsl(mask.val[0], vec_idx.val[0], c.val[0]),
                         wrapper::vbsl(mask.val[1], vec_idx.val[1], c.val[1]),
                         0, 0
    };

    return res;
}
282
// Helper function to calculate the minimum value of the input vector. All the elements in the output vector contain the min value.
// FP16 variant: eight lanes need three pairwise folds.
inline float16x4_t calculate_min(float16x8_t in)
{
    auto folded = wrapper::vpmin(wrapper::vgethigh(in), wrapper::vgetlow(in));
    folded      = wrapper::vpmin(folded, folded);
    return wrapper::vpmin(folded, folded);
}
// Helper function to calculate the maximum value of the input vector. All the elements in the output vector contain the max value.
// FP16 variant: eight lanes need three pairwise folds.
inline float16x4_t calculate_max(float16x8_t in)
{
    auto folded = wrapper::vpmax(wrapper::vgethigh(in), wrapper::vgetlow(in));
    folded      = wrapper::vpmax(folded, folded);
    return wrapper::vpmax(folded, folded);
}
297
// FP16 specialization of calculate_vector_index: reduces eight half-precision
// winning lanes and their two tracked index vectors to the single scalar index
// of the overall min/max. The lowest index wins on ties.
template <>
uint32_t calculate_vector_index(uint32x4x4_t vec_res_idx, float16x8_t vec_res_value, ReductionOperation op)
{
    uint32x4x2_t res_idx_mask{ 0 };
    uint32x4_t   mask_ones = vdupq_n_u32(0xFFFFFFFF);
    uint16x8_t   mask_u16;
    // 16-bit mask: 0xFFFF in lanes equal to the global min/max.
    if(op == ReductionOperation::ARG_IDX_MIN)
    {
        auto pmin = calculate_min(vec_res_value);
        mask_u16  = wrapper::vceq(vec_res_value, wrapper::vcombine(pmin, pmin));
    }
    else
    {
        auto pmax = calculate_max(vec_res_value);
        mask_u16  = wrapper::vceq(vec_res_value, wrapper::vcombine(pmax, pmax));
    }

    // Widen vectors: (x << 16) | x turns each 0xFFFF/0x0000 lane into a full
    // 32-bit all-ones/zeros mask. The previous shift of 8 left the top byte
    // clear (0x00FFFFFF), truncating tracked indices to 24 bits; 16 matches the
    // widening pattern used by calculate_vector_index_quantized above.
    auto wide_u32_1     = wrapper::vorr(vshll_n_u16(wrapper::vgetlow(mask_u16), 16), wrapper::vmovl(wrapper::vgetlow(mask_u16)));
    auto wide_u32_2     = wrapper::vorr(vshll_n_u16(wrapper::vgethigh(mask_u16), 16), wrapper::vmovl(wrapper::vgethigh(mask_u16)));
    // Keep only the indices of winning lanes, then bias by 0xFFFFFFFF so losing
    // lanes become UINT32_MAX and winning lanes become (index - 1).
    res_idx_mask.val[0] = wrapper::vand(vec_res_idx.val[0], wide_u32_1);
    res_idx_mask.val[1] = wrapper::vand(vec_res_idx.val[1], wide_u32_2);
    res_idx_mask.val[0] = wrapper::vadd(res_idx_mask.val[0], mask_ones);
    res_idx_mask.val[1] = wrapper::vadd(res_idx_mask.val[1], mask_ones);

    // Pairwise-minimum across both vectors selects the smallest biased index.
    uint32_t res  = 0xFFFFFFFF;
    int      iter = 0;
    do
    {
        auto pmin = wrapper::vpmin(wrapper::vgethigh(res_idx_mask.val[iter]), wrapper::vgetlow(res_idx_mask.val[iter]));
        pmin      = wrapper::vpmin(pmin, pmin);
        res       = std::min(wrapper::vgetlane(pmin, 0), res);
        iter++;
    }
    while(iter < 2);

    // Undo the bias (subtracting 0xFFFFFFFF == adding 1 modulo 2^32).
    return (res - 0xFFFFFFFF);
}
336#endif // __ARM_FEATURE_FP16_VECTOR_ARITHMETIC
337
Georgios Pinitasd9769582017-08-03 10:19:40 +0100338template <class F>
339class Reducer
340{
341public:
Michalis Spyrouaea14c62019-01-03 11:10:25 +0000342 static void reduceX(const Window &window, const ITensor *input, ITensor *output, F f, const ReductionOperation op)
Georgios Pinitasd9769582017-08-03 10:19:40 +0100343 {
344 // Set out window
345 Window out_window(window);
Sheri Zhang4d91dc62020-09-23 11:22:50 +0100346 out_window.set(Window::DimX, Window::Dimension(0, 1, 1));
Georgios Pinitasd9769582017-08-03 10:19:40 +0100347
Sheri Zhang4d91dc62020-09-23 11:22:50 +0100348 f(window, out_window, input, output, op);
Michalis Spyroubcf8a962018-10-12 10:51:31 +0100349 }
Michalis Spyrouaea14c62019-01-03 11:10:25 +0000350 static void reduceY(const Window &window, const ITensor *input, ITensor *output, F f, const ReductionOperation op)
Michalis Spyroubcf8a962018-10-12 10:51:31 +0100351 {
352 // Set in window
353 Window in_window(window);
Michalis Spyrou2897e612018-11-20 18:38:29 +0000354 Window out_window(window);
Michalis Spyroubcf8a962018-10-12 10:51:31 +0100355
356 in_window.set(Window::DimY, Window::Dimension(0, 1, 1));
Michalis Spyrou2897e612018-11-20 18:38:29 +0000357 out_window.set(Window::DimY, Window::Dimension(0, output->info()->dimension(1), output->info()->dimension(1)));
Michalis Spyroubcf8a962018-10-12 10:51:31 +0100358
Sheri Zhang4d91dc62020-09-23 11:22:50 +0100359 f(in_window, out_window, input, output, 1, op);
Michalis Spyroubcf8a962018-10-12 10:51:31 +0100360 }
Michalis Spyrouaea14c62019-01-03 11:10:25 +0000361 static void reduceZ(const Window &window, const ITensor *input, ITensor *output, F f, const ReductionOperation op)
Michalis Spyroubcf8a962018-10-12 10:51:31 +0100362 {
363 // Set in window
364 Window in_window(window);
Michalis Spyrou2897e612018-11-20 18:38:29 +0000365 Window out_window(window);
Michalis Spyroubcf8a962018-10-12 10:51:31 +0100366
367 in_window.set(Window::DimZ, Window::Dimension(0, 1, 1));
Michalis Spyrou2897e612018-11-20 18:38:29 +0000368 out_window.set(Window::DimZ, Window::Dimension(0, output->info()->dimension(2), output->info()->dimension(2)));
Michalis Spyroubcf8a962018-10-12 10:51:31 +0100369
Sheri Zhang4d91dc62020-09-23 11:22:50 +0100370 f(in_window, out_window, input, output, 2, op);
Michalis Spyroubcf8a962018-10-12 10:51:31 +0100371 }
Michalis Spyrouaea14c62019-01-03 11:10:25 +0000372 static void reduceW(const Window &window, const ITensor *input, ITensor *output, F f, const ReductionOperation op)
Michalis Spyroubcf8a962018-10-12 10:51:31 +0100373 {
374 // Set in/out window
375 Window in_window(window);
376 Window out_window(window);
377
378 in_window.set(3, Window::Dimension(0, 1, 1));
379 out_window.set(3, Window::Dimension(0, 1, 1));
380
Sheri Zhang4d91dc62020-09-23 11:22:50 +0100381 f(in_window, out_window, input, output, 3, op);
Georgios Pinitasd9769582017-08-03 10:19:40 +0100382 }
383};
384
// Reduction along the X axis for non-quantized types (T = float/int lane type,
// S = number of lanes per 128-bit vector). Each window iteration reduces one
// full row to a single value (or index, for ARG_IDX_* ops).
template <typename T, int S>
struct RedOpX
{
    /** SIMD vector tag type. */
    using ExactTagType = typename wrapper::traits::neon_vector<T, S>::tag_type;

    inline void operator()(const Window &in_window, Window &out_window, const ITensor *in, ITensor *out, const ReductionOperation op)
    {
        const TensorInfo in_info        = *(in->info());
        const int        window_step_x  = 16 / sizeof(T);
        const auto       window_start_x = static_cast<int>(in_window.x().start());
        const auto       window_end_x   = static_cast<int>(in_window.x().end());

        // Collapse X so each loop iteration sees one whole row; X is traversed
        // manually below.
        Window in_win_no_pad = in_window;
        in_win_no_pad.set(Window::DimX, Window::Dimension(0, 1, 1));

        Iterator input(in, in_win_no_pad);
        Iterator output(out, out_window);

        execute_window_loop(in_win_no_pad, [&](const Coordinates &)
        {
            const auto input_ptr = reinterpret_cast<const T *>(input.ptr());

            // Neutral element for the accumulator: first element for min/max ops,
            // 1 for PROD, 0 for the sum-based ops.
            auto init_res_value = static_cast<T>(0.f);
            switch(op)
            {
                case ReductionOperation::ARG_IDX_MAX:
                case ReductionOperation::ARG_IDX_MIN:
                case ReductionOperation::MIN:
                case ReductionOperation::MAX:
                {
                    init_res_value = static_cast<T>(*input_ptr);
                    break;
                }
                case ReductionOperation::PROD:
                {
                    init_res_value = static_cast<T>(1.f);
                    break;
                }
                default:
                    break;
            }
            auto vec_res_value = wrapper::vdup_n(init_res_value, ExactTagType{});
            uint32x4x4_t vec_res_idx{ { 0 } };

            // Compute window_step_x elements per iteration
            int x = window_start_x;
            for(; x <= (window_end_x - window_step_x); x += window_step_x)
            {
                const auto vec_elements = wrapper::vloadq(input_ptr + x);
                switch(op)
                {
                    case ReductionOperation::SUM_SQUARE:
                        vec_res_value = wrapper::vadd(wrapper::vmul(vec_elements, vec_elements), vec_res_value);
                        break;
                    case ReductionOperation::MEAN_SUM:
                    case ReductionOperation::SUM:
                        vec_res_value = wrapper::vadd(vec_elements, vec_res_value);
                        break;
                    case ReductionOperation::PROD:
                        vec_res_value = wrapper::vmul(vec_elements, vec_res_value);
                        break;
                    case ReductionOperation::ARG_IDX_MIN:
                    {
                        // Track both the winning values and their indices.
                        auto temp_vec_res_value = wrapper::vmin(vec_elements, vec_res_value);
                        vec_res_idx   = calculate_index<decltype(vec_res_value)>(x, temp_vec_res_value, vec_res_value, vec_res_idx, op, 0);
                        vec_res_value = temp_vec_res_value;
                        break;
                    }
                    case ReductionOperation::ARG_IDX_MAX:
                    {
                        auto temp_vec_res_value = wrapper::vmax(vec_elements, vec_res_value);
                        vec_res_idx   = calculate_index<decltype(vec_res_value)>(x, temp_vec_res_value, vec_res_value, vec_res_idx, op, 0);
                        vec_res_value = temp_vec_res_value;
                        break;
                    }
                    case ReductionOperation::MIN:
                    {
                        vec_res_value = wrapper::vmin(vec_elements, vec_res_value);
                        break;
                    }
                    case ReductionOperation::MAX:
                    {
                        vec_res_value = wrapper::vmax(vec_elements, vec_res_value);
                        break;
                    }
                    default:
                        ARM_COMPUTE_ERROR("Not supported");
                }
            }

            // Horizontal reduction of the vector accumulator, then scalar handling
            // of the leftover tail elements.
            switch(op)
            {
                case ReductionOperation::SUM:
                case ReductionOperation::MEAN_SUM:
                case ReductionOperation::SUM_SQUARE:
                {
                    auto carry_res = wrapper::vpadd(wrapper::vgethigh(vec_res_value), wrapper::vgetlow(vec_res_value));
                    for(int i = 0; i < S / 4; ++i)
                    {
                        carry_res = wrapper::vpadd(carry_res, carry_res);
                    }
                    auto res = wrapper::vgetlane(carry_res, 0);

                    if(op == ReductionOperation::SUM_SQUARE)
                    {
                        // Compute left-over elements
                        for(; x < window_end_x; ++x)
                        {
                            res += (*(input_ptr + x)) * (*(input_ptr + x));
                        }
                    }
                    else
                    {
                        // Compute left-over elements
                        for(; x < window_end_x; ++x)
                        {
                            res += *(input_ptr + x);
                        }
                    }

                    if(op == ReductionOperation::MEAN_SUM)
                    {
                        // Divide by the reduced dimension length to get the mean.
                        res /= in_info.dimension(0);
                    }

                    *(reinterpret_cast<T *>(output.ptr())) = res;
                    break;
                }
                case ReductionOperation::PROD:
                {
                    auto carry_res = wrapper::vmul(wrapper::vgethigh(vec_res_value), wrapper::vgetlow(vec_res_value));
                    T    res       = 1;
                    for(int i = 0; i < S / 2; ++i)
                    {
                        res *= wrapper::vgetlane(carry_res, i);
                    }

                    // Compute left-over elements
                    for(; x < window_end_x; ++x)
                    {
                        res *= *(input_ptr + x);
                    }

                    *(reinterpret_cast<T *>(output.ptr())) = res;
                    break;
                }
                case ReductionOperation::ARG_IDX_MIN:
                {
                    auto idx = calculate_vector_index<decltype(vec_res_value)>(vec_res_idx, vec_res_value, op);
                    auto res = static_cast<T>(wrapper::vgetlane(calculate_min(vec_res_value), 0));

                    // Compute left-over elements
                    for(; x < window_end_x; ++x)
                    {
                        if(*(input_ptr + x) < res)
                        {
                            idx = x;
                            res = *(input_ptr + x);
                        }
                    }
                    // ARG_IDX_* ops write a uint32 index, not a value of type T.
                    *(reinterpret_cast<uint32_t *>(output.ptr())) = idx;
                    break;
                }
                case ReductionOperation::ARG_IDX_MAX:
                {
                    auto idx = calculate_vector_index<decltype(vec_res_value)>(vec_res_idx, vec_res_value, op);
                    auto res = static_cast<T>(wrapper::vgetlane(calculate_max(vec_res_value), 0));

                    // Compute left-over elements
                    for(; x < window_end_x; ++x)
                    {
                        if(*(input_ptr + x) > res)
                        {
                            idx = x;
                            res = *(input_ptr + x);
                        }
                    }
                    *(reinterpret_cast<uint32_t *>(output.ptr())) = idx;
                    break;
                }
                case ReductionOperation::MIN:
                {
                    auto res = static_cast<T>(wrapper::vgetlane(calculate_min(vec_res_value), 0));

                    // Compute left-over elements
                    for(; x < window_end_x; ++x)
                    {
                        res = *(input_ptr + x) < res ? *(input_ptr + x) : res;
                    }
                    *(reinterpret_cast<T *>(output.ptr())) = res;
                    break;
                }
                case ReductionOperation::MAX:
                {
                    auto res = static_cast<T>(wrapper::vgetlane(calculate_max(vec_res_value), 0));

                    // Compute left-over elements
                    for(; x < window_end_x; ++x)
                    {
                        res = *(input_ptr + x) > res ? *(input_ptr + x) : res;
                    }
                    *(reinterpret_cast<T *>(output.ptr())) = res;
                    break;
                }
                default:
                    ARM_COMPUTE_ERROR("Not supported");
            }
        },
        input, output);
    }
};
597
Luca Foschianiee939fb2020-01-28 10:38:07 +0000598template <typename T>
Sheri Zhang4d91dc62020-09-23 11:22:50 +0100599struct RedOpX_quantized
Michalis Spyroubcf8a962018-10-12 10:51:31 +0100600{
Pablo Marquez Telloe81825b2021-03-23 15:47:47 +0000601 using PromotedType = typename wrapper::traits::promote<typename wrapper::traits::promote<T>::type>::type;
602
603 using vtype = decltype(wrapper::vdup_n(static_cast<PromotedType>(0.f), wrapper::traits::vector_128_tag{}));
604 using stype = decltype(vdupq_n_f32(static_cast<float>(1.f)));
605 using rtype = typename wrapper::traits::neon_vector<T, 16>::type;
606
    // Accumulates one full 16-lane vector of quantized input at *ptr into the
    // running accumulators, according to op:
    //  - SUM/MEAN_SUM: widen 8-bit lanes to 32-bit and add into vec_res_value1..4
    //  - PROD:         dequantize to float and multiply into vec_res_value1_f..4_f
    //  - ARG_IDX_*/MIN/MAX: update vec_res_value (and vec_res_idx for ARG_IDX_*)
    // x is the current element index along the reduced axis (used for index tracking).
    void vprocess(int x, const T *ptr, const ReductionOperation op, const UniformQuantizationInfo &iq_info,
                  vtype &vec_res_value1, vtype &vec_res_value2, vtype &vec_res_value3, vtype &vec_res_value4,

                  stype &vec_res_value1_f,
                  stype &vec_res_value2_f,
                  stype &vec_res_value3_f,
                  stype &vec_res_value4_f,
                  uint32x4x4_t &vec_res_idx,

                  rtype &vec_res_value)

    {
        const auto vec_elements = wrapper::vloadq(ptr);

        switch(op)
        {
            case ReductionOperation::SUM:
            case ReductionOperation::MEAN_SUM:
            {
                // Widen 8-bit -> 16-bit -> 32-bit so sums cannot overflow per step.
                const auto temp16x8t_1 = wrapper::vmovl(wrapper::vgetlow(vec_elements));
                const auto temp16x8t_2 = wrapper::vmovl(wrapper::vgethigh(vec_elements));

                const auto temp32x4t_1 = wrapper::vmovl(wrapper::vgetlow(temp16x8t_1));
                const auto temp32x4t_2 = wrapper::vmovl(wrapper::vgethigh(temp16x8t_1));
                const auto temp32x4t_3 = wrapper::vmovl(wrapper::vgetlow(temp16x8t_2));
                const auto temp32x4t_4 = wrapper::vmovl(wrapper::vgethigh(temp16x8t_2));

                vec_res_value1 = wrapper::vadd(temp32x4t_1, vec_res_value1);
                vec_res_value2 = wrapper::vadd(temp32x4t_2, vec_res_value2);
                vec_res_value3 = wrapper::vadd(temp32x4t_3, vec_res_value3);
                vec_res_value4 = wrapper::vadd(temp32x4t_4, vec_res_value4);
                break;
            }
            case ReductionOperation::PROD:
            {
                const auto offset32x4f_4 = vdupq_n_f32(iq_info.offset);
                const auto scale32x4f_4  = vdupq_n_f32(iq_info.scale);

                // Widen 8-bit -> 32-bit, then convert to float for the product.
                const auto temp16x8t_1 = wrapper::vmovl(wrapper::vgetlow(vec_elements));
                const auto temp16x8t_2 = wrapper::vmovl(wrapper::vgethigh(vec_elements));

                const auto temp32x4t_1 = wrapper::vmovl(wrapper::vgetlow(temp16x8t_1));
                const auto temp32x4t_2 = wrapper::vmovl(wrapper::vgethigh(temp16x8t_1));
                const auto temp32x4t_3 = wrapper::vmovl(wrapper::vgetlow(temp16x8t_2));
                const auto temp32x4t_4 = wrapper::vmovl(wrapper::vgethigh(temp16x8t_2));

                auto temp32x4f_1 = wrapper::vcvt<float>(temp32x4t_1);
                auto temp32x4f_2 = wrapper::vcvt<float>(temp32x4t_2);
                auto temp32x4f_3 = wrapper::vcvt<float>(temp32x4t_3);
                auto temp32x4f_4 = wrapper::vcvt<float>(temp32x4t_4);

                //de-quantize vec_elements
                temp32x4f_1 = vmulq_f32(vsubq_f32(temp32x4f_1, offset32x4f_4), scale32x4f_4);
                temp32x4f_2 = vmulq_f32(vsubq_f32(temp32x4f_2, offset32x4f_4), scale32x4f_4);
                temp32x4f_3 = vmulq_f32(vsubq_f32(temp32x4f_3, offset32x4f_4), scale32x4f_4);
                temp32x4f_4 = vmulq_f32(vsubq_f32(temp32x4f_4, offset32x4f_4), scale32x4f_4);

                vec_res_value1_f = vmulq_f32(temp32x4f_1, vec_res_value1_f);
                vec_res_value2_f = vmulq_f32(temp32x4f_2, vec_res_value2_f);
                vec_res_value3_f = vmulq_f32(temp32x4f_3, vec_res_value3_f);
                vec_res_value4_f = vmulq_f32(temp32x4f_4, vec_res_value4_f);
                break;
            }
            case ReductionOperation::ARG_IDX_MIN:
            {
                // Track both winning values and their indices.
                auto temp_vec_res_value = wrapper::vmin(vec_elements, vec_res_value);
                vec_res_idx   = calculate_index_quantized<decltype(vec_res_value)>(x, temp_vec_res_value, vec_res_value, vec_res_idx, op, 0);
                vec_res_value = temp_vec_res_value;
                break;
            }
            case ReductionOperation::ARG_IDX_MAX:
            {
                auto temp_vec_res_value = wrapper::vmax(vec_elements, vec_res_value);
                vec_res_idx   = calculate_index_quantized<decltype(vec_res_value)>(x, temp_vec_res_value, vec_res_value, vec_res_idx, op, 0);
                vec_res_value = temp_vec_res_value;
                break;
            }
            case ReductionOperation::MIN:
            {
                vec_res_value = wrapper::vmin(vec_elements, vec_res_value);
                break;
            }
            case ReductionOperation::MAX:
            {
                vec_res_value = wrapper::vmax(vec_elements, vec_res_value);
                break;
            }
            default:
                ARM_COMPUTE_ERROR("Not supported");
        }
    }
    /** Finalise an x-axis reduction over quantized data and handle the scalar tail.
     *
     * Collapses the SIMD accumulators filled by the vectorised main loop into a single
     * scalar, folds in the remaining elements in [x, window_end_x) one at a time, and
     * writes the final reduced value (or arg-index) through @p output.
     *
     * @param x                First element index NOT processed by the vector loop.
     * @param window_end_x     End (exclusive) of the row being reduced.
     * @param input_ptr        Pointer to the beginning of the input row.
     * @param output           Output iterator positioned at the destination element.
     * @param op               Reduction operation being finalised.
     * @param in_info          Input tensor info; dimension(0) is the reduced extent.
     * @param iq_info          Uniform quantization info of the input tensor.
     * @param vec_res_value1   Widened integer accumulator 1 (SUM / MEAN_SUM path).
     * @param vec_res_value2   Widened integer accumulator 2 (SUM / MEAN_SUM path).
     * @param vec_res_value3   Widened integer accumulator 3 (SUM / MEAN_SUM path).
     * @param vec_res_value4   Widened integer accumulator 4 (SUM / MEAN_SUM path).
     * @param vec_res_value1_f Float accumulator 1 (PROD path, de-quantized domain).
     * @param vec_res_value2_f Float accumulator 2 (PROD path, de-quantized domain).
     * @param vec_res_value3_f Float accumulator 3 (PROD path, de-quantized domain).
     * @param vec_res_value4_f Float accumulator 4 (PROD path, de-quantized domain).
     * @param vec_res_idx      Per-lane candidate indices (ARG_IDX_MIN / ARG_IDX_MAX path).
     * @param vec_res_value    Vector of candidate values (MIN / MAX / ARG_IDX_* path).
     */
    void leftover_process(int x, int window_end_x, const T *input_ptr, Iterator output, const ReductionOperation op, const TensorInfo in_info,
                          const UniformQuantizationInfo &iq_info,
                          vtype &vec_res_value1, vtype &vec_res_value2, vtype &vec_res_value3, vtype &vec_res_value4,

                          stype &vec_res_value1_f,
                          stype &vec_res_value2_f,
                          stype &vec_res_value3_f,
                          stype &vec_res_value4_f,
                          uint32x4x4_t &vec_res_idx,

                          rtype &vec_res_value)

    {
        switch(op)
        {
            case ReductionOperation::ARG_IDX_MIN:
            {
                // Reduce the per-lane (index, value) candidates to a single scalar pair
                auto idx = calculate_vector_index_quantized<decltype(vec_res_value)>(vec_res_idx, vec_res_value, op);
                auto res = static_cast<T>(wrapper::vgetlane(calculate_min(vec_res_value), 0));

                // Compute left-over elements
                for(; x < window_end_x; ++x)
                {
                    if(*(input_ptr + x) < res)
                    {
                        idx = x;
                        res = *(input_ptr + x);
                    }
                }
                // Output of ARG_IDX_* is the 32-bit index, not the value
                *(reinterpret_cast<uint32_t *>(output.ptr())) = idx;
                break;
            }
            case ReductionOperation::ARG_IDX_MAX:
            {
                // Reduce the per-lane (index, value) candidates to a single scalar pair
                auto idx = calculate_vector_index_quantized<decltype(vec_res_value)>(vec_res_idx, vec_res_value, op);
                auto res = static_cast<T>(wrapper::vgetlane(calculate_max(vec_res_value), 0));

                // Compute left-over elements
                for(; x < window_end_x; ++x)
                {
                    if(*(input_ptr + x) > res)
                    {
                        idx = x;
                        res = *(input_ptr + x);
                    }
                }
                // Output of ARG_IDX_* is the 32-bit index, not the value
                *(reinterpret_cast<uint32_t *>(output.ptr())) = idx;
                break;
            }
            case ReductionOperation::MIN:
            {
                auto res = static_cast<T>(wrapper::vgetlane(calculate_min(vec_res_value), 0));

                // Compute left-over elements
                for(; x < window_end_x; ++x)
                {
                    res = *(input_ptr + x) < res ? *(input_ptr + x) : res;
                }
                *(reinterpret_cast<T *>(output.ptr())) = res;
                break;
            }
            case ReductionOperation::MAX:
            {
                auto res = static_cast<T>(wrapper::vgetlane(calculate_max(vec_res_value), 0));

                // Compute left-over elements
                for(; x < window_end_x; ++x)
                {
                    res = *(input_ptr + x) > res ? *(input_ptr + x) : res;
                }
                *(reinterpret_cast<T *>(output.ptr())) = res;
                break;
            }
            case ReductionOperation::PROD:
            {
                // Horizontal product: combine the four float accumulators, then the four lanes
                auto carry_res = wrapper::vmul(vec_res_value1_f, vec_res_value2_f);
                carry_res = wrapper::vmul(carry_res, vec_res_value3_f);
                carry_res = wrapper::vmul(carry_res, vec_res_value4_f);

                float res = wrapper::vgetlane(carry_res, 0);
                res *= wrapper::vgetlane(carry_res, 1);
                res *= wrapper::vgetlane(carry_res, 2);
                res *= wrapper::vgetlane(carry_res, 3);

                // Compute left-over elements
                for(; x < window_end_x; ++x)
                {
                    //de-quantize input
                    if(std::is_same<T, uint8_t>::value)
                    {
                        res *= dequantize_qasymm8(*(input_ptr + x), iq_info);
                    }
                    else
                    {
                        res *= dequantize_qasymm8_signed(*(input_ptr + x), iq_info);
                    }
                }

                //re-quantize result
                if(std::is_same<T, uint8_t>::value)
                {
                    res = quantize_qasymm8(res, iq_info);
                }
                else
                {
                    res = quantize_qasymm8_signed(res, iq_info);
                }

                *reinterpret_cast<T *>(output.ptr()) = static_cast<T>(res);
                break;
            }
            case ReductionOperation::SUM:
            case ReductionOperation::MEAN_SUM:
            {
                // Horizontal add: combine the four widened accumulators, then pairwise-add lanes
                auto carry_res = wrapper::vadd(vec_res_value1, vec_res_value2);
                carry_res = wrapper::vadd(carry_res, vec_res_value3);
                carry_res = wrapper::vadd(carry_res, vec_res_value4);

                auto carry_paddition = wrapper::vpadd(wrapper::vgethigh(carry_res), wrapper::vgetlow(carry_res));
                carry_paddition = wrapper::vpadd(carry_paddition, carry_paddition);
                auto res = static_cast<int32_t>(wrapper::vgetlane(carry_paddition, 0));

                // Compute left-over elements
                for(; x < window_end_x; ++x)
                {
                    res += *(input_ptr + x);
                }

                if(op == ReductionOperation::MEAN_SUM)
                {
                    // Integer division by the reduced extent gives the (still quantized) mean
                    res /= static_cast<int32_t>(in_info.dimension(0));
                }
                else
                {
                    // Subtract accumulated offsets
                    res -= (in_info.dimension(0) - 1) * iq_info.offset;
                }
                *reinterpret_cast<T *>(output.ptr()) = utils::cast::saturate_cast<T>(res);
                break;
            }
            default:
                ARM_COMPUTE_ERROR("Not supported");
        }
    }
842
    /** Run the x-axis reduction over quantized data for the given window.
     *
     * For each row, the vectorised loop (vprocess) consumes window_step_x elements
     * per iteration into SIMD accumulators; leftover_process() then finishes the
     * scalar tail and writes the single reduced result for the row.
     *
     * @param in_window  Execution window of the input; its x range spans the reduced axis.
     * @param out_window Execution window of the output.
     * @param in         Input tensor.
     * @param out        Output tensor.
     * @param op         Reduction operation to perform.
     */
    inline void operator()(const Window &in_window, Window &out_window, const ITensor *in, ITensor *out, const ReductionOperation op)
    {
        // Promote twice: 8-bit element -> 16-bit -> 32-bit accumulator lane type
        using PromotedType = typename wrapper::traits::promote<typename wrapper::traits::promote<T>::type>::type;

        const TensorInfo in_info = *(in->info());
        const UniformQuantizationInfo iq_info = in_info.quantization_info().uniform();

        const int window_step_x = 16 / sizeof(T);
        const auto window_start_x = static_cast<int>(in_window.x().start());
        const auto window_end_x = static_cast<int>(in_window.x().end());

        // Collapse the x dimension: the whole row is reduced inside one loop-body invocation
        Window in_win_no_pad = in_window;
        in_win_no_pad.set(Window::DimX, Window::Dimension(0, 1, 1));

        Iterator input(in, in_win_no_pad);
        Iterator output(out, out_window);

        execute_window_loop(in_win_no_pad, [&](const Coordinates &)
        {
            const auto input_ptr = reinterpret_cast<T *>(input.ptr());

            // Integer accumulators (SUM / MEAN_SUM), zero-initialised
            auto vec_res_value1 = wrapper::vdup_n(static_cast<PromotedType>(0.f), wrapper::traits::vector_128_tag{});
            auto vec_res_value2 = wrapper::vdup_n(static_cast<PromotedType>(0.f), wrapper::traits::vector_128_tag{});
            auto vec_res_value3 = wrapper::vdup_n(static_cast<PromotedType>(0.f), wrapper::traits::vector_128_tag{});
            auto vec_res_value4 = wrapper::vdup_n(static_cast<PromotedType>(0.f), wrapper::traits::vector_128_tag{});

            // Float accumulators (PROD): neutral element 1
            auto vec_res_value1_f = vdupq_n_f32(static_cast<float>(1.f));
            auto vec_res_value2_f = vdupq_n_f32(static_cast<float>(1.f));
            auto vec_res_value3_f = vdupq_n_f32(static_cast<float>(1.f));
            auto vec_res_value4_f = vdupq_n_f32(static_cast<float>(1.f));

            typename wrapper::traits::neon_vector<T, 16>::type vec_res_value = { 0 };

            // Min/max style ops must be seeded with a real element, not zero
            if(op == ReductionOperation::ARG_IDX_MAX || op == ReductionOperation::ARG_IDX_MIN || op == ReductionOperation::MIN || op == ReductionOperation::MAX)
            {
                vec_res_value = wrapper::vdup_n(*input_ptr, wrapper::traits::vector_128_tag{});
            }

            uint32x4x4_t vec_res_idx{ { 0 } };
            // Compute window_step_x elements per iteration
            int x = window_start_x;
            for(; x <= (window_end_x - window_step_x); x += window_step_x)
            {
                vprocess(x, input_ptr + x, op, iq_info,
                         vec_res_value1, vec_res_value2, vec_res_value3, vec_res_value4,
                         vec_res_value1_f,
                         vec_res_value2_f,
                         vec_res_value3_f,
                         vec_res_value4_f,
                         vec_res_idx, vec_res_value);
            }
            // Finalise accumulators and fold in the scalar tail
            leftover_process(x, window_end_x, input_ptr, output, op, in_info, iq_info,
                             vec_res_value1, vec_res_value2, vec_res_value3, vec_res_value4,
                             vec_res_value1_f,
                             vec_res_value2_f,
                             vec_res_value3_f,
                             vec_res_value4_f,
                             vec_res_idx, vec_res_value);

        },
        input, output);
    }
905};
906
/** Reduction along a non-x axis (y/z/w) for non-quantized element types.
 *
 * Each x position is reduced independently across in_info.dimension(axis); the
 * vectorised loop handles window_step_x x-positions at once, the scalar loop
 * finishes the tail.
 *
 * @tparam T Element type.
 * @tparam S Number of elements per SIMD vector.
 */
template <typename T, int S>
struct RedOpYZW
{
    /** SIMD vector tag type. */
    using ExactTagType = typename wrapper::traits::neon_vector<T, S>::tag_type;
    using neon_vector = typename wrapper::traits::neon_vector<T, S>::type;

    /** Reduce @p in along @p axis into @p out using operation @p op. */
    inline void operator()(const Window &in_window, Window &out_window, const ITensor *in, ITensor *out, int axis, const ReductionOperation op)
    {
        const TensorInfo in_info = *(in->info());
        const int window_step_x = 16 / sizeof(T);
        const auto window_start_x_tmp = static_cast<int>(in_window.x().start());
        const auto window_end_x_tmp = static_cast<int>(in_window.x().end());
        // As the work is split over the x-axis, set the correct split window start and end.
        const auto window_start_x = static_cast<int>(0);
        const auto window_end_x = static_cast<int>(in_window.shape().x());

        Window in_win_no_pad = in_window;
        in_win_no_pad.set(Window::DimX, Window::Dimension(window_start_x_tmp, window_end_x_tmp, in_window.shape().x()));
        Window out_win_no_pad = out_window;
        out_win_no_pad.set(Window::DimX, Window::Dimension(window_start_x_tmp, window_end_x_tmp, out_window.shape().x()));

        Iterator input(in, in_win_no_pad);
        Iterator output(out, out_win_no_pad);

        execute_window_loop(in_win_no_pad, [&](const Coordinates &)
        {
            const auto input_ptr = reinterpret_cast<T *>(input.ptr());

            // Compute window_step_x elements per iteration
            int x = window_start_x;
            for(; x <= (window_end_x - window_step_x); x += window_step_x)
            {
                neon_vector vec_res_value = { 0 };
                // Initialise the accumulator with the op's neutral/seed value
                switch(op)
                {
                    case ReductionOperation::ARG_IDX_MAX:
                    case ReductionOperation::ARG_IDX_MIN:
                    case ReductionOperation::MIN:
                    case ReductionOperation::MAX:
                    {
                        // Seed min/max searches with the first slice's elements
                        vec_res_value = wrapper::vloadq(input_ptr + x);
                        break;
                    }
                    case ReductionOperation::PROD:
                    {
                        vec_res_value = wrapper::vdup_n(static_cast<T>(1.f), ExactTagType{});
                        break;
                    }
                    default:
                    {
                        vec_res_value = wrapper::vdup_n(static_cast<T>(0.f), ExactTagType{});
                        break;
                    }
                }
                uint32x4x4_t vec_res_idx{ { 0 } };

                // Walk along the reduced axis, accumulating one vector of x-positions
                for(unsigned int dim = 0; dim < in_info.dimension(axis); ++dim)
                {
                    const T *in_ptr = reinterpret_cast<T *>(input.ptr() + x * sizeof(T) + in_info.strides_in_bytes()[axis] * dim);
                    const auto vec_elements = wrapper::vloadq(in_ptr);
                    switch(op)
                    {
                        case ReductionOperation::SUM:
                        case ReductionOperation::MEAN_SUM:
                            vec_res_value = wrapper::vadd(vec_elements, vec_res_value);
                            break;
                        case ReductionOperation::SUM_SQUARE:
                            vec_res_value = wrapper::vadd(wrapper::vmul(vec_elements, vec_elements), vec_res_value);
                            break;
                        case ReductionOperation::PROD:
                            vec_res_value = wrapper::vmul(vec_elements, vec_res_value);
                            break;
                        case ReductionOperation::ARG_IDX_MIN:
                        {
                            auto temp_vec_res_value = wrapper::vmin(vec_elements, vec_res_value);
                            // Record the dim index for lanes where a new minimum appeared
                            vec_res_idx = calculate_index(dim, temp_vec_res_value, vec_res_value, vec_res_idx, op, axis);
                            vec_res_value = temp_vec_res_value;
                            break;
                        }
                        case ReductionOperation::ARG_IDX_MAX:
                        {
                            auto temp_vec_res_value = wrapper::vmax(vec_elements, vec_res_value);
                            // Record the dim index for lanes where a new maximum appeared
                            vec_res_idx = calculate_index(dim, temp_vec_res_value, vec_res_value, vec_res_idx, op, axis);
                            vec_res_value = temp_vec_res_value;
                            break;
                        }
                        case ReductionOperation::MIN:
                        {
                            vec_res_value = wrapper::vmin(vec_elements, vec_res_value);
                            break;
                        }
                        case ReductionOperation::MAX:
                        {
                            vec_res_value = wrapper::vmax(vec_elements, vec_res_value);
                            break;
                        }
                        default:
                            ARM_COMPUTE_ERROR("Not supported");
                    }
                }

                if(op == ReductionOperation::MEAN_SUM)
                {
                    // Multiply by the reciprocal of the reduced extent to get the mean
                    auto vec_width_inv = wrapper::vinv(wrapper::vdup_n(static_cast<T>(in_info.dimension(axis)), ExactTagType{}));
                    vec_res_value = wrapper::vmul(vec_res_value, vec_width_inv);
                }

                if(op == ReductionOperation::ARG_IDX_MIN || op == ReductionOperation::ARG_IDX_MAX)
                {
                    // ARG_IDX_* writes 32-bit indices
                    wrapper::vstore(reinterpret_cast<uint32_t *>(output.ptr()) + x, vec_res_idx.val[0]);
#ifdef __ARM_FEATURE_FP16_VECTOR_ARITHMETIC
                    // For fp16 (8 lanes) a second block of 4 indices is needed
                    if(std::is_same<T, float16_t>::value)
                    {
                        wrapper::vstore(reinterpret_cast<uint32_t *>(output.ptr()) + x + 4, vec_res_idx.val[1]);
                    }
#endif // __ARM_FEATURE_FP16_VECTOR_ARITHMETIC
                }
                else
                {
                    wrapper::vstore(reinterpret_cast<T *>(output.ptr() + x * sizeof(T)), vec_res_value);
                }
            }

            // Compute left-over elements
            for(; x < window_end_x; ++x)
            {
                // Scalar accumulator; seeded per-op as in the vector path
                auto res_value = 0.f;
                switch(op)
                {
                    case ReductionOperation::ARG_IDX_MAX:
                    case ReductionOperation::ARG_IDX_MIN:
                    case ReductionOperation::MIN:
                    case ReductionOperation::MAX:
                    {
                        res_value = *(input_ptr + x);
                        break;
                    }
                    case ReductionOperation::PROD:
                    {
                        res_value = static_cast<T>(1.f);
                        break;
                    }
                    default:
                    {
                        res_value = static_cast<T>(0.f);
                        break;
                    }
                }

                uint32_t res_idx = 0;
                for(unsigned int dim = 0; dim < in_info.dimension(axis); ++dim)
                {
                    const T *in_ptr = reinterpret_cast<T *>(input.ptr() + x * sizeof(T) + in_info.strides_in_bytes()[axis] * dim);

                    switch(op)
                    {
                        case ReductionOperation::SUM:
                        case ReductionOperation::MEAN_SUM:
                            res_value += *in_ptr;
                            break;
                        case ReductionOperation::SUM_SQUARE:
                            res_value += *in_ptr * *in_ptr;
                            break;
                        case ReductionOperation::PROD:
                            res_value *= *in_ptr;
                            break;
                        case ReductionOperation::ARG_IDX_MIN:
                        {
                            if(*in_ptr < res_value)
                            {
                                res_value = *in_ptr;
                                res_idx = dim;
                            }
                            break;
                        }
                        case ReductionOperation::ARG_IDX_MAX:
                        {
                            if(*in_ptr > res_value)
                            {
                                res_value = *in_ptr;
                                res_idx = dim;
                            }
                            break;
                        }
                        case ReductionOperation::MIN:
                        {
                            res_value = *in_ptr < res_value ? *in_ptr : res_value;
                            break;
                        }
                        case ReductionOperation::MAX:
                        {
                            res_value = *in_ptr > res_value ? *in_ptr : res_value;
                            break;
                        }
                        default:
                            ARM_COMPUTE_ERROR("Not supported");
                    }
                }

                if(op == ReductionOperation::MEAN_SUM)
                {
                    res_value /= in_info.dimension(axis);
                }

                if(op == ReductionOperation::ARG_IDX_MIN || op == ReductionOperation::ARG_IDX_MAX)
                {
                    *(reinterpret_cast<uint32_t *>(output.ptr()) + x) = res_idx;
                }
                else
                {
                    *(reinterpret_cast<T *>(output.ptr() + x * sizeof(T))) = res_value;
                }
            }
        },
        input, output);
    }
};
1125
/** SUM reduction along the z axis for complex (interleaved real/imaginary pair) data.
 *
 * Elements are stored as pairs, so every x position occupies 2 * sizeof(T) bytes
 * (see the `2 * x * sizeof(T)` addressing below). Only axis == 2 with
 * ReductionOperation::SUM is supported; both are enforced at runtime.
 *
 * @tparam T    Element component type.
 * @tparam S    Number of components per SIMD vector.
 * @tparam axis Reduction axis (must be 2).
 * @tparam op   Reduction operation (must be SUM).
 */
template <typename T, int S, int axis, ReductionOperation op>
struct RedOpYZW_complex
{
    /** SIMD vector tag type. */
    using ExactTagType = typename wrapper::traits::neon_vector<T, S>::tag_type;
    using neon_vector = typename wrapper::traits::neon_vector<T, S>::type;

    /** Sum @p in along the z axis into @p out (axis/op arguments are ignored; the template parameters rule). */
    inline void operator()(const Window &in_window, Window &out_window, const ITensor *in, ITensor *out, int, const ReductionOperation)
    {
        ARM_COMPUTE_ERROR_ON(axis != 2);
        ARM_COMPUTE_ERROR_ON(op != ReductionOperation::SUM);

        const TensorInfo in_info = *(in->info());
        const size_t stride_z = in_info.strides_in_bytes()[axis];
        const int window_step_x = 16 / sizeof(T);
        const auto window_start_x_tmp = static_cast<int>(in_window.x().start());
        const auto window_end_x_tmp = static_cast<int>(in_window.x().end());
        // As the work is split over the x-axis, set the correct split window start and end.
        const auto window_start_x = static_cast<int>(0);
        const auto window_end_x = static_cast<int>(in_window.shape().x());

        Window in_win_no_pad = in_window;
        in_win_no_pad.set(Window::DimX, Window::Dimension(window_start_x_tmp, window_end_x_tmp, in_window.shape().x()));
        Window out_win_no_pad = out_window;
        out_win_no_pad.set(Window::DimX, Window::Dimension(window_start_x_tmp, window_end_x_tmp, out_window.shape().x()));

        Iterator input(in, in_win_no_pad);
        Iterator output(out, out_win_no_pad);

        execute_window_loop(in_win_no_pad, [&](const Coordinates &)
        {
            // Compute window_step_x elements per iteration
            int x = window_start_x;
            for(; x <= (window_end_x - window_step_x); x += window_step_x)
            {
                neon_vector vec_res_value_0 = { 0 };
                neon_vector vec_res_value_1 = { 0 };

                vec_res_value_0 = wrapper::vdup_n(static_cast<T>(0.f), ExactTagType{});
                vec_res_value_1 = wrapper::vdup_n(static_cast<T>(0.f), ExactTagType{});

                T *out_ptr = reinterpret_cast<T *>(output.ptr() + 2 * x * sizeof(T));
                for(unsigned int dim = 0; dim < in_info.dimension(axis); ++dim)
                {
                    // Two adjacent 16-byte loads cover the interleaved pair components
                    T *in_ptr_0 = reinterpret_cast<T *>(input.ptr() + 2 * x * sizeof(T) + stride_z * dim);
                    T *in_ptr_1 = reinterpret_cast<T *>(input.ptr() + 2 * x * sizeof(T) + 16 + stride_z * dim);

                    const auto vec_elements_0 = wrapper::vloadq(in_ptr_0);
                    const auto vec_elements_1 = wrapper::vloadq(in_ptr_1);

                    vec_res_value_0 = wrapper::vadd(vec_elements_0, vec_res_value_0);
                    vec_res_value_1 = wrapper::vadd(vec_elements_1, vec_res_value_1);
                }

                wrapper::vstore(out_ptr, vec_res_value_0);
                wrapper::vstore(out_ptr + 4, vec_res_value_1);
            }

            // Compute left-over elements
            for(; x < window_end_x; ++x)
            {
                // Accumulate the two pair components of this x position separately
                auto res_value_0 = 0.f;
                auto res_value_1 = 0.f;

                T *out_ptr = reinterpret_cast<T *>(output.ptr() + 2 * x * sizeof(T));
                for(unsigned int dim = 0; dim < in_info.dimension(axis); ++dim)
                {
                    T *in_ptr = reinterpret_cast<T *>(input.ptr() + 2 * x * sizeof(T) + stride_z * dim);
                    res_value_0 += *in_ptr;
                    res_value_1 += *(in_ptr + 1);
                }
                *out_ptr = res_value_0;
                *(out_ptr + 1) = res_value_1;
            }
        },
        input, output);
    }
};
1204
1205template <typename T>
1206struct RedOpYZW_quantized
1207{
1208 inline void operator()(const Window &in_window, Window &out_window, const ITensor *in, ITensor *out, int axis, const ReductionOperation op)
1209 {
Georgios Pinitas412b7892020-11-11 21:05:24 +00001210 const TensorInfo in_info = *(in->info());
Sheri Zhang4d91dc62020-09-23 11:22:50 +01001211 const UniformQuantizationInfo iq_info = in_info.quantization_info().uniform();
Georgios Pinitas412b7892020-11-11 21:05:24 +00001212 using PromotedType = typename wrapper::traits::promote<typename wrapper::traits::promote<T>::type>::type;
Sheri Zhang4d91dc62020-09-23 11:22:50 +01001213
Georgios Pinitas412b7892020-11-11 21:05:24 +00001214 const int window_step_x = 16 / sizeof(T);
1215 const auto window_start_x_tmp = static_cast<int>(in_window.x().start());
1216 const auto window_end_x_tmp = static_cast<int>(in_window.x().end());
1217 // As it split over x-axis, need to set the correct spiltted window start and end.
1218 const auto window_start_x = static_cast<int>(0);
1219 const auto window_end_x = static_cast<int>(in_window.shape().x());
1220
1221 Window in_win_no_pad = in_window;
1222 in_win_no_pad.set(Window::DimX, Window::Dimension(window_start_x_tmp, window_end_x_tmp, in_window.shape().x()));
1223 Window out_win_no_pad = out_window;
1224 out_win_no_pad.set(Window::DimX, Window::Dimension(window_start_x_tmp, window_end_x_tmp, out_window.shape().x()));
1225
1226 Iterator input(in, in_win_no_pad);
1227 Iterator output(out, out_win_no_pad);
1228
1229 execute_window_loop(in_win_no_pad, [&](const Coordinates &)
Sheri Zhang4d91dc62020-09-23 11:22:50 +01001230 {
1231 const auto input_ptr = reinterpret_cast<T *>(input.ptr());
1232
1233 // Compute window_step_x elements per iteration
1234 int x = window_start_x;
1235 for(; x <= (window_end_x - window_step_x); x += window_step_x)
1236 {
1237 uint32x4x4_t vec_res_idx{ { 0 } };
1238 auto vec_res_value1 = wrapper::vdup_n(static_cast<PromotedType>(0), wrapper::traits::vector_128_tag{});
1239 auto vec_res_value2 = wrapper::vdup_n(static_cast<PromotedType>(0), wrapper::traits::vector_128_tag{});
1240 auto vec_res_value3 = wrapper::vdup_n(static_cast<PromotedType>(0), wrapper::traits::vector_128_tag{});
1241 auto vec_res_value4 = wrapper::vdup_n(static_cast<PromotedType>(0), wrapper::traits::vector_128_tag{});
1242
1243 auto vec_res_value1_f = wrapper::vdup_n(static_cast<float>(1), wrapper::traits::vector_128_tag{});
1244 auto vec_res_value2_f = wrapper::vdup_n(static_cast<float>(1), wrapper::traits::vector_128_tag{});
1245 auto vec_res_value3_f = wrapper::vdup_n(static_cast<float>(1), wrapper::traits::vector_128_tag{});
1246 auto vec_res_value4_f = wrapper::vdup_n(static_cast<float>(1), wrapper::traits::vector_128_tag{});
1247
1248 auto vec_res_value = wrapper::vloadq(input_ptr + x);
1249
1250 for(unsigned int index_dim = 0; index_dim < in_info.dimension(axis); ++index_dim)
1251 {
1252 const T *in_ptr = input_ptr + x + in_info.strides_in_bytes()[axis] * index_dim;
1253 const auto vec_elements = wrapper::vloadq(in_ptr);
1254 switch(op)
1255 {
1256 case ReductionOperation::SUM:
1257 case ReductionOperation::MEAN_SUM:
1258 {
1259 const auto temp16x8t_1 = wrapper::vmovl(wrapper::vgetlow(vec_elements));
1260 const auto temp16x8t_2 = wrapper::vmovl(wrapper::vgethigh(vec_elements));
1261
1262 const auto temp32x4t_1 = wrapper::vmovl(wrapper::vgetlow(temp16x8t_1));
1263 const auto temp32x4t_2 = wrapper::vmovl(wrapper::vgethigh(temp16x8t_1));
1264 const auto temp32x4t_3 = wrapper::vmovl(wrapper::vgetlow(temp16x8t_2));
1265 const auto temp32x4t_4 = wrapper::vmovl(wrapper::vgethigh(temp16x8t_2));
1266
1267 vec_res_value1 = wrapper::vadd(temp32x4t_1, vec_res_value1);
1268 vec_res_value2 = wrapper::vadd(temp32x4t_2, vec_res_value2);
1269 vec_res_value3 = wrapper::vadd(temp32x4t_3, vec_res_value3);
1270 vec_res_value4 = wrapper::vadd(temp32x4t_4, vec_res_value4);
1271 break;
1272 }
1273 case ReductionOperation::PROD:
1274 {
1275 const auto offset32x4f_4 = wrapper::vdup_n(static_cast<float>(iq_info.offset), wrapper::traits::vector_128_tag{});
1276 const auto scale32x4f_4 = wrapper::vdup_n(iq_info.scale, wrapper::traits::vector_128_tag{});
1277
1278 const auto temp16x8t_1 = wrapper::vmovl(wrapper::vgetlow(vec_elements));
1279 const auto temp16x8t_2 = wrapper::vmovl(wrapper::vgethigh(vec_elements));
1280
1281 const auto temp32x4t_1 = wrapper::vmovl(wrapper::vgetlow(temp16x8t_1));
1282 const auto temp32x4t_2 = wrapper::vmovl(wrapper::vgethigh(temp16x8t_1));
1283 const auto temp32x4t_3 = wrapper::vmovl(wrapper::vgetlow(temp16x8t_2));
1284 const auto temp32x4t_4 = wrapper::vmovl(wrapper::vgethigh(temp16x8t_2));
1285
1286 auto temp32x4f_1 = wrapper::vcvt<float>(temp32x4t_1);
1287 auto temp32x4f_2 = wrapper::vcvt<float>(temp32x4t_2);
1288 auto temp32x4f_3 = wrapper::vcvt<float>(temp32x4t_3);
1289 auto temp32x4f_4 = wrapper::vcvt<float>(temp32x4t_4);
1290
1291 //de-quantize vec_elements
1292 temp32x4f_1 = wrapper::vmul(wrapper::vsub(temp32x4f_1, offset32x4f_4), scale32x4f_4);
1293 temp32x4f_2 = wrapper::vmul(wrapper::vsub(temp32x4f_2, offset32x4f_4), scale32x4f_4);
1294 temp32x4f_3 = wrapper::vmul(wrapper::vsub(temp32x4f_3, offset32x4f_4), scale32x4f_4);
1295 temp32x4f_4 = wrapper::vmul(wrapper::vsub(temp32x4f_4, offset32x4f_4), scale32x4f_4);
1296
1297 vec_res_value1_f = wrapper::vmul(temp32x4f_1, vec_res_value1_f);
1298 vec_res_value2_f = wrapper::vmul(temp32x4f_2, vec_res_value2_f);
1299 vec_res_value3_f = wrapper::vmul(temp32x4f_3, vec_res_value3_f);
1300 vec_res_value4_f = wrapper::vmul(temp32x4f_4, vec_res_value4_f);
1301 break;
1302 }
1303 case ReductionOperation::ARG_IDX_MIN:
1304 {
1305 auto temp_vec_res_value = wrapper::vmin(vec_elements, vec_res_value);
1306 vec_res_idx = calculate_index_quantized(index_dim, temp_vec_res_value, vec_res_value, vec_res_idx, op, axis);
1307 vec_res_value = temp_vec_res_value;
1308 break;
1309 }
1310 case ReductionOperation::ARG_IDX_MAX:
1311 {
1312 auto temp_vec_res_value = wrapper::vmax(vec_elements, vec_res_value);
1313 vec_res_idx = calculate_index_quantized(index_dim, temp_vec_res_value, vec_res_value, vec_res_idx, op, axis);
1314 vec_res_value = temp_vec_res_value;
1315 break;
1316 }
1317 case ReductionOperation::MIN:
1318 {
1319 vec_res_value = wrapper::vmin(vec_elements, vec_res_value);
1320 break;
1321 }
1322 case ReductionOperation::MAX:
1323 {
1324 vec_res_value = wrapper::vmax(vec_elements, vec_res_value);
1325 break;
1326 }
1327 default:
1328 ARM_COMPUTE_ERROR("Not supported");
1329 }
1330 }
1331
1332 switch(op)
1333 {
1334 case ReductionOperation::ARG_IDX_MIN:
1335 case ReductionOperation::ARG_IDX_MAX:
1336 {
1337 wrapper::vstore(reinterpret_cast<uint32_t *>(output.ptr() + 4 * x), vec_res_idx.val[0]);
1338 wrapper::vstore(reinterpret_cast<uint32_t *>(output.ptr() + 4 * x) + 4, vec_res_idx.val[1]);
1339 wrapper::vstore(reinterpret_cast<uint32_t *>(output.ptr() + 4 * x) + 8, vec_res_idx.val[2]);
1340 wrapper::vstore(reinterpret_cast<uint32_t *>(output.ptr() + 4 * x) + 12, vec_res_idx.val[3]);
1341 break;
1342 }
1343 case ReductionOperation::MIN:
1344 case ReductionOperation::MAX:
1345 {
1346 wrapper::vstore(reinterpret_cast<T *>(output.ptr() + x), vec_res_value);
1347 break;
1348 }
1349 case ReductionOperation::SUM:
1350 {
1351 // Subtract offsets
1352 auto offsets = vdupq_n_s32((in_info.dimension(axis) - 1) * iq_info.offset);
1353
1354 auto vec_res_s_value1 = wrapper::vreinterpret(vec_res_value1);
1355 auto vec_res_s_value2 = wrapper::vreinterpret(vec_res_value2);
1356 auto vec_res_s_value3 = wrapper::vreinterpret(vec_res_value3);
1357 auto vec_res_s_value4 = wrapper::vreinterpret(vec_res_value4);
1358
1359 vec_res_s_value1 = wrapper::vsub(vec_res_s_value1, offsets);
1360 vec_res_s_value2 = wrapper::vsub(vec_res_s_value2, offsets);
1361 vec_res_s_value3 = wrapper::vsub(vec_res_s_value3, offsets);
1362 vec_res_s_value4 = wrapper::vsub(vec_res_s_value4, offsets);
1363
1364 const auto temp16x8t_1 = wrapper::vcombine(wrapper::vqmovn(vec_res_s_value1), wrapper::vqmovn(vec_res_s_value2));
1365 const auto temp16x8t_2 = wrapper::vcombine(wrapper::vqmovn(vec_res_s_value3), wrapper::vqmovn(vec_res_s_value4));
1366
1367 combine_and_store<T>(temp16x8t_1, temp16x8t_2, output, x);
1368 break;
1369 }
1370 case ReductionOperation::MEAN_SUM:
1371 {
1372 const auto vec_width_inv = wrapper::vinv(wrapper::vdup_n(static_cast<float>(in_info.dimension(axis)), wrapper::traits::vector_128_tag{}));
1373 vec_res_value1_f = wrapper::vmul(wrapper::vcvt<float>(vec_res_value1), vec_width_inv);
1374 vec_res_value2_f = wrapper::vmul(wrapper::vcvt<float>(vec_res_value2), vec_width_inv);
1375 vec_res_value3_f = wrapper::vmul(wrapper::vcvt<float>(vec_res_value3), vec_width_inv);
1376 vec_res_value4_f = wrapper::vmul(wrapper::vcvt<float>(vec_res_value4), vec_width_inv);
1377
1378 vec_res_value1 = wrapper::vcvt<T>(vec_res_value1_f);
1379 vec_res_value2 = wrapper::vcvt<T>(vec_res_value2_f);
1380 vec_res_value3 = wrapper::vcvt<T>(vec_res_value3_f);
1381 vec_res_value4 = wrapper::vcvt<T>(vec_res_value4_f);
1382
1383 const auto temp16x8t_1 = wrapper::vcombine(wrapper::vqmovn(vec_res_value1), wrapper::vqmovn(vec_res_value2));
1384 const auto temp16x8t_2 = wrapper::vcombine(wrapper::vqmovn(vec_res_value3), wrapper::vqmovn(vec_res_value4));
1385 auto res = wrapper::vcombine(wrapper::vqmovn(temp16x8t_1), wrapper::vqmovn(temp16x8t_2));
1386
1387 wrapper::vstore(reinterpret_cast<T *>(output.ptr() + x), res);
1388 break;
1389 }
1390 case ReductionOperation::PROD:
1391 {
1392 const auto offset32x4f_4 = wrapper::vdup_n(static_cast<float>(iq_info.offset), wrapper::traits::vector_128_tag{});
1393 const auto iscale32x4f_4 = vinvq_f32(vdupq_n_f32(iq_info.scale));
1394
1395 //re-quantize
1396 vec_res_value1_f = wrapper::vadd(wrapper::vmul(vec_res_value1_f, iscale32x4f_4), offset32x4f_4);
1397 vec_res_value2_f = wrapper::vadd(wrapper::vmul(vec_res_value2_f, iscale32x4f_4), offset32x4f_4);
1398 vec_res_value3_f = wrapper::vadd(wrapper::vmul(vec_res_value3_f, iscale32x4f_4), offset32x4f_4);
1399 vec_res_value4_f = wrapper::vadd(wrapper::vmul(vec_res_value4_f, iscale32x4f_4), offset32x4f_4);
1400
1401 vec_res_value1 = wrapper::vcvt<T>(vec_res_value1_f);
1402 vec_res_value2 = wrapper::vcvt<T>(vec_res_value2_f);
1403 vec_res_value3 = wrapper::vcvt<T>(vec_res_value3_f);
1404 vec_res_value4 = wrapper::vcvt<T>(vec_res_value4_f);
1405
1406 const auto temp16x8t_1 = wrapper::vcombine(wrapper::vqmovn(vec_res_value1), wrapper::vqmovn(vec_res_value2));
1407 const auto temp16x8t_2 = wrapper::vcombine(wrapper::vqmovn(vec_res_value3), wrapper::vqmovn(vec_res_value4));
1408 auto res = wrapper::vcombine(wrapper::vqmovn(temp16x8t_1), wrapper::vqmovn(temp16x8t_2));
1409
1410 wrapper::vstore(reinterpret_cast<T *>(output.ptr() + x), res);
1411 break;
1412 }
1413 default:
1414 ARM_COMPUTE_ERROR("Not supported");
1415 }
1416 }
1417
1418 // Compute left-over elements
1419 for(; x < window_end_x; ++x)
1420 {
Michalis Spyrou272e4252020-10-06 17:44:40 +01001421 float res_value = 0.f;
Sheri Zhang4d91dc62020-09-23 11:22:50 +01001422 switch(op)
1423 {
1424 case ReductionOperation::ARG_IDX_MAX:
1425 case ReductionOperation::ARG_IDX_MIN:
1426 case ReductionOperation::MIN:
1427 case ReductionOperation::MAX:
1428 {
1429 res_value = *(input_ptr + x);
1430 break;
1431 }
1432 case ReductionOperation::PROD:
1433 {
1434 res_value = static_cast<T>(1.0f);
1435 break;
1436 }
1437 default:
1438 {
1439 res_value = static_cast<T>(0.0f);
1440 break;
1441 }
1442 }
1443 uint32_t res_idx = 0;
1444
1445 for(unsigned int dim = 0; dim < in_info.dimension(axis); ++dim)
1446 {
1447 const T *in_ptr = reinterpret_cast<T *>(input.ptr() + x + in_info.strides_in_bytes()[axis] * dim);
1448 switch(op)
1449 {
1450 case ReductionOperation::SUM:
1451 case ReductionOperation::MEAN_SUM:
1452 {
1453 res_value += *in_ptr;
1454 break;
1455 }
1456 case ReductionOperation::SUM_SQUARE:
1457 {
1458 res_value += *in_ptr * *in_ptr;
1459 break;
1460 }
1461 case ReductionOperation::PROD:
1462 {
1463 //de-quantize input
1464 if(std::is_same<T, uint8_t>::value)
1465 {
Michalis Spyrou272e4252020-10-06 17:44:40 +01001466 res_value *= dequantize_qasymm8(*in_ptr, iq_info);
Sheri Zhang4d91dc62020-09-23 11:22:50 +01001467 }
1468 else
1469 {
Michalis Spyrou272e4252020-10-06 17:44:40 +01001470 res_value *= dequantize_qasymm8_signed(*in_ptr, iq_info);
Sheri Zhang4d91dc62020-09-23 11:22:50 +01001471 }
1472 break;
1473 }
1474 case ReductionOperation::ARG_IDX_MIN:
1475 {
1476 if(*in_ptr < res_value)
1477 {
1478 res_value = *in_ptr;
1479 res_idx = dim;
1480 }
1481 break;
1482 }
1483 case ReductionOperation::ARG_IDX_MAX:
1484 {
1485 if(*in_ptr > res_value)
1486 {
1487 res_value = *in_ptr;
1488 res_idx = dim;
1489 }
1490 break;
1491 }
1492 case ReductionOperation::MIN:
1493 {
1494 res_value = *in_ptr < res_value ? *in_ptr : res_value;
1495 break;
1496 }
1497 case ReductionOperation::MAX:
1498 {
1499 res_value = *in_ptr > res_value ? *in_ptr : res_value;
1500 break;
1501 }
1502 default:
1503 ARM_COMPUTE_ERROR("Not supported");
1504 }
1505 }
1506
1507 switch(op)
1508 {
1509 case ReductionOperation::MEAN_SUM:
1510 {
Michalis Spyrou272e4252020-10-06 17:44:40 +01001511 int32_t res = static_cast<int32_t>(res_value);
Sang-Hoon Parkcbede282020-10-12 21:44:23 +01001512 res /= static_cast<int32_t>(in_info.dimension(axis));
Michalis Spyrou272e4252020-10-06 17:44:40 +01001513 *reinterpret_cast<T *>(output.ptr() + x) = utils::cast::saturate_cast<T>(res);
Sheri Zhang4d91dc62020-09-23 11:22:50 +01001514 break;
1515 }
1516 case ReductionOperation::SUM:
1517 {
1518 // Subtract accumulated offsets
1519 res_value -= (in_info.dimension(axis) - 1) * iq_info.offset;
1520 *reinterpret_cast<T *>(output.ptr() + x) = utils::cast::saturate_cast<T>(res_value);
1521 break;
1522 }
1523 case ReductionOperation::PROD:
1524 {
1525 //re-quantize result
Michalis Spyrou272e4252020-10-06 17:44:40 +01001526 T res = 0;
Sheri Zhang4d91dc62020-09-23 11:22:50 +01001527 if(std::is_same<T, uint8_t>::value)
1528 {
Michalis Spyrou272e4252020-10-06 17:44:40 +01001529 res = quantize_qasymm8(res_value, iq_info);
Sheri Zhang4d91dc62020-09-23 11:22:50 +01001530 }
1531 else
1532 {
Michalis Spyrou272e4252020-10-06 17:44:40 +01001533 res = quantize_qasymm8_signed(res_value, iq_info);
Sheri Zhang4d91dc62020-09-23 11:22:50 +01001534 }
Michalis Spyrou272e4252020-10-06 17:44:40 +01001535 *(reinterpret_cast<T *>(output.ptr() + x)) = res;
Sheri Zhang4d91dc62020-09-23 11:22:50 +01001536 break;
Sheri Zhang4d91dc62020-09-23 11:22:50 +01001537 }
1538 case ReductionOperation::ARG_IDX_MIN:
1539 case ReductionOperation::ARG_IDX_MAX:
1540 {
1541 *(reinterpret_cast<uint32_t *>(output.ptr() + x * 4)) = res_idx;
1542 break;
1543 }
1544 default:
1545 *(reinterpret_cast<T *>(output.ptr() + x)) = res_value;
1546 }
1547 }
Michalis Spyroubcf8a962018-10-12 10:51:31 +01001548 },
1549 input, output);
Georgios Pinitasd9769582017-08-03 10:19:40 +01001550 }
1551};
1552
/** Dispatch a reduction to the kernel specialization matching the reduction axis and the input data type.
 *
 * @param[in]  window Execution window to iterate over.
 * @param[in]  input  Source tensor. 1-channel input: QASYMM8/QASYMM8_SIGNED/F16(*)/F32/S32.
 *                    2-channel input is treated as complex and only supports F32 (see below).
 *                    (*) F16 paths are compiled only when __ARM_FEATURE_FP16_VECTOR_ARITHMETIC is defined.
 * @param[out] output Destination tensor.
 * @param[in]  axis   Axis to reduce along: 0 (X), 1 (Y), 2 (Z) or 3 (W).
 * @param[in]  op     Reduction operation to perform.
 */
void reduce_op(const Window &window, const ITensor *input, ITensor *output, unsigned int axis, const ReductionOperation op)
{
    // A 2-channel tensor carries complex values (handled by RedOpYZW_complex below).
    const bool is_complex = (input->info()->num_channels() == 2);

    if(is_complex)
    {
        // Complex input: only SUM over the Z axis on F32 data is implemented;
        // every other combination is rejected at runtime.
        switch(axis)
        {
            case 2:
                switch(input->info()->data_type())
                {
                    case DataType::F32:
                        switch(op)
                        {
                            case ReductionOperation::SUM:
                                return Reducer<RedOpYZW_complex<float, 4, 2, ReductionOperation::SUM>>::reduceZ(window, input, output, RedOpYZW_complex<float, 4, 2, ReductionOperation::SUM>(), op);
                            default:
                                ARM_COMPUTE_ERROR("Not supported");
                        }
                    default:
                        ARM_COMPUTE_ERROR("Not supported");
                }
            default:
                ARM_COMPUTE_ERROR("Not supported");
        }
    }

    // Real (1-channel) input: pick the functor family by axis, then the
    // element type / vector width by data type. Quantized types use the
    // dedicated *_quantized functors which de/re-quantize around the math.
    switch(axis)
    {
        // Reduce along the X (innermost) axis.
        case 0:
            switch(input->info()->data_type())
            {
                case DataType::QASYMM8:
                    return Reducer<RedOpX_quantized<uint8_t>>::reduceX(window, input, output, RedOpX_quantized<uint8_t>(), op);
                case DataType::QASYMM8_SIGNED:
                    return Reducer<RedOpX_quantized<int8_t>>::reduceX(window, input, output, RedOpX_quantized<int8_t>(), op);
#ifdef __ARM_FEATURE_FP16_VECTOR_ARITHMETIC
                case DataType::F16:
                    return Reducer<RedOpX<float16_t, 8>>::reduceX(window, input, output, RedOpX<float16_t, 8>(), op);
#endif // __ARM_FEATURE_FP16_VECTOR_ARITHMETIC
                case DataType::F32:
                    return Reducer<RedOpX<float, 4>>::reduceX(window, input, output, RedOpX<float, 4>(), op);
                case DataType::S32:
                    return Reducer<RedOpX<int32_t, 4>>::reduceX(window, input, output, RedOpX<int32_t, 4>(), op);
                default:
                    ARM_COMPUTE_ERROR("Not supported");
            }
        // Reduce along the Y axis.
        case 1:
            switch(input->info()->data_type())
            {
                case DataType::QASYMM8:
                    return Reducer<RedOpYZW_quantized<uint8_t>>::reduceY(window, input, output, RedOpYZW_quantized<uint8_t>(), op);
                case DataType::QASYMM8_SIGNED:
                    return Reducer<RedOpYZW_quantized<int8_t>>::reduceY(window, input, output, RedOpYZW_quantized<int8_t>(), op);
#ifdef __ARM_FEATURE_FP16_VECTOR_ARITHMETIC
                case DataType::F16:
                    return Reducer<RedOpYZW<float16_t, 8>>::reduceY(window, input, output, RedOpYZW<float16_t, 8>(), op);
#endif // __ARM_FEATURE_FP16_VECTOR_ARITHMETIC
                case DataType::F32:
                    return Reducer<RedOpYZW<float, 4>>::reduceY(window, input, output, RedOpYZW<float, 4>(), op);
                case DataType::S32:
                    return Reducer<RedOpYZW<int32_t, 4>>::reduceY(window, input, output, RedOpYZW<int32_t, 4>(), op);
                default:
                    ARM_COMPUTE_ERROR("Not supported");
            }
        // Reduce along the Z axis.
        case 2:
            switch(input->info()->data_type())
            {
                case DataType::QASYMM8:
                    return Reducer<RedOpYZW_quantized<uint8_t>>::reduceZ(window, input, output, RedOpYZW_quantized<uint8_t>(), op);
                case DataType::QASYMM8_SIGNED:
                    return Reducer<RedOpYZW_quantized<int8_t>>::reduceZ(window, input, output, RedOpYZW_quantized<int8_t>(), op);
#ifdef __ARM_FEATURE_FP16_VECTOR_ARITHMETIC
                case DataType::F16:
                    return Reducer<RedOpYZW<float16_t, 8>>::reduceZ(window, input, output, RedOpYZW<float16_t, 8>(), op);
#endif // __ARM_FEATURE_FP16_VECTOR_ARITHMETIC
                case DataType::F32:
                    return Reducer<RedOpYZW<float, 4>>::reduceZ(window, input, output, RedOpYZW<float, 4>(), op);
                case DataType::S32:
                    return Reducer<RedOpYZW<int32_t, 4>>::reduceZ(window, input, output, RedOpYZW<int32_t, 4>(), op);
                default:
                    ARM_COMPUTE_ERROR("Not supported");
            }
        // Reduce along the W (outermost supported) axis.
        case 3:
            switch(input->info()->data_type())
            {
                case DataType::QASYMM8:
                    return Reducer<RedOpYZW_quantized<uint8_t>>::reduceW(window, input, output, RedOpYZW_quantized<uint8_t>(), op);
                case DataType::QASYMM8_SIGNED:
                    return Reducer<RedOpYZW_quantized<int8_t>>::reduceW(window, input, output, RedOpYZW_quantized<int8_t>(), op);
#ifdef __ARM_FEATURE_FP16_VECTOR_ARITHMETIC
                case DataType::F16:
                    return Reducer<RedOpYZW<float16_t, 8>>::reduceW(window, input, output, RedOpYZW<float16_t, 8>(), op);
#endif // __ARM_FEATURE_FP16_VECTOR_ARITHMETIC
                case DataType::F32:
                    return Reducer<RedOpYZW<float, 4>>::reduceW(window, input, output, RedOpYZW<float, 4>(), op);
                case DataType::S32:
                    return Reducer<RedOpYZW<int32_t, 4>>::reduceW(window, input, output, RedOpYZW<int32_t, 4>(), op);
                default:
                    ARM_COMPUTE_ERROR("Not supported");
            }
        default:
            ARM_COMPUTE_ERROR("Unsupported reduction axis");
    }
}
John Richardson73d4aef2018-05-08 14:34:33 +01001658
/** Validate input/output tensor infos and parameters for the reduction kernel.
 *
 * @param[in] input  Source tensor info.
 * @param[in] output Destination tensor info. May be empty (total_size() == 0), in which
 *                   case only the input/parameter checks are performed.
 * @param[in] axis   Axis along which to reduce (must be <= 3).
 * @param[in] op     Reduction operation to perform.
 *
 * @return A Status holding an error on failure, empty on success.
 */
Status validate_arguments(const ITensorInfo *input, const ITensorInfo *output, unsigned int axis, ReductionOperation op)
{
    ARM_COMPUTE_UNUSED(op);

    ARM_COMPUTE_RETURN_ERROR_ON_NULLPTR(input, output);
    ARM_COMPUTE_RETURN_ERROR_ON_CPU_F16_UNSUPPORTED(input);

    if(input->num_channels() == 1)
    {
        // Real input: all supported data types are allowed.
        ARM_COMPUTE_RETURN_ERROR_ON_DATA_TYPE_CHANNEL_NOT_IN(input, 1, DataType::QASYMM8_SIGNED, DataType::QASYMM8, DataType::S32, DataType::F16, DataType::F32);
    }
    else
    {
        // 2-channel (complex) input: only F32 SUM over axis 2 is supported
        // (mirrors the dispatch in reduce_op).
        ARM_COMPUTE_RETURN_ERROR_ON_DATA_TYPE_CHANNEL_NOT_IN(input, 2, DataType::F32);
        ARM_COMPUTE_RETURN_ERROR_ON(op != ReductionOperation::SUM);
        ARM_COMPUTE_RETURN_ERROR_ON(axis != 2);
    }

    ARM_COMPUTE_RETURN_ERROR_ON_MSG(axis >= TensorShape::num_max_dimensions, "Reduction axis greater than max number of dimensions");
    ARM_COMPUTE_RETURN_ERROR_ON_MSG(axis > 3, "Unsupported reduction axis");

    // Only check the output if it has already been initialized.
    if(output->total_size() != 0)
    {
        bool is_arg_min_max = (op == ReductionOperation::ARG_IDX_MAX || op == ReductionOperation::ARG_IDX_MIN);
        if(!is_arg_min_max)
        {
            // Value reductions keep the input's type/quantization/channel count.
            ARM_COMPUTE_RETURN_ERROR_ON_MISMATCHING_DATA_TYPES(input, output);
            ARM_COMPUTE_RETURN_ERROR_ON_MISMATCHING_QUANTIZATION_INFO(input, output);
            ARM_COMPUTE_RETURN_ERROR_ON(input->num_channels() != output->num_channels());
        }
        else
        {
            // Index reductions produce integer indices.
            ARM_COMPUTE_RETURN_ERROR_ON_DATA_TYPE_CHANNEL_NOT_IN(output, 1, DataType::U32, DataType::S32);
        }

        // The output shape must equal the input shape with the reduced axis collapsed.
        const TensorShape output_shape = arm_compute::misc::shape_calculator::compute_reduced_shape(input->tensor_shape(), axis);
        const TensorInfo tensor_info_reshaped = input->clone()->set_tensor_shape(output_shape);
        ARM_COMPUTE_RETURN_ERROR_ON_MISMATCHING_SHAPES(output, &tensor_info_reshaped);
    }

    return Status{};
}
Georgios Pinitasd9769582017-08-03 10:19:40 +01001701} // namespace
1702
/** Default constructor.
 *
 * Tensors start unbound and the axis zeroed; configure() must be called
 * before run(). The initial _op value (SUM_SQUARE) is a placeholder that
 * configure() overwrites.
 */
NEReductionOperationKernel::NEReductionOperationKernel()
    : _input(nullptr), _output(nullptr), _reduction_axis(0), _op(ReductionOperation::SUM_SQUARE)
{
}
1707
Georgios Pinitasd9769582017-08-03 10:19:40 +01001708void NEReductionOperationKernel::configure(const ITensor *input, ITensor *output, unsigned int axis, ReductionOperation op)
1709{
1710 ARM_COMPUTE_ERROR_ON_NULLPTR(input, output);
Georgios Pinitasd9769582017-08-03 10:19:40 +01001711
John Richardson73d4aef2018-05-08 14:34:33 +01001712 ARM_COMPUTE_ERROR_THROW_ON(validate_arguments(input->info(), output->info(), axis, op));
Georgios Pinitasd9769582017-08-03 10:19:40 +01001713
Michalis Spyroubcf8a962018-10-12 10:51:31 +01001714 _input = input;
1715 _output = output;
Michalis Spyroubcf8a962018-10-12 10:51:31 +01001716 _op = op;
1717 _reduction_axis = axis;
Georgios Pinitasd9769582017-08-03 10:19:40 +01001718
1719 // Configure kernel window
Georgios Pinitas412b7892020-11-11 21:05:24 +00001720 Window win = calculate_max_window(*input->info(), Steps());
Sheri Zhang4d91dc62020-09-23 11:22:50 +01001721 INEKernel::configure(win);
Georgios Pinitasd9769582017-08-03 10:19:40 +01001722
Sheri Zhang4d91dc62020-09-23 11:22:50 +01001723 // Calculate output shape and set if empty
1724 const TensorShape output_shape = arm_compute::misc::shape_calculator::compute_reduced_shape(input->info()->tensor_shape(), axis);
1725 // Output auto initialization if not yet initialized
1726 const bool is_arg_min_max = (op == ReductionOperation::ARG_IDX_MIN || op == ReductionOperation::ARG_IDX_MAX);
1727 DataType output_data_type = is_arg_min_max ? DataType::S32 : input->info()->data_type();
1728 auto_init_if_empty(*output->info(), input->info()->clone()->set_tensor_shape(output_shape).set_data_type(output_data_type).reset_padding().set_is_resizable(true));
John Richardson73d4aef2018-05-08 14:34:33 +01001729}
1730
1731Status NEReductionOperationKernel::validate(const ITensorInfo *input, const ITensorInfo *output, unsigned int axis, ReductionOperation op)
1732{
1733 ARM_COMPUTE_RETURN_ON_ERROR(validate_arguments(input, output, axis, op));
John Richardson73d4aef2018-05-08 14:34:33 +01001734
1735 return Status{};
Georgios Pinitasd9769582017-08-03 10:19:40 +01001736}
1737
/** Execute the reduction over the given window.
 *
 * @param[in] window Region on which to execute the kernel; must lie within
 *                   the window set at configure() time.
 * @param[in] info   Info about the executing thread (unused: the thread id is
 *                   not needed, the window alone defines the work).
 */
void NEReductionOperationKernel::run(const Window &window, const ThreadInfo &info)
{
    ARM_COMPUTE_UNUSED(info);
    // Fail fast if configure() was never called or the window is out of bounds.
    ARM_COMPUTE_ERROR_ON_UNCONFIGURED_KERNEL(this);
    ARM_COMPUTE_ERROR_ON_INVALID_SUBWINDOW(INEKernel::window(), window);

    // Dispatch to the axis/data-type-specialized implementation.
    reduce_op(window, _input, _output, _reduction_axis, _op);
}
Michalis Spyroubcf8a962018-10-12 10:51:31 +01001746} // namespace arm_compute