tests/validation/CL/Winograd.cpp - ml/ComputeLibrary - Gitiles

 /*
  * Copyright (c) 2018 ARM Limited.
  *
  * SPDX-License-Identifier: MIT
  *
  * Permission is hereby granted, free of charge, to any person obtaining a copy
  * of this software and associated documentation files (the "Software"), to
  * deal in the Software without restriction, including without limitation the
  * rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
  * sell copies of the Software, and to permit persons to whom the Software is
  * furnished to do so, subject to the following conditions:
  *
  * The above copyright notice and this permission notice shall be included in all
  * copies or substantial portions of the Software.
  *
  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
  * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
  * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
  * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
  * SOFTWARE.
  */
 #include "arm_compute/core/CL/kernels/CLWinogradFilterTransformKernel.h"
 #include "arm_compute/core/CL/kernels/CLWinogradOutputTransformKernel.h"
 #include "arm_compute/core/Types.h"
 #include "arm_compute/core/utils/misc/ShapeCalculator.h"
 #include "arm_compute/runtime/CL/CLTensor.h"
 #include "arm_compute/runtime/CL/CLTensorAllocator.h"
 #include "arm_compute/runtime/CL/functions/CLWinogradConvolutionLayer.h"
 #include "arm_compute/runtime/CL/functions/CLWinogradInputTransform.h"
 #include "tests/CL/CLAccessor.h"
 #include "tests/CL/Helper.h"
 #include "tests/PaddingCalculator.h"
 #include "tests/datasets/LargeConvolutionLayerDataset.h"
 #include "tests/datasets/ShapeDatasets.h"
 #include "tests/datasets/SmallConvolutionLayerDataset.h"
 #include "tests/datasets/WinogradFilterTransformDataset.h"
 #include "tests/datasets/WinogradInputTransformDataset.h"
 #include "tests/datasets/WinogradOutputTransformDataset.h"
 #include "tests/framework/Asserts.h"
 #include "tests/framework/Macros.h"
 #include "tests/framework/datasets/Datasets.h"
 #include "tests/validation/Validation.h"
 #include "tests/validation/fixtures/WinogradLayerFixture.h"

 namespace arm_compute
 {
 namespace test
 {
 namespace validation
 {
 namespace
 {
 constexpr AbsoluteTolerance<float> tolerance_f32(0.001f);
 } // namespace

 using namespace arm_compute::misc::shape_calculator;

 TEST_SUITE(CL)
 TEST_SUITE(Winograd)

 TEST_SUITE(InputTransform)

 // *INDENT-OFF*
 // clang-format off
 DATA_TEST_CASE(Validate, framework::DatasetMode::ALL, zip(zip(zip(zip(
                                                 framework::dataset::make("InputInfo",{
                                                                                         TensorInfo(TensorShape(53U, 21U, 5U, 3U), 1, DataType::F16),     // F16 not supported
                                                                                         TensorInfo(TensorShape(53U, 21U, 5U, 3U), 1, DataType::QASYMM8), // QASYMM8 not supported
                                                                                         TensorInfo(TensorShape(53U, 21U, 5U, 3U), 1, DataType::F32),     // Kernel size not supported
                                                                                         TensorInfo(TensorShape(53U, 21U, 5U, 3U), 1, DataType::F32),     // Strides not supported
                                                                                         TensorInfo(TensorShape(53U, 33U, 4U), 1, DataType::F32),         // Padding needed
                                                                                         TensorInfo(TensorShape(34U, 42U, 7U, 3U), 1, DataType::F32),     // Padding needed
                                                                                         TensorInfo(TensorShape(31U, 37U, 37U), 1, DataType::F32)         // Padding needed
                                                                                     }),
                                                 framework::dataset::make("OutputInfo", {
                                                                                         TensorInfo(TensorShape(5U, 5U, 16U, 3U), 1, DataType::F16),
                                                                                         TensorInfo(TensorShape(5U, 5U, 16U, 3U), 1, DataType::QASYMM8),
                                                                                         TensorInfo(TensorShape(5U, 5U, 16U, 3U), 1, DataType::F32),
                                                                                         TensorInfo(TensorShape(5U, 1U, 16U, 3U), 1, DataType::F32),
                                                                                         TensorInfo(TensorShape(4U, 442U, 16U), 1, DataType::F32),
                                                                                         TensorInfo(TensorShape(7U, 320U, 16U, 3U), 1, DataType::F32),
                                                                                         TensorInfo(TensorShape(37U, 304U, 16U), 1, DataType::F32)
                                                                                     })),
                                                 framework::dataset::make("PadStrideInfo", {
                                                                                         PadStrideInfo(1, 1, 1, 0),
                                                                                         PadStrideInfo(1, 1, 0, 0),
                                                                                         PadStrideInfo(1, 1, 1, 1),
                                                                                         PadStrideInfo(2, 1, 1, 1),
                                                                                         PadStrideInfo(1, 1, 0, 1),
                                                                                         PadStrideInfo(1, 1, 0, 0),
                                                                                         PadStrideInfo(1, 1, 1, 1)
                                                                                     })),
                                                 framework::dataset::make("KernelDims", {
                                                                                         Size2D(3U, 3U),
                                                                                         Size2D(3U, 3U),
                                                                                         Size2D(5U, 5U),
                                                                                         Size2D(3U, 3U),
                                                                                         Size2D(3U, 3U),
                                                                                         Size2D(3U, 3U),
                                                                                         Size2D(3U, 3U)
                                                                                     })),
                                                 framework::dataset::make("Expected", { false, false, false, false, false, false, false })),
                                             input_info, output_info, conv_info, kernel_dims, expected)
 {
     ARM_COMPUTE_EXPECT(bool(CLWinogradInputTransform::validate(&input_info.clone()->set_is_resizable(false), &output_info.clone()->set_is_resizable(false), conv_info, kernel_dims)) == expected, framework::LogLevel::ERRORS);
 }
 // clang-format on
 // *INDENT-ON*

 using CLWinogradInputTransformFixture = WinogradInputTransformValidationFixture<CLTensor, CLAccessor, CLWinogradInputTransform, float>;

 DATA_TEST_CASE(Configuration, framework::DatasetMode::ALL, combine(framework::dataset::concat(datasets::SmallWinogradInputTransformDataset(), datasets::LargeWinogradInputTransformDataset()),
                                                                    framework::dataset::make("DataType", { DataType::F32 })),
                shape_in, conv_info, kernel_dims, is_nchw_format, data_type)
 {
     ARM_COMPUTE_UNUSED(is_nchw_format);

     TensorShape shape_out = compute_winograd_input_transform_shape(TensorInfo(shape_in, 1, data_type), conv_info, kernel_dims);

     // Create tensors
     CLTensor in  = create_tensor<CLTensor>(shape_in, data_type);
     CLTensor out = create_tensor<CLTensor>(shape_out, data_type);

     ARM_COMPUTE_EXPECT(in.info()->is_resizable(), framework::LogLevel::ERRORS);
     ARM_COMPUTE_EXPECT(out.info()->is_resizable(), framework::LogLevel::ERRORS);

     // Create and configure function
     CLWinogradInputTransform winograd_input_transform;

     // Configure the function
     winograd_input_transform.configure(&in, &out, conv_info, kernel_dims);
 }

 FIXTURE_DATA_TEST_CASE(RunSmall, CLWinogradInputTransformFixture, framework::DatasetMode::PRECOMMIT, combine(datasets::SmallWinogradInputTransformDataset(), framework::dataset::make("DataType", { DataType::F32 })))
 {
     validate(CLAccessor(_target), _reference);
 }

 FIXTURE_DATA_TEST_CASE(RunLarge, CLWinogradInputTransformFixture, framework::DatasetMode::NIGHTLY, combine(datasets::LargeWinogradInputTransformDataset(), framework::dataset::make("DataType", { DataType::F32 })))
 {
     validate(CLAccessor(_target), _reference);
 }
 TEST_SUITE_END() // InputTransform

 TEST_SUITE(FilterTransform)
 // *INDENT-OFF*
 // clang-format off
 DATA_TEST_CASE(Validate, framework::DatasetMode::ALL, zip(zip(
                                                 framework::dataset::make("InputInfo",{
                                                                                         TensorInfo(TensorShape(3U, 3U, 5U, 3U), 1, DataType::F16),     // F16 not supported
                                                                                         TensorInfo(TensorShape(3U, 3U, 5U, 3U), 1, DataType::QASYMM8), // QASYMM8 not supported
                                                                                         TensorInfo(TensorShape(5U, 5U, 5U, 3U), 1, DataType::F32),     // Kernel size not supported
                                                                                         TensorInfo(TensorShape(3U, 3U), 1, DataType::F32),             // valid
                                                                                         TensorInfo(TensorShape(3U, 3U, 5U, 3U), 1, DataType::F32),     // valid
                                                                                         TensorInfo(TensorShape(3U, 3U, 37U, 2U), 1, DataType::F32),    // valid
                                                                                         TensorInfo(TensorShape(3U, 3U, 37U, 22U), 1, DataType::F32)    // valid
                                                                                     }),
                                                 framework::dataset::make("OutputInfo", {
                                                                                         TensorInfo(TensorShape(3U, 5U, 16U), 1, DataType::F16),
                                                                                         TensorInfo(TensorShape(3U, 5U, 16U), 1, DataType::QASYMM8),
                                                                                         TensorInfo(TensorShape(3U, 5U, 16U), 1, DataType::F32),
                                                                                         TensorInfo(TensorShape(1U, 1U, 16U), 1, DataType::F32),
                                                                                         TensorInfo(TensorShape(3U, 5U, 16U), 1, DataType::F32),
                                                                                         TensorInfo(TensorShape(2U, 37U, 16U), 1, DataType::F32),
                                                                                         TensorInfo(TensorShape(22U, 37U, 16U), 1, DataType::F32)
                                                                                     })),
                                                 framework::dataset::make("Expected", { false, false, false, true, true, true, true })),
                                             input_info, output_info, expected)
 {
     ARM_COMPUTE_EXPECT(bool(CLWinogradFilterTransformKernel::validate(&input_info.clone()->set_is_resizable(false), &output_info.clone()->set_is_resizable(false))) == expected, framework::LogLevel::ERRORS);
 }
 // clang-format on
 // *INDENT-ON*

 using CLWinogradFilterTransform        = CLSynthetizeFunctionWithZeroConstantBorder<CLWinogradFilterTransformKernel, 0>;
 using CLWinogradFilterTransformFixture = WinogradFilterTransformValidationFixture<CLTensor, CLAccessor, CLWinogradFilterTransform, float>;

 DATA_TEST_CASE(Configuration, framework::DatasetMode::ALL, combine(framework::dataset::concat(datasets::SmallWinogradFilterTransformDataset(), datasets::LargeWinogradFilterTransformDataset()),
                                                                    framework::dataset::make("DataType", { DataType::F32 })),
                shape_a, is_nchw_format, data_type)
 {
     ARM_COMPUTE_UNUSED(is_nchw_format);

     TensorShape shape_b = compute_winograd_filter_transform_shape(TensorInfo(shape_a, 1, data_type));

     // Create tensors
     CLTensor a = create_tensor<CLTensor>(shape_a, data_type);
     CLTensor b = create_tensor<CLTensor>(shape_b, data_type);

     ARM_COMPUTE_EXPECT(a.info()->is_resizable(), framework::LogLevel::ERRORS);
     ARM_COMPUTE_EXPECT(b.info()->is_resizable(), framework::LogLevel::ERRORS);

     // Create and configure function
     CLWinogradFilterTransform winograd_filter_transform;
     winograd_filter_transform.configure(&a, &b);
 }

 FIXTURE_DATA_TEST_CASE(RunSmall, CLWinogradFilterTransformFixture, framework::DatasetMode::ALL, combine(datasets::SmallWinogradFilterTransformDataset(), framework::dataset::make("DataType", { DataType::F32 })))
 {
     // Validate output
     validate(CLAccessor(_target), _reference, tolerance_f32);
 }

 FIXTURE_DATA_TEST_CASE(RunLarge, CLWinogradFilterTransformFixture, framework::DatasetMode::NIGHTLY, combine(datasets::LargeWinogradFilterTransformDataset(), framework::dataset::make("DataType", { DataType::F32 })))
 {
     // Validate output
     validate(CLAccessor(_target), _reference, tolerance_f32);
 }

 TEST_SUITE_END() // FilterTransform

 TEST_SUITE(OutputTransform)
 // *INDENT-OFF*
 // clang-format off
 DATA_TEST_CASE(Validate, framework::DatasetMode::ALL, zip(zip(zip(zip(zip(zip(
                                                 framework::dataset::make("InputInfo",{
                                                                                         TensorInfo(TensorShape(24U, 49U, 16U, 5U), 1, DataType::F16),        // F16 not supported
                                                                                         TensorInfo(TensorShape(128U, 3136U, 16U, 5U), 1, DataType::QASYMM8), // QASYMM8 not supported
                                                                                         TensorInfo(TensorShape(256U, 784U, 16U, 5U), 1, DataType::F32),      // Kernel size not supported
                                                                                         TensorInfo(TensorShape(512U, 169U, 16U, 5U), 1, DataType::F32),      // Valid
                                                                                         TensorInfo(TensorShape(13U, 6U, 16U, 4U), 1, DataType::F32),         // Padding needed
                                                                                         TensorInfo(TensorShape(7U, 16U, 16U, 7U), 1, DataType::F32),         // Valid
                                                                                         TensorInfo(TensorShape(1U, 442U, 16U, 37U), 1, DataType::F32)        // Wrong number of tiles
                                                                                     }),
                                                 framework::dataset::make("BiasInfo", {
                                                                                         TensorInfo(TensorShape(24U), 1, DataType::F16),
                                                                                         TensorInfo(TensorShape(128U), 1, DataType::QASYMM8),
                                                                                         TensorInfo(TensorShape(256U), 1, DataType::F32),
                                                                                         TensorInfo(TensorShape(512U), 1, DataType::F32),
                                                                                         TensorInfo(TensorShape(13U), 1, DataType::F32),
                                                                                         TensorInfo(TensorShape(7U), 1, DataType::F32),
                                                                                         TensorInfo(TensorShape(1U), 1, DataType::F32)
                                                                                     })),
                                                 framework::dataset::make("OutputInfo", {
                                                                                         TensorInfo(TensorShape(14U, 14U, 24U, 5U), 1, DataType::F16),
                                                                                         TensorInfo(TensorShape(112U, 112U, 128U, 5U), 1, DataType::QASYMM8),
                                                                                         TensorInfo(TensorShape(55U, 55U, 256U, 5U), 1, DataType::F32),
                                                                                         TensorInfo(TensorShape(26U, 26U, 512U, 5U), 1, DataType::F32),
                                                                                         TensorInfo(TensorShape(5U, 4U, 13U, 4U), 1, DataType::F32),
                                                                                         TensorInfo(TensorShape(8U, 8U, 7U, 7U), 1, DataType::F32),
                                                                                         TensorInfo(TensorShape(51U, 33U, 1U, 37U), 1, DataType::F32)
                                                                                     })),
                                                 framework::dataset::make("KernelDims", {
                                                                                         Size2D(3U, 3U),
                                                                                         Size2D(3U, 3U),
                                                                                         Size2D(5U, 5U),
                                                                                         Size2D(3U, 3U),
                                                                                         Size2D(3U, 3U),
                                                                                         Size2D(3U, 3U),
                                                                                         Size2D(3U, 3U)
                                                                                     })),
                                                 framework::dataset::make("OutputDims", {
                                                                                         Size2D(14U, 14U),
                                                                                         Size2D(112U, 112U),
                                                                                         Size2D(55U, 55U),
                                                                                         Size2D(26U, 26U),
                                                                                         Size2D(5U, 4U),
                                                                                         Size2D(8U, 8U),
                                                                                         Size2D(51U, 33U)
                                                                                     })),
                                                 framework::dataset::make("NumTiles", {
                                                                                         Size2D(7U, 7U),
                                                                                         Size2D(56U, 56U),
                                                                                         Size2D(28U, 28U),
                                                                                         Size2D(13U, 13U),
                                                                                         Size2D(3U, 2U),
                                                                                         Size2D(4U, 4U),
                                                                                         Size2D(26U, 16U)
                                                                                     })),
                                                 framework::dataset::make("Expected", { false, false, false, true, false, true, false })),
                                             input_info, bias_info, output_info, kernel_dims, output_dims, num_tiles, expected)
 {
     ARM_COMPUTE_EXPECT(bool(CLWinogradOutputTransformKernel::validate(&input_info.clone()->set_is_resizable(false), &bias_info.clone()->set_is_resizable(false), &output_info.clone()->set_is_resizable(false), kernel_dims, output_dims, num_tiles)) == expected, framework::LogLevel::ERRORS);
 }
 // clang-format on
 // *INDENT-ON*

 using CLWinogradOutputTransform        = CLSynthetizeFunctionWithZeroConstantBorder<CLWinogradOutputTransformKernel, 0>;
 using CLWinogradOutputTransformFixture = WinogradOutputTransformValidationFixture<CLTensor, CLAccessor, CLWinogradOutputTransform, float>;

 DATA_TEST_CASE(Configuration, framework::DatasetMode::ALL, combine(framework::dataset::concat(datasets::SmallWinogradOutputTransformDataset(), datasets::LargeWinogradOutputTransformDataset()),
                                                                    framework::dataset::make("DataType", { DataType::F32 })),
                shape_a, kernel_dims, output_convolved_dims, num_tiles, data_layout, data_type)
 {
     TensorShape shape_b = compute_winograd_output_transform_shape(TensorInfo(shape_a, 1, data_type), output_convolved_dims, data_layout);

     // Create tensors
     CLTensor a = create_tensor<CLTensor>(shape_a, data_type);
     CLTensor b = create_tensor<CLTensor>(shape_b, data_type);

     ARM_COMPUTE_EXPECT(a.info()->is_resizable(), framework::LogLevel::ERRORS);
     ARM_COMPUTE_EXPECT(b.info()->is_resizable(), framework::LogLevel::ERRORS);

     // Create and configure function
     CLWinogradOutputTransform winograd_output_transform;
     winograd_output_transform.configure(&a, nullptr, &b, kernel_dims, output_convolved_dims, num_tiles);
 }

 FIXTURE_DATA_TEST_CASE(RunSmall, CLWinogradOutputTransformFixture, framework::DatasetMode::ALL, combine(datasets::SmallWinogradOutputTransformDataset(), framework::dataset::make("DataType", { DataType::F32 })))
 {
     // Validate output
     validate(CLAccessor(_target), _reference, tolerance_f32);
 }

 FIXTURE_DATA_TEST_CASE(RunLarge, CLWinogradOutputTransformFixture, framework::DatasetMode::NIGHTLY, combine(datasets::LargeWinogradOutputTransformDataset(), framework::dataset::make("DataType", { DataType::F32 })))
 {
     // Validate output
     validate(CLAccessor(_target), _reference, tolerance_f32);
 }

 TEST_SUITE_END() // OutputTransform

 TEST_SUITE(ConvolutionLayer)
 // *INDENT-OFF*
 // clang-format off
 DATA_TEST_CASE(Validate, framework::DatasetMode::ALL, zip(zip(zip(zip(zip(
                                                 framework::dataset::make("InputInfo", {
                                                                                         TensorInfo(TensorShape(17U, 31U, 2U), 1, DataType::F16),     // FP16 not supported
                                                                                         TensorInfo(TensorShape(17U, 31U, 2U), 1, DataType::F32),     // Datatype mismatch
                                                                                         TensorInfo(TensorShape(23U, 27U, 5U, 4U), 1, DataType::F32), // Stride y not supported
                                                                                         TensorInfo(TensorShape(16U, 16U, 8U), 1, DataType::F32),     // Padding needed
                                                                                         TensorInfo(TensorShape(33U, 27U, 7U, 4U), 1, DataType::F32)  // Kernel size not supported
                                                                                       }),
                                                 framework::dataset::make("WeightsInfo", {
                                                                                         TensorInfo(TensorShape(3U, 3U, 2U, 19U), 1, DataType::F32),
                                                                                         TensorInfo(TensorShape(3U, 3U, 2U, 19U), 1, DataType::QASYMM8),
                                                                                         TensorInfo(TensorShape(3U, 3U, 5U, 21U), 1, DataType::F32),
                                                                                         TensorInfo(TensorShape(3U, 3U, 8U, 16U), 1, DataType::F32),
                                                                                         TensorInfo(TensorShape(5U, 5U, 7U, 16U), 1, DataType::F16)
                                                                                         })),
                                                 framework::dataset::make("BiasesInfo", {
                                                                                         TensorInfo(TensorShape(19U), 1, DataType::F32),
                                                                                         TensorInfo(TensorShape(19U), 1, DataType::F32),
                                                                                         TensorInfo(TensorShape(21U), 1, DataType::F32),
                                                                                         TensorInfo(TensorShape(16U), 1, DataType::F32),
                                                                                         TensorInfo(TensorShape(16U), 1, DataType::F32)
                                                                                        })),
                                                 framework::dataset::make("OutputInfo", {
                                                                                         TensorInfo(TensorShape(17U, 31U, 19U), 1, DataType::F32),
                                                                                         TensorInfo(TensorShape(15U, 15U, 19U), 1, DataType::F32),
                                                                                         TensorInfo(TensorShape(21U, 25U, 21U, 4U), 1, DataType::F32),
                                                                                         TensorInfo(TensorShape(16U, 16U, 16U), 1, DataType::F32),
                                                                                         TensorInfo(TensorShape(11U, 12U, 16U, 4U), 1, DataType::F32)
                                                                                        })),
                                                 framework::dataset::make("ConvInfo", {
                                                                                         PadStrideInfo(1, 1, 1, 1),
                                                                                         PadStrideInfo(1, 1, 1, 1),
                                                                                         PadStrideInfo(1, 2, 0, 0),
                                                                                         PadStrideInfo(1, 1, 1, 1),
                                                                                         PadStrideInfo(1, 1, 1, 0)
                                                                                                                  })),
                                                 framework::dataset::make("Expected", { false, false, false, false, false })),
                input_info, weights_info, bias_info, output_info, conv_info, expected)
 {
     ARM_COMPUTE_EXPECT(bool(CLWinogradConvolutionLayer::validate(&input_info.clone()->set_is_resizable(false), &weights_info.clone()->set_is_resizable(false), &bias_info.clone()->set_is_resizable(false), &output_info.clone()->set_is_resizable(false), conv_info)) == expected, framework::LogLevel::ERRORS);
 }
 // clang-format on
 // *INDENT-ON*

 using CLWinogradConvolutionLayerFixture = WinogradConvolutionLayerValidationFixture<CLTensor, CLAccessor, CLWinogradConvolutionLayer, float>;
 FIXTURE_DATA_TEST_CASE(RunSmall, CLWinogradConvolutionLayerFixture, framework::DatasetMode::PRECOMMIT, combine(datasets::SmallWinogradConvolutionLayer3x3Dataset(),
                                                                                                                framework::dataset::make("DataType", { DataType::F32 })))
 {
     // Validate output
     validate(CLAccessor(_target), _reference, tolerance_f32);
 }

 FIXTURE_DATA_TEST_CASE(RunLarge, CLWinogradConvolutionLayerFixture, framework::DatasetMode::NIGHTLY, combine(datasets::LargeWinogradConvolutionLayer3x3Dataset(), framework::dataset::make("DataType", { DataType::F32 })))
 {
     // Validate output
     validate(CLAccessor(_target), _reference, tolerance_f32);
 }
 TEST_SUITE_END() // ConvolutionLayer

 TEST_SUITE_END() // Winograd
 TEST_SUITE_END() // CL
 } // namespace validation
 } // namespace test
 } // namespace arm_compute
	/*
	* Copyright (c) 2018 ARM Limited.
	*
	* SPDX-License-Identifier: MIT
	*
	* Permission is hereby granted, free of charge, to any person obtaining a copy
	* of this software and associated documentation files (the "Software"), to
	* deal in the Software without restriction, including without limitation the
	* rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
	* sell copies of the Software, and to permit persons to whom the Software is
	* furnished to do so, subject to the following conditions:
	*
	* The above copyright notice and this permission notice shall be included in all
	* copies or substantial portions of the Software.
	*
	* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
	* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
	* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
	* AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
	* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
	* OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
	* SOFTWARE.
	*/
	#include "arm_compute/core/CL/kernels/CLWinogradFilterTransformKernel.h"
	#include "arm_compute/core/CL/kernels/CLWinogradOutputTransformKernel.h"
	#include "arm_compute/core/Types.h"
	#include "arm_compute/core/utils/misc/ShapeCalculator.h"
	#include "arm_compute/runtime/CL/CLTensor.h"
	#include "arm_compute/runtime/CL/CLTensorAllocator.h"
	#include "arm_compute/runtime/CL/functions/CLWinogradConvolutionLayer.h"
	#include "arm_compute/runtime/CL/functions/CLWinogradInputTransform.h"
	#include "tests/CL/CLAccessor.h"
	#include "tests/CL/Helper.h"
	#include "tests/PaddingCalculator.h"
	#include "tests/datasets/LargeConvolutionLayerDataset.h"
	#include "tests/datasets/ShapeDatasets.h"
	#include "tests/datasets/SmallConvolutionLayerDataset.h"
	#include "tests/datasets/WinogradFilterTransformDataset.h"
	#include "tests/datasets/WinogradInputTransformDataset.h"
	#include "tests/datasets/WinogradOutputTransformDataset.h"
	#include "tests/framework/Asserts.h"
	#include "tests/framework/Macros.h"
	#include "tests/framework/datasets/Datasets.h"
	#include "tests/validation/Validation.h"
	#include "tests/validation/fixtures/WinogradLayerFixture.h"

	namespace arm_compute
	{
	namespace test
	{
	namespace validation
	{
	namespace
	{
	constexpr AbsoluteTolerance<float> tolerance_f32(0.001f);
	} // namespace

	using namespace arm_compute::misc::shape_calculator;

	TEST_SUITE(CL)
	TEST_SUITE(Winograd)

	TEST_SUITE(InputTransform)

	// INDENT-OFF
	// clang-format off
	DATA_TEST_CASE(Validate, framework::DatasetMode::ALL, zip(zip(zip(zip(
	framework::dataset::make("InputInfo",{
	TensorInfo(TensorShape(53U, 21U, 5U, 3U), 1, DataType::F16), // F16 not supported
	TensorInfo(TensorShape(53U, 21U, 5U, 3U), 1, DataType::QASYMM8), // QASYMM8 not supported
	TensorInfo(TensorShape(53U, 21U, 5U, 3U), 1, DataType::F32), // Kernel size not supported
	TensorInfo(TensorShape(53U, 21U, 5U, 3U), 1, DataType::F32), // Strides not supported
	TensorInfo(TensorShape(53U, 33U, 4U), 1, DataType::F32), // Padding needed
	TensorInfo(TensorShape(34U, 42U, 7U, 3U), 1, DataType::F32), // Padding needed
	TensorInfo(TensorShape(31U, 37U, 37U), 1, DataType::F32) // Padding needed
	}),
	framework::dataset::make("OutputInfo", {
	TensorInfo(TensorShape(5U, 5U, 16U, 3U), 1, DataType::F16),
	TensorInfo(TensorShape(5U, 5U, 16U, 3U), 1, DataType::QASYMM8),
	TensorInfo(TensorShape(5U, 5U, 16U, 3U), 1, DataType::F32),
	TensorInfo(TensorShape(5U, 1U, 16U, 3U), 1, DataType::F32),
	TensorInfo(TensorShape(4U, 442U, 16U), 1, DataType::F32),
	TensorInfo(TensorShape(7U, 320U, 16U, 3U), 1, DataType::F32),
	TensorInfo(TensorShape(37U, 304U, 16U), 1, DataType::F32)
	})),
	framework::dataset::make("PadStrideInfo", {
	PadStrideInfo(1, 1, 1, 0),
	PadStrideInfo(1, 1, 0, 0),
	PadStrideInfo(1, 1, 1, 1),
	PadStrideInfo(2, 1, 1, 1),
	PadStrideInfo(1, 1, 0, 1),
	PadStrideInfo(1, 1, 0, 0),
	PadStrideInfo(1, 1, 1, 1)
	})),
	framework::dataset::make("KernelDims", {
	Size2D(3U, 3U),
	Size2D(3U, 3U),
	Size2D(5U, 5U),
	Size2D(3U, 3U),
	Size2D(3U, 3U),
	Size2D(3U, 3U),
	Size2D(3U, 3U)
	})),
	framework::dataset::make("Expected", { false, false, false, false, false, false, false })),
	input_info, output_info, conv_info, kernel_dims, expected)
	{
	ARM_COMPUTE_EXPECT(bool(CLWinogradInputTransform::validate(&input_info.clone()->set_is_resizable(false), &output_info.clone()->set_is_resizable(false), conv_info, kernel_dims)) == expected, framework::LogLevel::ERRORS);
	}
	// clang-format on
	// INDENT-ON

	using CLWinogradInputTransformFixture = WinogradInputTransformValidationFixture<CLTensor, CLAccessor, CLWinogradInputTransform, float>;

	DATA_TEST_CASE(Configuration, framework::DatasetMode::ALL, combine(framework::dataset::concat(datasets::SmallWinogradInputTransformDataset(), datasets::LargeWinogradInputTransformDataset()),
	framework::dataset::make("DataType", { DataType::F32 })),
	shape_in, conv_info, kernel_dims, is_nchw_format, data_type)
	{
	ARM_COMPUTE_UNUSED(is_nchw_format);

	TensorShape shape_out = compute_winograd_input_transform_shape(TensorInfo(shape_in, 1, data_type), conv_info, kernel_dims);

	// Create tensors
	CLTensor in = create_tensor<CLTensor>(shape_in, data_type);
	CLTensor out = create_tensor<CLTensor>(shape_out, data_type);

	ARM_COMPUTE_EXPECT(in.info()->is_resizable(), framework::LogLevel::ERRORS);
	ARM_COMPUTE_EXPECT(out.info()->is_resizable(), framework::LogLevel::ERRORS);

	// Create and configure function
	CLWinogradInputTransform winograd_input_transform;

	// Configure the function
	winograd_input_transform.configure(&in, &out, conv_info, kernel_dims);
	}

	FIXTURE_DATA_TEST_CASE(RunSmall, CLWinogradInputTransformFixture, framework::DatasetMode::PRECOMMIT, combine(datasets::SmallWinogradInputTransformDataset(), framework::dataset::make("DataType", { DataType::F32 })))
	{
	validate(CLAccessor(_target), _reference);
	}

	FIXTURE_DATA_TEST_CASE(RunLarge, CLWinogradInputTransformFixture, framework::DatasetMode::NIGHTLY, combine(datasets::LargeWinogradInputTransformDataset(), framework::dataset::make("DataType", { DataType::F32 })))
	{
	validate(CLAccessor(_target), _reference);
	}
	TEST_SUITE_END() // InputTransform

	TEST_SUITE(FilterTransform)
	// INDENT-OFF
	// clang-format off
	DATA_TEST_CASE(Validate, framework::DatasetMode::ALL, zip(zip(
	framework::dataset::make("InputInfo",{
	TensorInfo(TensorShape(3U, 3U, 5U, 3U), 1, DataType::F16), // F16 not supported
	TensorInfo(TensorShape(3U, 3U, 5U, 3U), 1, DataType::QASYMM8), // QASYMM8 not supported
	TensorInfo(TensorShape(5U, 5U, 5U, 3U), 1, DataType::F32), // Kernel size not supported
	TensorInfo(TensorShape(3U, 3U), 1, DataType::F32), // valid
	TensorInfo(TensorShape(3U, 3U, 5U, 3U), 1, DataType::F32), // valid
	TensorInfo(TensorShape(3U, 3U, 37U, 2U), 1, DataType::F32), // valid
	TensorInfo(TensorShape(3U, 3U, 37U, 22U), 1, DataType::F32) // valid
	}),
	framework::dataset::make("OutputInfo", {
	TensorInfo(TensorShape(3U, 5U, 16U), 1, DataType::F16),
	TensorInfo(TensorShape(3U, 5U, 16U), 1, DataType::QASYMM8),
	TensorInfo(TensorShape(3U, 5U, 16U), 1, DataType::F32),
	TensorInfo(TensorShape(1U, 1U, 16U), 1, DataType::F32),
	TensorInfo(TensorShape(3U, 5U, 16U), 1, DataType::F32),
	TensorInfo(TensorShape(2U, 37U, 16U), 1, DataType::F32),
	TensorInfo(TensorShape(22U, 37U, 16U), 1, DataType::F32)
	})),
	framework::dataset::make("Expected", { false, false, false, true, true, true, true })),
	input_info, output_info, expected)
	{
	ARM_COMPUTE_EXPECT(bool(CLWinogradFilterTransformKernel::validate(&input_info.clone()->set_is_resizable(false), &output_info.clone()->set_is_resizable(false))) == expected, framework::LogLevel::ERRORS);
	}
	// clang-format on
	// INDENT-ON

	using CLWinogradFilterTransform = CLSynthetizeFunctionWithZeroConstantBorder<CLWinogradFilterTransformKernel, 0>;
	using CLWinogradFilterTransformFixture = WinogradFilterTransformValidationFixture<CLTensor, CLAccessor, CLWinogradFilterTransform, float>;

	DATA_TEST_CASE(Configuration, framework::DatasetMode::ALL, combine(framework::dataset::concat(datasets::SmallWinogradFilterTransformDataset(), datasets::LargeWinogradFilterTransformDataset()),
	framework::dataset::make("DataType", { DataType::F32 })),
	shape_a, is_nchw_format, data_type)
	{
	ARM_COMPUTE_UNUSED(is_nchw_format);

	TensorShape shape_b = compute_winograd_filter_transform_shape(TensorInfo(shape_a, 1, data_type));

	// Create tensors
	CLTensor a = create_tensor<CLTensor>(shape_a, data_type);
	CLTensor b = create_tensor<CLTensor>(shape_b, data_type);

	ARM_COMPUTE_EXPECT(a.info()->is_resizable(), framework::LogLevel::ERRORS);
	ARM_COMPUTE_EXPECT(b.info()->is_resizable(), framework::LogLevel::ERRORS);

	// Create and configure function
	CLWinogradFilterTransform winograd_filter_transform;
	winograd_filter_transform.configure(&a, &b);
	}

	FIXTURE_DATA_TEST_CASE(RunSmall, CLWinogradFilterTransformFixture, framework::DatasetMode::ALL, combine(datasets::SmallWinogradFilterTransformDataset(), framework::dataset::make("DataType", { DataType::F32 })))
	{
	// Validate output
	validate(CLAccessor(_target), _reference, tolerance_f32);
	}

	FIXTURE_DATA_TEST_CASE(RunLarge, CLWinogradFilterTransformFixture, framework::DatasetMode::NIGHTLY, combine(datasets::LargeWinogradFilterTransformDataset(), framework::dataset::make("DataType", { DataType::F32 })))
	{
	// Validate output
	validate(CLAccessor(_target), _reference, tolerance_f32);
	}

	TEST_SUITE_END() // FilterTransform

	TEST_SUITE(OutputTransform)
	// INDENT-OFF
	// clang-format off
	DATA_TEST_CASE(Validate, framework::DatasetMode::ALL, zip(zip(zip(zip(zip(zip(
	framework::dataset::make("InputInfo",{
	TensorInfo(TensorShape(24U, 49U, 16U, 5U), 1, DataType::F16), // F16 not supported
	TensorInfo(TensorShape(128U, 3136U, 16U, 5U), 1, DataType::QASYMM8), // QASYMM8 not supported
	TensorInfo(TensorShape(256U, 784U, 16U, 5U), 1, DataType::F32), // Kernel size not supported
	TensorInfo(TensorShape(512U, 169U, 16U, 5U), 1, DataType::F32), // Valid
	TensorInfo(TensorShape(13U, 6U, 16U, 4U), 1, DataType::F32), // Padding needed
	TensorInfo(TensorShape(7U, 16U, 16U, 7U), 1, DataType::F32), // Valid
	TensorInfo(TensorShape(1U, 442U, 16U, 37U), 1, DataType::F32) // Wrong number of tiles
	}),
	framework::dataset::make("BiasInfo", {
	TensorInfo(TensorShape(24U), 1, DataType::F16),
	TensorInfo(TensorShape(128U), 1, DataType::QASYMM8),
	TensorInfo(TensorShape(256U), 1, DataType::F32),
	TensorInfo(TensorShape(512U), 1, DataType::F32),
	TensorInfo(TensorShape(13U), 1, DataType::F32),
	TensorInfo(TensorShape(7U), 1, DataType::F32),
	TensorInfo(TensorShape(1U), 1, DataType::F32)
	})),
	framework::dataset::make("OutputInfo", {
	TensorInfo(TensorShape(14U, 14U, 24U, 5U), 1, DataType::F16),
	TensorInfo(TensorShape(112U, 112U, 128U, 5U), 1, DataType::QASYMM8),
	TensorInfo(TensorShape(55U, 55U, 256U, 5U), 1, DataType::F32),
	TensorInfo(TensorShape(26U, 26U, 512U, 5U), 1, DataType::F32),
	TensorInfo(TensorShape(5U, 4U, 13U, 4U), 1, DataType::F32),
	TensorInfo(TensorShape(8U, 8U, 7U, 7U), 1, DataType::F32),
	TensorInfo(TensorShape(51U, 33U, 1U, 37U), 1, DataType::F32)
	})),
	framework::dataset::make("KernelDims", {
	Size2D(3U, 3U),
	Size2D(3U, 3U),
	Size2D(5U, 5U),
	Size2D(3U, 3U),
	Size2D(3U, 3U),
	Size2D(3U, 3U),
	Size2D(3U, 3U)
	})),
	framework::dataset::make("OutputDims", {
	Size2D(14U, 14U),
	Size2D(112U, 112U),
	Size2D(55U, 55U),
	Size2D(26U, 26U),
	Size2D(5U, 4U),
	Size2D(8U, 8U),
	Size2D(51U, 33U)
	})),
	framework::dataset::make("NumTiles", {
	Size2D(7U, 7U),
	Size2D(56U, 56U),
	Size2D(28U, 28U),
	Size2D(13U, 13U),
	Size2D(3U, 2U),
	Size2D(4U, 4U),
	Size2D(26U, 16U)
	})),
	framework::dataset::make("Expected", { false, false, false, true, false, true, false })),
	input_info, bias_info, output_info, kernel_dims, output_dims, num_tiles, expected)
	{
	ARM_COMPUTE_EXPECT(bool(CLWinogradOutputTransformKernel::validate(&input_info.clone()->set_is_resizable(false), &bias_info.clone()->set_is_resizable(false), &output_info.clone()->set_is_resizable(false), kernel_dims, output_dims, num_tiles)) == expected, framework::LogLevel::ERRORS);
	}
	// clang-format on
	// INDENT-ON

	using CLWinogradOutputTransform = CLSynthetizeFunctionWithZeroConstantBorder<CLWinogradOutputTransformKernel, 0>;
	using CLWinogradOutputTransformFixture = WinogradOutputTransformValidationFixture<CLTensor, CLAccessor, CLWinogradOutputTransform, float>;

	DATA_TEST_CASE(Configuration, framework::DatasetMode::ALL, combine(framework::dataset::concat(datasets::SmallWinogradOutputTransformDataset(), datasets::LargeWinogradOutputTransformDataset()),
	framework::dataset::make("DataType", { DataType::F32 })),
	shape_a, kernel_dims, output_convolved_dims, num_tiles, data_layout, data_type)
	{
	TensorShape shape_b = compute_winograd_output_transform_shape(TensorInfo(shape_a, 1, data_type), output_convolved_dims, data_layout);

	// Create tensors
	CLTensor a = create_tensor<CLTensor>(shape_a, data_type);
	CLTensor b = create_tensor<CLTensor>(shape_b, data_type);

	ARM_COMPUTE_EXPECT(a.info()->is_resizable(), framework::LogLevel::ERRORS);
	ARM_COMPUTE_EXPECT(b.info()->is_resizable(), framework::LogLevel::ERRORS);

	// Create and configure function
	CLWinogradOutputTransform winograd_output_transform;
	winograd_output_transform.configure(&a, nullptr, &b, kernel_dims, output_convolved_dims, num_tiles);
	}

	FIXTURE_DATA_TEST_CASE(RunSmall, CLWinogradOutputTransformFixture, framework::DatasetMode::ALL, combine(datasets::SmallWinogradOutputTransformDataset(), framework::dataset::make("DataType", { DataType::F32 })))
	{
	// Validate output
	validate(CLAccessor(_target), _reference, tolerance_f32);
	}

	FIXTURE_DATA_TEST_CASE(RunLarge, CLWinogradOutputTransformFixture, framework::DatasetMode::NIGHTLY, combine(datasets::LargeWinogradOutputTransformDataset(), framework::dataset::make("DataType", { DataType::F32 })))
	{
	// Validate output
	validate(CLAccessor(_target), _reference, tolerance_f32);
	}

	TEST_SUITE_END() // OutputTransform

	TEST_SUITE(ConvolutionLayer)
	// INDENT-OFF
	// clang-format off
	DATA_TEST_CASE(Validate, framework::DatasetMode::ALL, zip(zip(zip(zip(zip(
	framework::dataset::make("InputInfo", {
	TensorInfo(TensorShape(17U, 31U, 2U), 1, DataType::F16), // FP16 not supported
	TensorInfo(TensorShape(17U, 31U, 2U), 1, DataType::F32), // Datatype mismatch
	TensorInfo(TensorShape(23U, 27U, 5U, 4U), 1, DataType::F32), // Stride y not supported
	TensorInfo(TensorShape(16U, 16U, 8U), 1, DataType::F32), // Padding needed
	TensorInfo(TensorShape(33U, 27U, 7U, 4U), 1, DataType::F32) // Kernel size not supported
	}),
	framework::dataset::make("WeightsInfo", {
	TensorInfo(TensorShape(3U, 3U, 2U, 19U), 1, DataType::F32),
	TensorInfo(TensorShape(3U, 3U, 2U, 19U), 1, DataType::QASYMM8),
	TensorInfo(TensorShape(3U, 3U, 5U, 21U), 1, DataType::F32),
	TensorInfo(TensorShape(3U, 3U, 8U, 16U), 1, DataType::F32),
	TensorInfo(TensorShape(5U, 5U, 7U, 16U), 1, DataType::F16)
	})),
	framework::dataset::make("BiasesInfo", {
	TensorInfo(TensorShape(19U), 1, DataType::F32),
	TensorInfo(TensorShape(19U), 1, DataType::F32),
	TensorInfo(TensorShape(21U), 1, DataType::F32),
	TensorInfo(TensorShape(16U), 1, DataType::F32),
	TensorInfo(TensorShape(16U), 1, DataType::F32)
	})),
	framework::dataset::make("OutputInfo", {
	TensorInfo(TensorShape(17U, 31U, 19U), 1, DataType::F32),
	TensorInfo(TensorShape(15U, 15U, 19U), 1, DataType::F32),
	TensorInfo(TensorShape(21U, 25U, 21U, 4U), 1, DataType::F32),
	TensorInfo(TensorShape(16U, 16U, 16U), 1, DataType::F32),
	TensorInfo(TensorShape(11U, 12U, 16U, 4U), 1, DataType::F32)
	})),
	framework::dataset::make("ConvInfo", {
	PadStrideInfo(1, 1, 1, 1),
	PadStrideInfo(1, 1, 1, 1),
	PadStrideInfo(1, 2, 0, 0),
	PadStrideInfo(1, 1, 1, 1),
	PadStrideInfo(1, 1, 1, 0)
	})),
	framework::dataset::make("Expected", { false, false, false, false, false })),
	input_info, weights_info, bias_info, output_info, conv_info, expected)
	{
	ARM_COMPUTE_EXPECT(bool(CLWinogradConvolutionLayer::validate(&input_info.clone()->set_is_resizable(false), &weights_info.clone()->set_is_resizable(false), &bias_info.clone()->set_is_resizable(false), &output_info.clone()->set_is_resizable(false), conv_info)) == expected, framework::LogLevel::ERRORS);
	}
	// clang-format on
	// INDENT-ON

	using CLWinogradConvolutionLayerFixture = WinogradConvolutionLayerValidationFixture<CLTensor, CLAccessor, CLWinogradConvolutionLayer, float>;
	FIXTURE_DATA_TEST_CASE(RunSmall, CLWinogradConvolutionLayerFixture, framework::DatasetMode::PRECOMMIT, combine(datasets::SmallWinogradConvolutionLayer3x3Dataset(),
	framework::dataset::make("DataType", { DataType::F32 })))
	{
	// Validate output
	validate(CLAccessor(_target), _reference, tolerance_f32);
	}

	FIXTURE_DATA_TEST_CASE(RunLarge, CLWinogradConvolutionLayerFixture, framework::DatasetMode::NIGHTLY, combine(datasets::LargeWinogradConvolutionLayer3x3Dataset(), framework::dataset::make("DataType", { DataType::F32 })))
	{
	// Validate output
	validate(CLAccessor(_target), _reference, tolerance_f32);
	}
	TEST_SUITE_END() // ConvolutionLayer

	TEST_SUITE_END() // Winograd
	TEST_SUITE_END() // CL
	} // namespace validation
	} // namespace test
	} // namespace arm_compute