blob: 1f3f9b540a843b6cc6a42a95f1894ebc74d03b27 [file] [log] [blame]
telsoa014fcda012018-03-09 14:13:49 +00001//
2// Copyright © 2017 Arm Ltd. All rights reserved.
David Beckecb56cd2018-09-05 12:52:57 +01003// SPDX-License-Identifier: MIT
telsoa014fcda012018-03-09 14:13:49 +00004//
5
arovir019e53a352018-08-31 15:26:35 +01006#include "ClBatchNormalizationFloatWorkload.hpp"
David Beckac42efd2018-09-26 17:41:13 +01007#include <backends/cl/ClTensorHandle.hpp>
David Beck711fa312018-09-24 10:46:38 +01008#include <backends/CpuTensorHandle.hpp>
9#include <backends/aclCommon/ArmComputeTensorUtils.hpp>
David Beckac42efd2018-09-26 17:41:13 +010010#include <backends/cl/ClLayerSupport.hpp>
telsoa014fcda012018-03-09 14:13:49 +000011
Matthew Bentham14e46692018-09-20 15:35:30 +010012#include "ClWorkloadUtils.hpp"
13
telsoa014fcda012018-03-09 14:13:49 +000014namespace armnn
15{
16using namespace armcomputetensorutils;
17
telsoa01c577f2c2018-08-31 09:22:23 +010018arm_compute::Status ClBatchNormalizationValidate(const TensorInfo& input,
19 const TensorInfo& output,
20 const TensorInfo& mean,
21 const TensorInfo& var,
22 const TensorInfo& beta,
23 const TensorInfo& gamma,
24 const BatchNormalizationDescriptor &desc)
25{
Nikhil Rajd1340932018-10-18 14:27:50 +010026 const DataLayout dataLayout = desc.m_DataLayout.GetDataLayout();
27
28 const arm_compute::TensorInfo aclInputInfo =
29 armcomputetensorutils::BuildArmComputeTensorInfo(input, dataLayout);
30 const arm_compute::TensorInfo aclOutputInfo =
31 armcomputetensorutils::BuildArmComputeTensorInfo(output, dataLayout);
32 const arm_compute::TensorInfo aclMeanInfo =
33 armcomputetensorutils::BuildArmComputeTensorInfo(mean, dataLayout);
34 const arm_compute::TensorInfo aclVarInfo =
35 armcomputetensorutils::BuildArmComputeTensorInfo(var, dataLayout);
36 const arm_compute::TensorInfo aclBetaInfo =
37 armcomputetensorutils::BuildArmComputeTensorInfo(beta, dataLayout);
38 const arm_compute::TensorInfo aclGammaInfo =
39 armcomputetensorutils::BuildArmComputeTensorInfo(gamma, dataLayout);
telsoa01c577f2c2018-08-31 09:22:23 +010040
41 return arm_compute::CLBatchNormalizationLayer::validate(&aclInputInfo,
42 &aclOutputInfo,
43 &aclMeanInfo,
44 &aclVarInfo,
45 &aclBetaInfo,
46 &aclGammaInfo,
47 desc.m_Eps);
48}
49
arovir019e53a352018-08-31 15:26:35 +010050ClBatchNormalizationFloatWorkload::ClBatchNormalizationFloatWorkload(
telsoa014fcda012018-03-09 14:13:49 +000051 const BatchNormalizationQueueDescriptor& descriptor, const WorkloadInfo& info)
telsoa01c577f2c2018-08-31 09:22:23 +010052 : FloatWorkload<BatchNormalizationQueueDescriptor>(descriptor, info)
telsoa014fcda012018-03-09 14:13:49 +000053{
telsoa01c577f2c2018-08-31 09:22:23 +010054 m_Mean = std::make_unique<arm_compute::CLTensor>();
55 BuildArmComputeTensor(*m_Mean, m_Data.m_Mean->GetTensorInfo());
56
57 m_Variance = std::make_unique<arm_compute::CLTensor>();
58 BuildArmComputeTensor(*m_Variance, m_Data.m_Variance->GetTensorInfo());
59
60 m_Gamma = std::make_unique<arm_compute::CLTensor>();
61 BuildArmComputeTensor(*m_Gamma, m_Data.m_Gamma->GetTensorInfo());
62
63 m_Beta = std::make_unique<arm_compute::CLTensor>();
64 BuildArmComputeTensor(*m_Beta, m_Data.m_Beta->GetTensorInfo());
telsoa014fcda012018-03-09 14:13:49 +000065
arovir019e53a352018-08-31 15:26:35 +010066 m_Data.ValidateInputsOutputs("ClBatchNormalizationFloatWorkload", 1, 1);
telsoa014fcda012018-03-09 14:13:49 +000067
68 arm_compute::ICLTensor& input = static_cast<IClTensorHandle*>(m_Data.m_Inputs[0])->GetTensor();
69 arm_compute::ICLTensor& output = static_cast<IClTensorHandle*>(m_Data.m_Outputs[0])->GetTensor();
telsoa014fcda012018-03-09 14:13:49 +000070
Nikhil Rajd1340932018-10-18 14:27:50 +010071 arm_compute::DataLayout aclDataLayout = ConvertDataLayout(m_Data.m_Parameters.m_DataLayout.GetDataLayout());
72 input.info()->set_data_layout(aclDataLayout);
73 output.info()->set_data_layout(aclDataLayout);
74
telsoa01c577f2c2018-08-31 09:22:23 +010075 m_Layer.configure(&input,
76 &output,
77 m_Mean.get(),
78 m_Variance.get(),
79 m_Beta.get(),
80 m_Gamma.get(),
81 m_Data.m_Parameters.m_Eps);
82
Matthew Bentham785df502018-09-21 10:29:58 +010083 InitializeArmComputeClTensorData(*m_Mean, m_Data.m_Mean);
84 InitializeArmComputeClTensorData(*m_Variance, m_Data.m_Variance);
85 InitializeArmComputeClTensorData(*m_Beta, m_Data.m_Beta);
86 InitializeArmComputeClTensorData(*m_Gamma, m_Data.m_Gamma);
telsoa01c577f2c2018-08-31 09:22:23 +010087
88 // Force Compute Library to perform the necessary copying and reshaping, after which
89 // delete all the input tensors that will no longer be needed
90 m_Layer.prepare();
91 FreeUnusedTensors();
telsoa014fcda012018-03-09 14:13:49 +000092}
93
arovir019e53a352018-08-31 15:26:35 +010094void ClBatchNormalizationFloatWorkload::Execute() const
telsoa014fcda012018-03-09 14:13:49 +000095{
arovir019e53a352018-08-31 15:26:35 +010096 ARMNN_SCOPED_PROFILING_EVENT_CL("ClBatchNormalizationFloatWorkload_Execute");
Aron Virginas-Tara8e06ed2018-10-19 16:46:15 +010097 RunClFunction(m_Layer, CHECK_LOCATION());
telsoa014fcda012018-03-09 14:13:49 +000098}
99
arovir019e53a352018-08-31 15:26:35 +0100100void ClBatchNormalizationFloatWorkload::FreeUnusedTensors()
telsoa01c577f2c2018-08-31 09:22:23 +0100101{
102 FreeTensorIfUnused(m_Mean);
103 FreeTensorIfUnused(m_Variance);
104 FreeTensorIfUnused(m_Gamma);
105 FreeTensorIfUnused(m_Beta);
106}
107
Matthew Bentham14e46692018-09-20 15:35:30 +0100108} //namespace armnn