IVGCVSW-6440 Add profiling around CL workload configure calls
Signed-off-by: Kevin May <kevin.may@arm.com>
Change-Id: I7626d5bd82e832d5be6913719a34d76fbd1dbed8
diff --git a/src/backends/cl/workloads/ClQLstmWorkload.cpp b/src/backends/cl/workloads/ClQLstmWorkload.cpp
index d7c7af7..b2c1d6d 100644
--- a/src/backends/cl/workloads/ClQLstmWorkload.cpp
+++ b/src/backends/cl/workloads/ClQLstmWorkload.cpp
@@ -158,24 +158,27 @@
m_Data.m_Parameters.m_CellIntermediateScale,
m_Data.m_Parameters.m_OutputIntermediateScale);
- // QLSTM CL configure
- m_QLstmLayer.configure(clCompileContext,
- &input,
- m_InputToForgetWeightsTensor.get(),
- m_InputToCellWeightsTensor.get(),
- m_InputToOutputWeightsTensor.get(),
- m_RecurrentToForgetWeightsTensor.get(),
- m_RecurrentToCellWeightsTensor.get(),
- m_RecurrentToOutputWeightsTensor.get(),
- m_ForgetGateBiasTensor.get(),
- m_CellBiasTensor.get(),
- m_OutputGateBiasTensor.get(),
- &cellStateIn,
- &outputStateIn,
- &cellStateOut,
- &outputStateOut,
- &output,
- qLstmParams);
+ {
+ ARMNN_SCOPED_PROFILING_EVENT(Compute::Undefined, "ClQLstmWorkload_configure");
+ // QLSTM CL configure
+ m_QLstmLayer.configure(clCompileContext,
+ &input,
+ m_InputToForgetWeightsTensor.get(),
+ m_InputToCellWeightsTensor.get(),
+ m_InputToOutputWeightsTensor.get(),
+ m_RecurrentToForgetWeightsTensor.get(),
+ m_RecurrentToCellWeightsTensor.get(),
+ m_RecurrentToOutputWeightsTensor.get(),
+ m_ForgetGateBiasTensor.get(),
+ m_CellBiasTensor.get(),
+ m_OutputGateBiasTensor.get(),
+ &cellStateIn,
+ &outputStateIn,
+ &cellStateOut,
+ &outputStateOut,
+ &output,
+ qLstmParams);
+ }
// Initialise ACL tensor data for mandatory params
InitializeArmComputeClTensorData(*m_InputToForgetWeightsTensor, m_Data.m_InputToForgetWeights);