Add Queue support

Queues are responsible for scheduling operators and performing other
runtime-related activities, such as tuning.

Signed-off-by: Georgios Pinitas <georgios.pinitas@arm.com>
Change-Id: I0366d9048470d277b8cbf59fa42f95c0ae57c5c9
Reviewed-on: https://review.mlplatform.org/c/ml/ComputeLibrary/+/5487
Tested-by: Arm Jenkins <bsgcomp@arm.com>
Reviewed-by: Michele Di Giorgio <michele.digiorgio@arm.com>
Reviewed-by: Michalis Spyrou <michalis.spyrou@arm.com>
Comments-Addressed: Arm Jenkins <bsgcomp@arm.com>
diff --git a/Android.bp b/Android.bp
index f542b20..78ac7f1 100644
--- a/Android.bp
+++ b/Android.bp
@@ -52,6 +52,7 @@
     export_include_dirs: [".", "./include"],
     srcs: [
         "src/c/AclContext.cpp",
+        "src/c/AclQueue.cpp",
         "src/c/AclTensor.cpp",
         "src/c/AclTensorPack.cpp",
         "src/c/AclVersion.cpp",
@@ -300,7 +301,7 @@
         "src/core/cpu/kernels/CpuDepthwiseConvolutionNativeKernel.cpp",
         "src/core/cpu/kernels/CpuDequantizationKernel.cpp",
         "src/core/cpu/kernels/CpuDirectConvolutionKernel.cpp",
-        "src/core/cpu/kernels/CpuDirectConvolutionStageKernel.cpp",
+        "src/core/cpu/kernels/CpuDirectConvolutionOutputStageKernel.cpp",
         "src/core/cpu/kernels/CpuElementwiseKernel.cpp",
         "src/core/cpu/kernels/CpuElementwiseUnaryKernel.cpp",
         "src/core/cpu/kernels/CpuFillKernel.cpp",
@@ -315,16 +316,16 @@
         "src/core/cpu/kernels/CpuSoftmaxKernel.cpp",
         "src/core/cpu/kernels/CpuSubKernel.cpp",
         "src/core/cpu/kernels/CpuTransposeKernel.cpp",
-        "src/core/cpu/kernels/activation/NEON/fp16.cpp",
-        "src/core/cpu/kernels/activation/NEON/fp32.cpp",
-        "src/core/cpu/kernels/activation/NEON/qasymm8.cpp",
-        "src/core/cpu/kernels/activation/NEON/qasymm8_signed.cpp",
-        "src/core/cpu/kernels/activation/NEON/qsymm16.cpp",
-        "src/core/cpu/kernels/activation/SVE/fp16.cpp",
-        "src/core/cpu/kernels/activation/SVE/fp32.cpp",
-        "src/core/cpu/kernels/activation/SVE/qasymm8.cpp",
-        "src/core/cpu/kernels/activation/SVE/qasymm8_signed.cpp",
-        "src/core/cpu/kernels/activation/SVE/qsymm16.cpp",
+        "src/core/cpu/kernels/activation/neon/fp16.cpp",
+        "src/core/cpu/kernels/activation/neon/fp32.cpp",
+        "src/core/cpu/kernels/activation/neon/qasymm8.cpp",
+        "src/core/cpu/kernels/activation/neon/qasymm8_signed.cpp",
+        "src/core/cpu/kernels/activation/neon/qsymm16.cpp",
+        "src/core/cpu/kernels/activation/sve/fp16.cpp",
+        "src/core/cpu/kernels/activation/sve/fp32.cpp",
+        "src/core/cpu/kernels/activation/sve/qasymm8.cpp",
+        "src/core/cpu/kernels/activation/sve/qasymm8_signed.cpp",
+        "src/core/cpu/kernels/activation/sve/qsymm16.cpp",
         "src/core/cpu/kernels/add/neon/integer.cpp",
         "src/core/cpu/kernels/add/neon/qasymm8.cpp",
         "src/core/cpu/kernels/add/neon/qasymm8_signed.cpp",
@@ -390,8 +391,10 @@
         "src/core/utils/misc/MMappedFile.cpp",
         "src/core/utils/quantization/AsymmHelpers.cpp",
         "src/cpu/CpuContext.cpp",
+        "src/cpu/CpuQueue.cpp",
         "src/cpu/CpuTensor.cpp",
         "src/gpu/cl/ClContext.cpp",
+        "src/gpu/cl/ClQueue.cpp",
         "src/gpu/cl/ClTensor.cpp",
         "src/runtime/Allocator.cpp",
         "src/runtime/BlobLifetimeManager.cpp",