Implement MatMul Function

Resolves: COMPMID-5949
Signed-off-by: Ramy Elgammal <ramy.elgammal@arm.com>
Change-Id: Idd8cfe6ea94a14f0b23178f6781251b5f0955563
Reviewed-on: https://review.mlplatform.org/c/ml/ComputeLibrary/+/9390
Comments-Addressed: Arm Jenkins <bsgcomp@arm.com>
Tested-by: Arm Jenkins <bsgcomp@arm.com>
Reviewed-by: Gunes Bayir <gunes.bayir@arm.com>
Benchmark: Arm Jenkins <bsgcomp@arm.com>
diff --git a/Android.bp b/Android.bp
index 5617812..f315def 100644
--- a/Android.bp
+++ b/Android.bp
@@ -741,6 +741,7 @@
         "src/gpu/cl/operators/ClGemmLowpOutputStage.cpp",
         "src/gpu/cl/operators/ClIndirectConv2d.cpp",
         "src/gpu/cl/operators/ClLogicalNot.cpp",
+        "src/gpu/cl/operators/ClMatMul.cpp",
         "src/gpu/cl/operators/ClMul.cpp",
         "src/gpu/cl/operators/ClPRelu.cpp",
         "src/gpu/cl/operators/ClPermute.cpp",
@@ -823,6 +824,7 @@
         "src/runtime/CL/functions/CLLogicalAnd.cpp",
         "src/runtime/CL/functions/CLLogicalNot.cpp",
         "src/runtime/CL/functions/CLLogicalOr.cpp",
+        "src/runtime/CL/functions/CLMatMul.cpp",
         "src/runtime/CL/functions/CLMaxUnpoolingLayer.cpp",
         "src/runtime/CL/functions/CLMeanStdDevNormalizationLayer.cpp",
         "src/runtime/CL/functions/CLNormalizationLayer.cpp",