Port NEGEMMLowp Part 2

Details:
Extend NEConvertQuantizedSignednessKernel and port it to CpuConvertQuantizedSignednessKernel
Port NEGEMMInterleave4x4Kernel to CpuGemmInterleave4x4Kernel
Port NEGEMMTranspose1xWKernel to CpuGemmTranspose1xWKernel
Port NEGEMMLowpMatrixAReductionKernel to CpuGemmLowpMatrixAReductionKernel
Port NEGEMMLowpMatrixBReductionKernel to CpuGemmLowpMatrixBReductionKernel
Port NEGEMMLowpOffsetContributionOutputStageKernel to CpuGemmLowpOffsetContributionOutputStageKernel
Port NEGEMMLowpOffsetContributionKernel to CpuGemmLowpOffsetContributionKernel

Resolves: COMPMID-4403

Change-Id: I3227f052f25e7b41d073bbea1da8a881fcd78b8e
Signed-off-by: Manuel Bottini <manuel.bottini@arm.com>
Reviewed-on: https://review.mlplatform.org/c/ml/ComputeLibrary/+/5875
Comments-Addressed: Arm Jenkins <bsgcomp@arm.com>
Tested-by: Arm Jenkins <bsgcomp@arm.com>
Reviewed-by: Michele Di Giorgio <michele.digiorgio@arm.com>
diff --git a/filelist.json b/filelist.json
index 061c3e8..5627495 100644
--- a/filelist.json
+++ b/filelist.json
@@ -844,7 +844,7 @@
       "ConvertQuantizedSignedness": {
         "files": {
           "kernel": [
-            "src/core/NEON/kernels/NEConvertQuantizedSignednessKernel.cpp"
+            "src/core/cpu/kernels/CpuConvertQuantizedSignednessKernel.cpp"
           ]
         }
       },
@@ -1132,16 +1132,19 @@
           "GemmAssemblyDispatch"
         ],
         "files": {
-          "operator" : ["src/runtime/cpu/operators/CpuGemmLowpOutputStage.cpp"],
+          "operator" : [
+              "src/runtime/cpu/operators/CpuGemmLowpOutputStage.cpp",
+              "src/runtime/cpu/operators/CpuGemmLowpMatrixMultiplyCore.cpp"
+          ],
           "kernel": [
-            "src/core/NEON/kernels/NEGEMMLowpMatrixMultiplyKernel.cpp",
             "src/core/cpu/kernels/CpuGemmLowpQuantizeDownInt32ScaleKernel.cpp",
             "src/core/cpu/kernels/CpuGemmLowpQuantizeDownInt32ToInt16ScaleByFixedPointKernel.cpp",
             "src/core/cpu/kernels/CpuGemmLowpQuantizeDownInt32ToInt8ScaleByFixedPointKernel.cpp",
             "src/core/cpu/kernels/CpuGemmLowpQuantizeDownInt32ToUint8ScaleByFixedPointKernel.cpp",
-            "src/core/NEON/kernels/NEGEMMLowpReductionKernel.cpp",
-            "src/core/NEON/kernels/NEGEMMLowpOffsetContributionOutputStageKernel.cpp",
-            "src/core/NEON/kernels/NEGEMMLowpOffsetContributionKernel.cpp"
+            "src/core/cpu/kernels/CpuGemmLowpMatrixMultiplyKernel.cpp",
+            "src/core/cpu/kernels/CpuGemmLowpMatrixReductionKernel.cpp",
+            "src/core/cpu/kernels/CpuGemmLowpOffsetContributionOutputStageKernel.cpp",
+            "src/core/cpu/kernels/CpuGemmLowpOffsetContributionKernel.cpp"
           ]
         }
       },