blob: d64d9e175dc9ce3d00151f662186dc7253e949ea [file] [log] [blame]
Georgios Pinitasbdcdc392021-04-22 16:42:03 +01001{
Michalis Spyrou20fca522021-06-07 14:23:57 +01002 "common": [
3 "src/common/cpuinfo/CpuInfo.cpp",
4 "src/common/cpuinfo/CpuModel.cpp",
5 "src/common/cpuinfo/CpuIsaInfo.cpp",
6 "src/common/utils/LegacySupport.cpp",
7 "src/common/AllocatorWrapper.cpp",
8 "src/common/ITensorV2.cpp",
Georgios Pinitas41648142021-08-03 08:24:00 +01009 "src/common/TensorPack.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +010010 "src/common/IOperator.cpp",
11 "src/core/AccessWindowAutoPadding.cpp",
12 "src/core/AccessWindowStatic.cpp",
13 "src/core/AccessWindowTranspose.cpp",
14 "src/core/Error.cpp",
15 "src/core/GPUTarget.cpp",
16 "src/core/Helpers.cpp",
17 "src/core/IAccessWindow.cpp",
18 "src/core/IKernel.cpp",
19 "src/core/ITensor.cpp",
20 "src/core/ITensorPack.cpp",
21 "src/core/Rounding.cpp",
22 "src/core/Size2D.cpp",
23 "src/core/SubTensorInfo.cpp",
24 "src/core/TensorInfo.cpp",
25 "src/core/Utils.cpp",
26 "src/core/Validate.cpp",
27 "src/core/Version.cpp",
28 "src/core/helpers/SoftmaxHelpers.cpp",
29 "src/core/helpers/WindowHelpers.cpp",
30 "src/core/utils/AssemblyUtils.cpp",
31 "src/core/utils/ScaleUtils.cpp",
32 "src/core/utils/helpers/fft.cpp",
33 "src/core/utils/helpers/tensor_transform.cpp",
34 "src/core/utils/io/FileHandler.cpp",
35 "src/core/utils/misc/MMappedFile.cpp",
36 "src/core/utils/quantization/AsymmHelpers.cpp",
37 "src/core/CPP/CPPTypes.cpp",
38 "src/core/CPP/kernels/CPPBoxWithNonMaximaSuppressionLimitKernel.cpp",
39 "src/core/CPP/kernels/CPPNonMaximumSuppressionKernel.cpp",
40 "src/core/CPP/kernels/CPPPermuteKernel.cpp",
41 "src/core/CPP/kernels/CPPTopKVKernel.cpp",
42 "src/core/CPP/kernels/CPPUpsampleKernel.cpp",
43 "src/runtime/Allocator.cpp",
44 "src/runtime/BlobLifetimeManager.cpp",
45 "src/runtime/BlobMemoryPool.cpp",
46 "src/runtime/ISimpleLifetimeManager.cpp",
47 "src/runtime/ITensorAllocator.cpp",
48 "src/runtime/IWeightsManager.cpp",
49 "src/runtime/IScheduler.cpp",
50 "src/runtime/Memory.cpp",
51 "src/runtime/MemoryManagerOnDemand.cpp",
52 "src/runtime/OffsetLifetimeManager.cpp",
53 "src/runtime/OffsetMemoryPool.cpp",
54 "src/runtime/OperatorTensor.cpp",
55 "src/runtime/PoolManager.cpp",
56 "src/runtime/RuntimeContext.cpp",
57 "src/runtime/Scheduler.cpp",
58 "src/runtime/SchedulerFactory.cpp",
59 "src/runtime/SchedulerUtils.cpp",
60 "src/runtime/SubTensor.cpp",
61 "src/runtime/Tensor.cpp",
62 "src/runtime/TensorAllocator.cpp",
63 "src/runtime/Utils.cpp",
64 "src/runtime/CPP/ICPPSimpleFunction.cpp",
65 "src/runtime/CPP/functions/CPPBoxWithNonMaximaSuppressionLimit.cpp",
66 "src/runtime/CPP/functions/CPPDetectionOutputLayer.cpp",
67 "src/runtime/CPP/functions/CPPDetectionPostProcessLayer.cpp",
68 "src/runtime/CPP/functions/CPPNonMaximumSuppression.cpp",
69 "src/runtime/CPP/functions/CPPPermute.cpp",
70 "src/runtime/CPP/functions/CPPTopKV.cpp",
71 "src/runtime/CPP/functions/CPPUpsample.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +010072 ],
Georgios Pinitasb6af4822021-09-14 12:33:34 +010073 "logging": [
74 "src/core/utils/logging/FilePrinter.cpp",
75 "src/core/utils/logging/Helpers.cpp",
76 "src/core/utils/logging/Logger.cpp",
77 "src/core/utils/logging/LoggerRegistry.cpp"
78 ],
79 "scheduler": {
80 "single": [ "src/runtime/CPP/SingleThreadScheduler.cpp" ],
81 "threads": [ "src/runtime/CPP/CPPScheduler.cpp" ],
82 "omp": [ "src/runtime/OMP/OMPScheduler.cpp"]
83 },
Michalis Spyrou20fca522021-06-07 14:23:57 +010084 "c_api": {
Georgios Pinitas13ef1762021-07-14 17:14:43 +010085 "common": [
Michalis Spyrou20fca522021-06-07 14:23:57 +010086 "src/c/AclContext.cpp",
Georgios Pinitas06ac6e42021-07-05 08:08:52 +010087 "src/c/AclOperator.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +010088 "src/c/AclQueue.cpp",
89 "src/c/AclTensor.cpp",
90 "src/c/AclTensorPack.cpp",
91 "src/c/AclVersion.cpp"
Georgios Pinitasbdcdc392021-04-22 16:42:03 +010092 ],
Georgios Pinitas13ef1762021-07-14 17:14:43 +010093 "cpu": [
94 ],
Michalis Spyrou20fca522021-06-07 14:23:57 +010095 "gpu": [
96 "src/c/cl/AclOpenClExt.cpp"
Georgios Pinitas41648142021-08-03 08:24:00 +010097 ],
98 "operators":
99 [
100 "src/c/operators/AclActivation.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +0100101 ]
102 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100103 "high_priority": [
104 "Activation",
105 "DepthwiseConv2d",
106 "Conv2d",
107 "Permute",
108 "Pool2d",
109 "Reshape"
110 ],
Michalis Spyrou20fca522021-06-07 14:23:57 +0100111 "gpu": {
Georgios Pinitas13ef1762021-07-14 17:14:43 +0100112 "common": [
113 "src/core/CL/CLCompileContext.cpp",
Giorgio Arenaba2dd822021-07-28 16:10:03 +0100114 "src/core/CL/DefaultLWSHeuristics.cpp",
Georgios Pinitas13ef1762021-07-14 17:14:43 +0100115 "src/core/CL/CLHelpers.cpp",
116 "src/core/CL/CLKernelLibrary.cpp",
117 "src/core/CL/CLUtils.cpp",
118 "src/core/CL/ICLKernel.cpp",
119 "src/core/CL/ICLSimple2DKernel.cpp",
120 "src/core/CL/ICLSimple3DKernel.cpp",
121 "src/core/CL/ICLSimpleKernel.cpp",
122 "src/core/CL/ICLTensor.cpp",
123 "src/core/CL/OpenCL.cpp",
Georgios Pinitas13ef1762021-07-14 17:14:43 +0100124 "src/gpu/cl/ClContext.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100125 "src/gpu/cl/ClKernelLibrary.cpp",
Georgios Pinitas13ef1762021-07-14 17:14:43 +0100126 "src/gpu/cl/ClQueue.cpp",
127 "src/gpu/cl/ClTensor.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100128 "src/core/CL/kernels/CLFillBorderKernel.cpp",
Georgios Pinitas13ef1762021-07-14 17:14:43 +0100129 "src/runtime/CL/CLBufferAllocator.cpp",
130 "src/runtime/CL/CLGEMMHeuristicsHandle.cpp",
131 "src/runtime/CL/CLHelpers.cpp",
132 "src/runtime/CL/CLMemory.cpp",
133 "src/runtime/CL/CLMemoryRegion.cpp",
134 "src/runtime/CL/CLOperator.cpp",
135 "src/runtime/CL/CLRuntimeContext.cpp",
136 "src/runtime/CL/CLScheduler.cpp",
137 "src/runtime/CL/CLSubTensor.cpp",
138 "src/runtime/CL/CLTensor.cpp",
139 "src/runtime/CL/CLTensorAllocator.cpp",
140 "src/runtime/CL/CLTuner.cpp",
141 "src/runtime/CL/ICLSimpleFunction.cpp",
142 "src/runtime/CL/Utils.cpp",
Georgios Pinitas13ef1762021-07-14 17:14:43 +0100143 "src/runtime/CL/mlgo/HeuristicTree.cpp",
144 "src/runtime/CL/mlgo/MLGOHeuristics.cpp",
145 "src/runtime/CL/mlgo/MLGOParser.cpp",
146 "src/runtime/CL/mlgo/Utils.cpp",
147 "src/runtime/CL/tuners/CLTuningParametersList.cpp"
148 ],
Michalis Spyrou20fca522021-06-07 14:23:57 +0100149 "operators": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100150 "Activation":{
151 "files": {
152 "common": [
153 "src/gpu/cl/kernels/ClActivationKernel.cpp",
154 "src/gpu/cl/operators/ClActivation.cpp",
155 "src/runtime/CL/functions/CLActivationLayer.cpp"
156 ]
157 }
158 },
159 "ArgMinMax": {
160 "deps": [ "Reshape" ],
161 "files": {
162 "common": [
163 "src/core/CL/kernels/CLArgMinMaxLayerKernel.cpp",
164 "src/runtime/CL/functions/CLArgMinMaxLayer.cpp"
165 ]
166 }
167 },
168 "Add": {
169 "files": {
170 "common": [
171 "src/gpu/cl/kernels/ClElementwiseKernel.cpp",
172 "src/gpu/cl/operators/ClAdd.cpp"
173 ]
174 }
175 },
176 "BatchNormalization": {
177 "files": {
178 "common": [
179 "src/core/CL/kernels/CLBatchNormalizationLayerKernel.cpp",
180 "src/core/CL/kernels/CLFuseBatchNormalizationKernel.cpp",
181 "src/runtime/CL/functions/CLBatchNormalizationLayer.cpp",
182 "src/runtime/CL/functions/CLFuseBatchNormalization.cpp"
183 ]
184 }
185 },
186 "BatchToSpace": {
187 "files": {
188 "common": [
189 "src/core/CL/kernels/CLBatchToSpaceLayerKernel.cpp",
190 "src/runtime/CL/functions/CLBatchToSpaceLayer.cpp"
191 ]
192 }
193 },
194 "Bitwise": {
195 "files": {
196 "common": [ "src/core/CL/kernels/CLBitwiseKernel.cpp" ]
197 }
198 },
199 "BitwiseAnd": {
200 "deps": [ "Bitwise" ],
201 "files": {
202 "common": [ "src/runtime/CL/functions/CLBitwiseAnd.cpp" ]
203 }
204 },
205 "BitwiseNot": {
206 "deps": [ "Bitwise" ],
207 "files": {
208 "common": [ "src/runtime/CL/functions/CLBitwiseNot.cpp" ]
209 }
210 },
211 "BitwiseOr": {
212 "deps": [ "Bitwise" ],
213 "files": {
214 "common": [ "src/runtime/CL/functions/CLBitwiseOr.cpp" ]
215 }
216 },
217 "BitwiseXor": {
218 "deps": [ "Bitwise" ],
219 "files": {
220 "common": [ "src/runtime/CL/functions/CLBitwiseXor.cpp" ]
221 }
222 },
223 "BoundingBoxTransform": {
224 "files": {
225 "common": [
226 "src/core/CL/kernels/CLBoundingBoxTransformKernel.cpp",
227 "src/runtime/CL/functions/CLBoundingBoxTransform.cpp"
228 ]
229 }
230 },
231 "Cast": {
232 "files": {
233 "common": [
234 "src/gpu/cl/kernels/ClCastKernel.cpp",
235 "src/gpu/cl/operators/ClCast.cpp",
236 "src/runtime/CL/functions/CLCast.cpp"
237 ]
238 }
239 },
240 "ChannelShuffle": {
241 "files": {
242 "common": [
243 "src/core/CL/kernels/CLChannelShuffleLayerKernel.cpp",
244 "src/runtime/CL/functions/CLChannelShuffleLayer.cpp"
245 ]
246 }
247 },
248 "Comparison": {
249 "files": {
250 "common": [
251 "src/core/CL/kernels/CLComparisonKernel.cpp",
252 "src/runtime/CL/functions/CLComparison.cpp"
253 ]
254 }
255 },
256 "Concatenate": {
257 "files": {
258 "common": [
259 "src/gpu/cl/kernels/ClBatchConcatenateKernel.cpp",
260 "src/gpu/cl/kernels/ClDepthConcatenateKernel.cpp",
261 "src/gpu/cl/kernels/ClHeightConcatenateKernel.cpp",
262 "src/gpu/cl/kernels/ClWidthConcatenate2TensorsKernel.cpp",
263 "src/gpu/cl/kernels/ClWidthConcatenate4TensorsKernel.cpp",
264 "src/gpu/cl/kernels/ClWidthConcatenateKernel.cpp",
265 "src/gpu/cl/operators/ClConcatenate.cpp",
266 "src/runtime/CL/functions/CLConcatenateLayer.cpp"
267 ]
268 }
269 },
270 "Conv2d": {
271 "deps": [
272 "Activation",
273 "ElementwiseBinary",
274 "FFT2D",
275 "Gemm",
276 "Mul",
277 "Pad",
278 "Permute",
279 "Reduction",
280 "Reshape",
281 "Reverse",
282 "Slice"
283 ],
284 "files": {
285 "common": [
286 "src/gpu/cl/kernels/ClDirectConv2dKernel.cpp",
287 "src/gpu/cl/kernels/ClWinogradFilterTransformKernel.cpp",
288 "src/gpu/cl/kernels/ClWinogradInputTransformKernel.cpp",
289 "src/gpu/cl/kernels/ClWinogradOutputTransformKernel.cpp",
290 "src/gpu/cl/kernels/ClIm2ColKernel.cpp",
Gian Marco Iodice5d016812022-11-17 11:03:39 +0000291 "src/gpu/cl/kernels/ClIndirectConv2dAddressPrecalculationKernel.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100292 "src/gpu/cl/kernels/ClCol2ImKernel.cpp",
293 "src/gpu/cl/operators/ClConv2d.cpp",
294 "src/gpu/cl/operators/ClDirectConv2d.cpp",
295 "src/gpu/cl/operators/ClGemmConv2d.cpp",
296 "src/gpu/cl/operators/ClWinogradConv2d.cpp",
297 "src/gpu/cl/kernels/ClWeightsReshapeKernel.cpp",
298 "src/runtime/CL/functions/CLConvolutionLayer.cpp",
299 "src/runtime/CL/functions/CLDirectConvolutionLayer.cpp",
300 "src/runtime/CL/functions/CLFFTConvolutionLayer.cpp",
301 "src/runtime/CL/functions/CLGEMMConvolutionLayer.cpp",
302 "src/runtime/CL/functions/CLWinogradConvolutionLayer.cpp"
303 ]
304 }
305 },
Giorgio Arena273c28c2021-10-14 15:59:15 +0100306 "Conv3d": {
307 "files": {
308 "common": [
309 "src/gpu/cl/kernels/ClDirectConv3dKernel.cpp",
310 "src/gpu/cl/operators/ClDirectConv3d.cpp",
311 "src/runtime/CL/functions/CLConv3D.cpp"
312 ]
313 }
314 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100315 "Copy": {
316 "files": {
317 "common": [
318 "src/gpu/cl/kernels/ClCopyKernel.cpp",
319 "src/gpu/cl/operators/ClCopy.cpp",
320 "src/runtime/CL/functions/CLCopy.cpp"
321 ]
322 }
323 },
324 "CropResize": {
325 "deps": [ "Copy", "Fill", "Scale" ],
326 "files": {
327 "common": [
328 "src/gpu/cl/kernels/ClCropKernel.cpp",
329 "src/gpu/cl/operators/ClCrop.cpp",
330 "src/runtime/CL/functions/CLCrop.cpp",
331 "src/runtime/CL/functions/CLCropResize.cpp"
332 ]
333 }
334 },
335 "Deconv2d": {
336 "deps": [ "Conv2d", "Reverse", "Transpose"],
337 "files": {
338 "common": [
339 "src/core/CL/kernels/CLDeconvolutionLayerUpsampleKernel.cpp",
340 "src/core/CL/kernels/CLDeconvolutionReshapeOutputKernel.cpp",
Gunes Bayirec0113d2022-11-09 09:26:27 +0000341 "src/gpu/cl/kernels/ClTransposedConvolutionKernel.cpp",
342 "src/gpu/cl/operators/ClTransposedConvolution.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100343 "src/runtime/CL/functions/CLDeconvolutionLayer.cpp",
344 "src/runtime/CL/functions/CLDeconvolutionLayerUpsample.cpp",
345 "src/runtime/CL/functions/CLDirectDeconvolutionLayer.cpp",
346 "src/runtime/CL/functions/CLGEMMDeconvolutionLayer.cpp"
347 ]
348 }
349 },
350 "DepthConvert": {
351 "deps": [ "Cast"],
352 "files": {
353 "common": [ "src/runtime/CL/functions/CLDepthConvertLayer.cpp" ]
354 }
355 },
356 "DepthToSpace": {
357 "files": {
358 "common": [
359 "src/core/CL/kernels/CLDepthToSpaceLayerKernel.cpp",
360 "src/runtime/CL/functions/CLDepthToSpaceLayer.cpp"
361 ]
362 }
363 },
364 "DepthwiseConv2d": {
365 "deps": [ "Permute" ],
366 "files": {
367 "common": [
368 "src/core/CL/kernels/CLDepthwiseConvolutionLayerNativeKernel.cpp",
369 "src/runtime/CL/functions/CLDepthwiseConvolutionLayer.cpp"
370 ]
371 }
372 },
373 "Dequantize": {
374 "files": {
375 "common": [
376 "src/gpu/cl/kernels/ClDequantizeKernel.cpp",
377 "src/gpu/cl/operators/ClDequantize.cpp",
378 "src/runtime/CL/functions/CLDequantizationLayer.cpp"
379 ]
380 }
381 },
382 "ElementwiseBinary": {
383 "deps": ["Add", "Sub"],
384 "files": {
385 "common": [
386 "src/gpu/cl/kernels/ClElementwiseKernel.cpp",
387 "src/gpu/cl/operators/ClElementwiseOperations.cpp",
388 "src/runtime/CL/functions/CLElementwiseOperations.cpp"
389 ]
390 }
391 },
392 "ElementwiseUnary":{
393 "files": {
394 "common": [
395 "src/gpu/cl/kernels/ClElementwiseUnaryKernel.cpp",
396 "src/gpu/cl/operators/ClElementwiseUnary.cpp",
397 "src/runtime/CL/functions/CLElementwiseUnaryLayer.cpp"
398 ]
399 }
400 },
401 "FFT1D": {
402 "files": {
403 "common": [
404 "src/core/CL/kernels/CLFFTDigitReverseKernel.cpp",
405 "src/core/CL/kernels/CLFFTRadixStageKernel.cpp",
406 "src/core/CL/kernels/CLFFTScaleKernel.cpp",
407 "src/runtime/CL/functions/CLFFT1D.cpp"
408 ]
409 }
410 },
411 "FFT2D": {
412 "deps": [ "FFT1D" ],
413 "files": {
414 "common": [ "src/runtime/CL/functions/CLFFT2D.cpp" ]
415 }
416 },
417 "Fill": {
418 "files": {
419 "common": [
420 "src/gpu/cl/kernels/ClFillKernel.cpp",
421 "src/gpu/cl/operators/ClFill.cpp",
422 "src/runtime/CL/functions/CLFill.cpp"
423 ]
424 }
425 },
426 "Flatten": {
427 "files": {
428 "common": [
429 "src/gpu/cl/operators/ClFlatten.cpp",
430 "src/runtime/CL/functions/CLFlattenLayer.cpp"
431 ]
432 }
433 },
434 "Floor": {
435 "files": {
436 "common": [
437 "src/gpu/cl/kernels/ClFloorKernel.cpp",
438 "src/gpu/cl/operators/ClFloor.cpp",
439 "src/runtime/CL/functions/CLFloor.cpp"
440 ]
441 }
442 },
443 "FullyConnected": {
444 "deps": [ "Flatten", "Gemm", "Transpose"],
445 "files": {
446 "common": [
447 "src/gpu/cl/kernels/ClConvertFullyConnectedWeightsKernel.cpp",
448 "src/gpu/cl/operators/ClConvertFullyConnectedWeights.cpp",
449 "src/gpu/cl/operators/ClFullyConnected.cpp",
450 "src/runtime/CL/functions/CLConvertFullyConnectedWeights.cpp",
451 "src/runtime/CL/functions/CLFullyConnectedLayer.cpp"
452 ]
453 }
454 },
455 "Gather": {
456 "files": {
457 "common": [
458 "src/core/CL/kernels/CLGatherKernel.cpp",
459 "src/runtime/CL/functions/CLGather.cpp"]
460 }
461 },
462 "Gemm": {
463 "deps": [ "Cast" ],
464 "files": {
465 "common": [
Gian Marco Iodice2cc50b32022-05-30 14:41:49 +0100466 "src/gpu/cl/kernels/direct_conv/ClDirectConvDefaultConfigBifrost.cpp",
467 "src/gpu/cl/kernels/direct_conv/ClDirectConvDefaultConfigValhall.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100468 "src/gpu/cl/kernels/gemm/ClGemmHelpers.cpp",
469 "src/gpu/cl/kernels/gemm/native/ClGemmDefaultConfigNativeBifrost.cpp",
470 "src/gpu/cl/kernels/gemm/native/ClGemmDefaultConfigNativeMidgard.cpp",
471 "src/gpu/cl/kernels/gemm/native/ClGemmDefaultConfigNativeValhall.cpp",
472 "src/gpu/cl/kernels/gemm/reshaped/ClGemmDefaultConfigReshapedBifrost.cpp",
473 "src/gpu/cl/kernels/gemm/reshaped/ClGemmDefaultConfigReshapedValhall.cpp",
474 "src/gpu/cl/kernels/gemm/reshaped_only_rhs/ClGemmDefaultConfigReshapedRhsOnlyBifrost.cpp",
475 "src/gpu/cl/kernels/gemm/reshaped_only_rhs/ClGemmDefaultConfigReshapedRhsOnlyValhall.cpp",
476 "src/gpu/cl/kernels/ClGemmLowpMatrixMultiplyNativeKernel.cpp",
477 "src/gpu/cl/kernels/ClGemmLowpMatrixMultiplyReshapedKernel.cpp",
478 "src/gpu/cl/kernels/ClGemmLowpMatrixMultiplyReshapedOnlyRhsKernel.cpp",
Freddie Liardete572dff2022-05-16 14:09:10 +0100479 "src/gpu/cl/kernels/ClGemmLowpMatrixMultiplyReshapedOnlyRhsMMULKernel.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100480 "src/gpu/cl/kernels/ClGemmLowpOffsetContributionKernel.cpp",
481 "src/gpu/cl/kernels/ClGemmLowpOffsetContributionOutputStageKernel.cpp",
482 "src/gpu/cl/kernels/ClGemmLowpQuantizeDownInt32ScaleByFixedPointKernel.cpp",
483 "src/gpu/cl/kernels/ClGemmLowpQuantizeDownInt32ScaleByFloatKernel.cpp",
484 "src/gpu/cl/kernels/ClGemmLowpQuantizeDownInt32ScaleKernel.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100485 "src/gpu/cl/kernels/ClGemmMatrixMultiplyNativeKernel.cpp",
Gunes Bayir4bfc70e2021-12-10 16:17:56 +0000486 "src/gpu/cl/kernels/ClGemmMatrixMultiplyReshapedOnlyRhsMMULKernel.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100487 "src/gpu/cl/kernels/ClGemmMatrixMultiplyReshapedKernel.cpp",
488 "src/gpu/cl/kernels/ClGemmMatrixMultiplyReshapedOnlyRhsKernel.cpp",
489 "src/gpu/cl/kernels/ClGemmReshapeLhsMatrixKernel.cpp",
490 "src/gpu/cl/kernels/ClGemmReshapeRhsMatrixKernel.cpp",
491 "src/gpu/cl/kernels/ClGemmLowpReductionKernel.cpp",
492 "src/gpu/cl/operators/ClGemm.cpp",
493 "src/gpu/cl/operators/ClGemmLowpMatrixMultiplyCore.cpp",
494 "src/gpu/cl/operators/ClGemmLowpOutputStage.cpp",
495 "src/runtime/CL/gemm/CLGEMMDefaultTypeBifrost.cpp",
496 "src/runtime/CL/gemm/CLGEMMDefaultTypeMidgard.cpp",
497 "src/runtime/CL/gemm/CLGEMMDefaultTypeValhall.cpp",
498 "src/runtime/CL/gemm_auto_heuristics/CLGEMMAutoHeuristics.cpp",
499 "src/runtime/CL/functions/CLGEMM.cpp",
500 "src/runtime/CL/functions/CLGEMMLowpMatrixMultiplyCore.cpp",
501 "src/runtime/CL/functions/CLGEMMLowpOutputStage.cpp"
502 ]
503 }
504 },
505 "GenerateProposals": {
506 "deps": [ "BoundingBoxTransform", "Dequantize", "Pad", "Permute", "Quantize", "Reshape" ],
507 "files": {
508 "common": [
509 "src/core/CL/kernels/CLGenerateProposalsLayerKernel.cpp",
510 "src/runtime/CL/functions/CLGenerateProposalsLayer.cpp"
511 ]
512 }
513 },
514 "InstanceNormalize": {
515 "files": {
516 "common": [
517 "src/core/CL/kernels/CLInstanceNormalizationLayerKernel.cpp",
518 "src/runtime/CL/functions/CLInstanceNormalizationLayer.cpp"
519 ]
520 }
521 },
522 "L2Normalize": {
523 "deps": [ "Reduction" ],
524 "files": {
525 "common": [
526 "src/core/CL/kernels/CLL2NormalizeLayerKernel.cpp",
527 "src/runtime/CL/functions/CLL2NormalizeLayer.cpp"
528 ]
529 }
530 },
531 "Logical": {
532 "files": {
533 "common": [
534 "src/gpu/cl/operators/ClLogicalNot.cpp",
535 "src/runtime/CL/functions/CLLogicalAnd.cpp",
536 "src/runtime/CL/functions/CLLogicalNot.cpp",
537 "src/runtime/CL/functions/CLLogicalOr.cpp"
538 ]
539 }
540 },
541 "LSTM": {
542 "deps": [
543 "Activation",
544 "Concatenate",
545 "Copy",
546 "Dequantize",
547 "ElementwiseBinary",
548 "Fill",
549 "FullyConnected",
550 "Gemm",
551 "MeanStdDevNormalize",
552 "Mul",
553 "Quantize",
554 "Slice",
555 "Transpose"
556 ],
557 "files": {
558 "common": [
559 "src/core/CL/kernels/CLQLSTMLayerNormalizationKernel.cpp",
560 "src/runtime/CL/functions/CLQLSTMLayer.cpp",
561 "src/runtime/CL/functions/CLLSTMLayer.cpp",
562 "src/runtime/CL/functions/CLLSTMLayerQuantized.cpp"
563 ]
564 }
565 },
566 "MaxUnpool2d": {
567 "deps": [ "Fill" ],
568 "files": {
569 "common": [
570 "src/core/CL/kernels/CLMaxUnpoolingLayerKernel.cpp",
571 "src/runtime/CL/functions/CLMaxUnpoolingLayer.cpp"
572 ]
573 }
574 },
575 "MeanStdDevNormalize": {
576 "deps": [ "Reduction" ],
577 "files": {
578 "common": [
579 "src/core/CL/kernels/CLMeanStdDevNormalizationKernel.cpp",
580 "src/runtime/CL/functions/CLMeanStdDevNormalizationLayer.cpp",
581 "src/runtime/CL/functions/CLReduceMean.cpp"
582 ]
583 }
584 },
585 "Mul": {
586 "files": {
587 "common": [
588 "src/gpu/cl/kernels/ClMulKernel.cpp",
589 "src/gpu/cl/operators/ClMul.cpp",
590 "src/runtime/CL/functions/CLPixelWiseMultiplication.cpp"
591 ]
592 }
593 },
594 "Normalize": {
595 "files": {
596 "common": [
597 "src/core/CL/kernels/CLNormalizationLayerKernel.cpp",
598 "src/runtime/CL/functions/CLNormalizationLayer.cpp"
599 ]
600 }
601 },
602 "Pad": {
603 "deps": [ "Copy" ],
604 "files": {
605 "common": [
606 "src/core/CL/kernels/CLPadLayerKernel.cpp",
607 "src/runtime/CL/functions/CLPadLayer.cpp"
608 ]
609 }
610 },
611 "Permute": {
612 "files": {
613 "common": [
614 "src/gpu/cl/kernels/ClPermuteKernel.cpp",
615 "src/gpu/cl/operators/ClPermute.cpp",
616 "src/runtime/CL/functions/CLPermute.cpp"
617 ]
618 }
619 },
620 "Pool2d": {
621 "files": {
622 "common": [
623 "src/gpu/cl/kernels/ClPool2dKernel.cpp",
624 "src/gpu/cl/operators/ClPool2d.cpp",
625 "src/runtime/CL/functions/CLPoolingLayer.cpp"
626 ]
627 }
628 },
ramelg0137515692022-02-26 22:06:20 +0000629 "Pool3d": {
630 "files": {
631 "common": [
632 "src/gpu/cl/kernels/ClPool3dKernel.cpp",
633 "src/gpu/cl/operators/ClPool3d.cpp",
634 "src/runtime/CL/functions/CLPooling3dLayer.cpp"
635 ]
636 }
637 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100638 "PRelu": {
639 "deps": [ "ElementwiseBinary" ],
640 "files": {
641 "common": [
642 "src/gpu/cl/operators/ClPRelu.cpp",
643 "src/runtime/CL/functions/CLPReluLayer.cpp"
644 ]
645 }
646 },
647 "PriorBox": {
648 "files": {
649 "common": [
650 "src/core/CL/kernels/CLPriorBoxLayerKernel.cpp",
651 "src/runtime/CL/functions/CLPriorBoxLayer.cpp"
652 ]
653 }
654 },
655 "Quantize": {
656 "files": {
657 "common": [
658 "src/gpu/cl/kernels/ClQuantizeKernel.cpp",
659 "src/gpu/cl/operators/ClQuantize.cpp",
660 "src/runtime/CL/functions/CLQuantizationLayer.cpp"
661 ]
662 }
663 },
664 "Range": {
665 "files": {
666 "common": [
667 "src/core/CL/kernels/CLRangeKernel.cpp",
668 "src/runtime/CL/functions/CLRange.cpp"
669 ]
670 }
671 },
672 "Reduction": {
673 "deps": [ "Reshape" ],
674 "files": {
ramelg01a1f78512022-06-29 16:28:10 +0100675 "common": [
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100676 "src/core/CL/kernels/CLReductionOperationKernel.cpp",
677 "src/runtime/CL/functions/CLReductionOperation.cpp"
678 ]
679 }
680 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100681 "Reorg": {
682 "files": {
683 "common": [
684 "src/core/CL/kernels/CLReorgLayerKernel.cpp",
685 "src/runtime/CL/functions/CLReorgLayer.cpp"
686 ]
687 }
688 },
689 "Reshape": {
690 "files": {
691 "common": [
692 "src/gpu/cl/kernels/ClReshapeKernel.cpp",
693 "src/gpu/cl/operators/ClReshape.cpp",
694 "src/runtime/CL/functions/CLReshapeLayer.cpp"
695 ]
696 }
697 },
698 "Reverse": {
699 "files": {
700 "common": [
701 "src/core/CL/kernels/CLReverseKernel.cpp",
702 "src/runtime/CL/functions/CLReverse.cpp"
703 ]
704 }
705 },
706 "RNN": {
707 "deps": [ "Activation", "Cast", "ElementwiseBinary", "FullyConnected", "Gemm"],
708 "files": {
709 "common": [ "src/runtime/CL/functions/CLRNNLayer.cpp" ]
710 }
711 },
712 "ROIAlign": {
713 "files": {
714 "common": [
715 "src/core/CL/kernels/CLROIAlignLayerKernel.cpp",
716 "src/runtime/CL/functions/CLROIAlignLayer.cpp"
717 ]
718 }
719 },
720 "ROIPool2d": {
721 "files": {
722 "common": [
723 "src/core/CL/kernels/CLROIPoolingLayerKernel.cpp",
724 "src/runtime/CL/functions/CLROIPoolingLayer.cpp"
725 ]
726 }
727 },
728 "Scale": {
729 "files": {
730 "common": [
731 "src/gpu/cl/kernels/ClScaleKernel.cpp",
732 "src/gpu/cl/operators/ClScale.cpp",
733 "src/runtime/CL/functions/CLScale.cpp"
734 ]
735 }
736 },
737 "Select": {
738 "files": {
739 "common": [
740 "src/core/CL/kernels/CLSelectKernel.cpp",
741 "src/runtime/CL/functions/CLSelect.cpp"
742 ]
743 }
744 },
745 "Slice": {
746 "deps": [ "StridedSlice" ],
747 "files": {
748 "common": [ "src/runtime/CL/functions/CLSlice.cpp" ]
749 }
750 },
751 "Softmax": {
752 "deps": [ "Permute" ],
753 "files": {
754 "common": [
755 "src/gpu/cl/kernels/ClSoftmaxKernel.cpp",
756 "src/gpu/cl/operators/ClSoftmax.cpp",
757 "src/runtime/CL/functions/CLSoftmaxLayer.cpp"
758 ]
759 }
760 },
761 "SpaceToBatch": {
762 "files": {
763 "common": [
764 "src/core/CL/kernels/CLSpaceToBatchLayerKernel.cpp",
765 "src/runtime/CL/functions/CLSpaceToBatchLayer.cpp"
766 ]
767 }
768 },
769 "SpaceToDepth": {
770 "files": {
771 "common": [
772 "src/core/CL/kernels/CLSpaceToDepthLayerKernel.cpp",
773 "src/runtime/CL/functions/CLSpaceToDepthLayer.cpp"
774 ]
775 }
776 },
777 "Split": {
778 "deps": [ "StridedSlice" ],
779 "files": {
780 "common": [ "src/runtime/CL/functions/CLSplit.cpp" ]
781 }
782 },
783 "Stack": {
784 "files": {
785 "common": [
786 "src/core/CL/kernels/CLStackLayerKernel.cpp",
787 "src/runtime/CL/functions/CLStackLayer.cpp"
788 ]
789 }
790 },
791 "StridedSlice": {
792 "files": {
793 "common": [
794 "src/core/CL/kernels/CLStridedSliceKernel.cpp",
795 "src/runtime/CL/functions/CLStridedSlice.cpp"
796 ]
797 }
798 },
799 "Sub": {
800 "files": {
801 "common": [
802 "src/gpu/cl/kernels/ClElementwiseKernel.cpp",
803 "src/gpu/cl/operators/ClSub.cpp"
804 ]
805 }
806 },
807 "Tile": {
808 "files": {
809 "common": [
810 "src/core/CL/kernels/CLTileKernel.cpp",
811 "src/runtime/CL/functions/CLTile.cpp"
812 ]
813 }
814 },
815 "Transpose": {
816 "files": {
817 "common": [
818 "src/gpu/cl/kernels/ClTransposeKernel.cpp",
819 "src/gpu/cl/operators/ClTranspose.cpp",
820 "src/runtime/CL/functions/CLTranspose.cpp"
821 ]
822 }
823 },
824 "Unstack": {
825 "deps": [ "StridedSlice" ],
826 "files": {
827 "common": [ "src/runtime/CL/functions/CLUnstack.cpp" ]
828 }
829 },
830 "YUVNormalize": {
831 "files": {
832 "common": [
833 "src/core/CL/kernels/CLNormalizePlanarYUVLayerKernel.cpp",
834 "src/runtime/CL/functions/CLNormalizePlanarYUVLayer.cpp"
835 ]
Michalis Spyrou20fca522021-06-07 14:23:57 +0100836 }
Georgios Pinitasbdcdc392021-04-22 16:42:03 +0100837 }
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100838 }
839},
Michalis Spyrou20fca522021-06-07 14:23:57 +0100840 "cpu": {
Georgios Pinitas13ef1762021-07-14 17:14:43 +0100841 "common": [
Michalis Spyrou20fca522021-06-07 14:23:57 +0100842 "src/cpu/CpuContext.cpp",
843 "src/cpu/CpuQueue.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100844 "src/cpu/CpuTensor.cpp",
845 "src/core/NEON/kernels/NEFillBorderKernel.cpp",
846 "src/runtime/NEON/INEOperator.cpp",
847 "src/runtime/NEON/INESimpleFunction.cpp",
848 "src/runtime/NEON/INESimpleFunctionNoBorder.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +0100849 ],
850 "operators": {
851 "Activation": {
852 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100853 "common": [
854 "src/cpu/operators/CpuActivation.cpp",
855 "src/cpu/kernels/CpuActivationKernel.cpp",
Dana Zlotnika538ae52022-02-21 13:12:41 +0200856 "src/runtime/NEON/functions/NEActivationLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +0100857 ],
Michalis Spyrou20fca522021-06-07 14:23:57 +0100858 "neon": {
Dana Zlotnik32291712021-11-25 09:58:27 +0200859 "fp16": [ "src/cpu/kernels/activation/generic/neon/fp16.cpp" ],
ramelg01c827e992022-04-08 03:52:28 +0100860 "fp32": [ "src/cpu/kernels/activation/generic/neon/fp32.cpp" ],
Viet-Hoa Do29db3d22022-08-10 11:56:49 +0100861 "qasymm8": [
862 "src/cpu/kernels/activation/generic/neon/qasymm8.cpp",
863 "src/cpu/kernels/activation/generic/neon/lut.cpp"
864 ],
865 "qasymm8_signed": [
866 "src/cpu/kernels/activation/generic/neon/qasymm8_signed.cpp",
867 "src/cpu/kernels/activation/generic/neon/lut.cpp"
868 ],
Dana Zlotnika538ae52022-02-21 13:12:41 +0200869 "qsymm16": [ "src/cpu/kernels/activation/generic/neon/qsymm16.cpp" ]
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100870 },
871 "sve": {
Dana Zlotnik32291712021-11-25 09:58:27 +0200872 "fp16": [ "src/cpu/kernels/activation/generic/sve/fp16.cpp" ],
Pablo Marquez Tellod1586092022-06-10 14:37:10 +0100873 "fp32": [ "src/cpu/kernels/activation/generic/sve/fp32.cpp" ],
874 "qasymm8": ["src/cpu/kernels/activation/generic/sve/lut.cpp"]
ramelg01c827e992022-04-08 03:52:28 +0100875 },
alerah01c9e519d2022-01-31 19:04:10 +0200876 "sve2":{
Dana Zlotnik32291712021-11-25 09:58:27 +0200877 "qasymm8": [ "src/cpu/kernels/activation/generic/sve2/qasymm8.cpp" ],
878 "qasymm8_signed": [ "src/cpu/kernels/activation/generic/sve2/qasymm8_signed.cpp" ],
879 "qsymm16": [ "src/cpu/kernels/activation/generic/sve2/qsymm16.cpp" ]
Michalis Spyrou20fca522021-06-07 14:23:57 +0100880 }
881 }
882 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100883 "ArgMinMax": {
884 "deps": [ "Reduction" ],
885 "files": {
886 "common": [ "src/runtime/NEON/functions/NEArgMinMaxLayer.cpp" ]
887 }
888 },
Michalis Spyrou20fca522021-06-07 14:23:57 +0100889 "Add": {
890 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100891 "common": [
892 "src/cpu/operators/CpuAdd.cpp",
893 "src/cpu/kernels/CpuAddKernel.cpp",
Motti Gondabi9d9ad332022-01-23 12:42:24 +0200894 "src/runtime/NEON/functions/NEArithmeticAddition.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +0100895 ],
Dana Zlotnikbd2942d2021-11-15 08:46:04 +0200896 "neon": {
Motti Gondabi9d9ad332022-01-23 12:42:24 +0200897 "common": ["src/cpu/kernels/add/generic/neon/impl.cpp"],
Dana Zlotnikbd2942d2021-11-15 08:46:04 +0200898 "fp32":["src/cpu/kernels/add/generic/neon/fp32.cpp"],
899 "fp16":["src/cpu/kernels/add/generic/neon/fp16.cpp"],
Motti Gondabi9d9ad332022-01-23 12:42:24 +0200900 "integer":["src/cpu/kernels/add/generic/neon/integer.cpp"],
901 "qasymm8": ["src/cpu/kernels/add/generic/neon/qasymm8.cpp"],
902 "qasymm8_signed": ["src/cpu/kernels/add/generic/neon/qasymm8_signed.cpp"],
903 "qsymm16": ["src/cpu/kernels/add/generic/neon/qsymm16.cpp"]
Dana Zlotnikbd2942d2021-11-15 08:46:04 +0200904 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100905 "sve": {
Dana Zlotnikbd2942d2021-11-15 08:46:04 +0200906 "common": [ "src/cpu/kernels/add/generic/sve/impl.cpp" ],
Dana Zlotnikbd2942d2021-11-15 08:46:04 +0200907 "integer":["src/cpu/kernels/add/generic/sve/integer.cpp"],
Motti Gondabi9d9ad332022-01-23 12:42:24 +0200908 "fp32":["src/cpu/kernels/add/generic/sve/fp32.cpp"],
909 "fp16":["src/cpu/kernels/add/generic/sve/fp16.cpp"]
910 },
911 "sve2": {
Dana Zlotnikbd2942d2021-11-15 08:46:04 +0200912 "qasymm8": [ "src/cpu/kernels/add/generic/sve2/qasymm8.cpp" ],
913 "qasymm8_signed": [ "src/cpu/kernels/add/generic/sve2/qasymm8_signed.cpp" ],
914 "qsymm16": [ "src/cpu/kernels/add/generic/sve2/qsymm16.cpp" ]
Michalis Spyrou20fca522021-06-07 14:23:57 +0100915 }
916 }
917 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100918 "BatchNormalize": {
Michalis Spyrou20fca522021-06-07 14:23:57 +0100919 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100920 "common": [
921 "src/core/NEON/kernels/NEBatchNormalizationLayerKernel.cpp",
922 "src/core/NEON/kernels/NEFuseBatchNormalizationKernel.cpp",
923 "src/runtime/NEON/functions/NEBatchNormalizationLayer.cpp",
924 "src/runtime/NEON/functions/NEFuseBatchNormalization.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +0100925 ],
Michalis Spyrou20fca522021-06-07 14:23:57 +0100926 "neon": {
Yair Schwarzbaum41a729e2021-11-15 20:42:47 +0200927 "common": [
928 "src/cpu/kernels/fuse_batch_normalization/generic/impl.cpp",
929 "src/cpu/kernels/fuse_batch_normalization/nchw/all.cpp",
930 "src/cpu/kernels/fuse_batch_normalization/nhwc/neon/impl.cpp"
931 ],
932 "fp16": [
933 "src/cpu/kernels/fuse_batch_normalization/generic/fp16.cpp",
934 "src/core/NEON/kernels/batchnormalization/impl/NEON/fp16.cpp",
935 "src/cpu/kernels/fuse_batch_normalization/nhwc/neon/fp16.cpp"
936 ],
937 "fp32": [
938 "src/cpu/kernels/fuse_batch_normalization/generic/fp32.cpp",
939 "src/core/NEON/kernels/batchnormalization/impl/NEON/fp32.cpp",
940 "src/cpu/kernels/fuse_batch_normalization/nhwc/neon/fp32.cpp"
941 ]
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100942 },
943 "sve": {
944 "fp16": [ "src/core/NEON/kernels/batchnormalization/impl/SVE/fp16.cpp" ],
945 "fp32": [ "src/core/NEON/kernels/batchnormalization/impl/SVE/fp32.cpp" ]
Michalis Spyrou20fca522021-06-07 14:23:57 +0100946 }
947 }
948 },
949 "BatchToSpace": {
950 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100951 "common": [
952 "src/core/NEON/kernels/NEBatchToSpaceLayerKernel.cpp",
953 "src/runtime/NEON/functions/NEBatchToSpaceLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +0100954 ]
955 }
956 },
957 "BitwiseAnd": {
958 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100959 "common": [
960 "src/core/NEON/kernels/NEBitwiseAndKernel.cpp",
961 "src/runtime/NEON/functions/NEBitwiseAnd.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +0100962 ]
963 }
964 },
965 "BitwiseNot": {
966 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100967 "common": [
968 "src/core/NEON/kernels/NEBitwiseNotKernel.cpp",
969 "src/runtime/NEON/functions/NEBitwiseNot.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +0100970 ]
971 }
972 },
973 "BitwiseOr": {
974 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100975 "common": [
976 "src/core/NEON/kernels/NEBitwiseOrKernel.cpp",
977 "src/runtime/NEON/functions/NEBitwiseOr.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +0100978 ]
979 }
980 },
981 "BitwiseXor": {
982 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100983 "common": [
984 "src/core/NEON/kernels/NEBitwiseXorKernel.cpp",
985 "src/runtime/NEON/functions/NEBitwiseXor.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +0100986 ]
987 }
988 },
989 "BoundingBoxTransform": {
990 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100991 "common": [
992 "src/core/NEON/kernels/NEBoundingBoxTransformKernel.cpp",
993 "src/runtime/NEON/functions/NEBoundingBoxTransform.cpp"
Dana Zlotnik3475ffe2022-01-03 14:37:10 +0200994 ],
995 "neon":{
996 "common":["src/cpu/kernels/boundingboxtransform/generic/neon/impl.cpp"],
997 "fp32":["src/cpu/kernels/boundingboxtransform/generic/neon/fp32.cpp"],
998 "fp16":["src/cpu/kernels/boundingboxtransform/generic/neon/fp16.cpp"],
999 "qsymm16":["src/cpu/kernels/boundingboxtransform/generic/neon/qsymm16.cpp"]
Dana Zlotnik3475ffe2022-01-03 14:37:10 +02001000 }
Michalis Spyrou20fca522021-06-07 14:23:57 +01001001 }
1002 },
1003 "Cast": {
1004 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001005 "common": [
1006 "src/cpu/operators/CpuCast.cpp",
1007 "src/cpu/kernels/CpuCastKernel.cpp",
Yair Schwarzbaum298b2c02022-02-01 08:55:56 +02001008 "src/runtime/NEON/functions/NECast.cpp",
1009 "src/cpu/kernels/cast/generic/neon/bfloat16.cpp"
1010 ],
1011 "neon":{
1012 "fp16":["src/cpu/kernels/cast/generic/neon/fp16.cpp"]
1013 }
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001014 }
1015 },
1016 "ChannelShuffle": {
1017 "files": {
1018 "common": [
1019 "src/core/NEON/kernels/NEChannelShuffleLayerKernel.cpp",
1020 "src/runtime/NEON/functions/NEChannelShuffleLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001021 ]
1022 }
1023 },
1024 "Concatenate": {
1025 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001026 "common": [
1027 "src/cpu/operators/CpuConcatenate.cpp",
Georgios Pinitas7891a732021-08-20 21:39:25 +01001028 "src/cpu/kernels/CpuConcatenateWidthKernel.cpp",
1029 "src/cpu/kernels/CpuConcatenateBatchKernel.cpp",
1030 "src/cpu/kernels/CpuConcatenateDepthKernel.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001031 "src/cpu/kernels/CpuConcatenateHeightKernel.cpp",
1032 "src/runtime/NEON/functions/NEConcatenateLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001033 ]
1034 }
1035 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001036 "Conv2d": {
1037 "deps": [
1038 "Activation",
1039 "ElementwiseBinary",
1040 "FFT2D",
1041 "Gemm",
1042 "Mul",
1043 "Pad",
1044 "Permute",
1045 "Reshape",
1046 "Reverse",
1047 "Slice"
1048 ],
Michalis Spyrou20fca522021-06-07 14:23:57 +01001049 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001050 "common": [
1051 "src/cpu/operators/CpuConv2d.cpp",
1052 "src/cpu/operators/CpuDirectConv2d.cpp",
1053 "src/cpu/operators/CpuGemmDirectConv2d.cpp",
1054 "src/cpu/operators/CpuGemmConv2d.cpp",
1055 "src/cpu/operators/CpuWinogradConv2d.cpp",
1056 "src/cpu/operators/internal/CpuGemmAssemblyDispatch.cpp",
1057 "src/cpu/kernels/CpuDirectConv2dKernel.cpp",
1058 "src/cpu/kernels/CpuDirectConv2dOutputStageKernel.cpp",
1059 "src/cpu/kernels/CpuWinogradConv2dKernel.cpp",
1060 "src/cpu/kernels/CpuCol2ImKernel.cpp",
1061 "src/cpu/kernels/CpuIm2ColKernel.cpp",
1062 "src/cpu/kernels/CpuWeightsReshapeKernel.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001063 "src/runtime/NEON/functions/NEConvolutionLayer.cpp",
1064 "src/runtime/NEON/functions/NEDirectConvolutionLayer.cpp",
1065 "src/runtime/NEON/functions/NEFFTConvolutionLayer.cpp",
1066 "src/runtime/NEON/functions/NEGEMMConv2d.cpp",
1067 "src/runtime/NEON/functions/NEGEMMConvolutionLayer.cpp",
1068 "src/runtime/NEON/functions/NEWinogradConvolutionLayer.cpp"
Motti Gondabi9d9ad332022-01-23 12:42:24 +02001069 ],
1070 "neon": {
1071 "common": [
1072 "src/core/NEON/kernels/convolution/common/padding.cpp",
1073 "src/core/NEON/kernels/convolution/common/qasymm8.cpp",
1074 "src/core/NEON/kernels/convolution/common/qsymm8.cpp",
1075 "src/core/NEON/kernels/convolution/common/utils.cpp",
ramelg01a1f78512022-06-29 16:28:10 +01001076 "src/core/NEON/kernels/convolution/winograd/input_transforms_fp16.cpp",
1077 "src/core/NEON/kernels/convolution/winograd/input_transforms_fp32.cpp",
1078 "src/core/NEON/kernels/convolution/winograd/output_transforms_fp16.cpp",
1079 "src/core/NEON/kernels/convolution/winograd/output_transforms_fp32.cpp",
1080 "src/core/NEON/kernels/convolution/winograd/weight_transforms_fp16.cpp",
1081 "src/core/NEON/kernels/convolution/winograd/weight_transforms_fp32.cpp",
1082 "src/core/NEON/kernels/convolution/winograd/winograd_fp16.cpp",
1083 "src/core/NEON/kernels/convolution/winograd/winograd_fp32.cpp",
1084 "src/core/NEON/kernels/convolution/winograd/input_transforms/a64_fp16_6x6.cpp",
1085 "src/core/NEON/kernels/convolution/winograd/input_transforms/a64_fp32_6x6.cpp",
1086 "src/core/NEON/kernels/convolution/winograd/input_transforms/arm_fp32_1x8.cpp",
1087 "src/core/NEON/kernels/convolution/winograd/input_transforms/arm_fp32_4x4.cpp",
1088 "src/core/NEON/kernels/convolution/winograd/input_transforms/arm_fp32_6x6.cpp",
ramelg01a1f78512022-06-29 16:28:10 +01001089 "src/core/NEON/kernels/convolution/winograd/output_transforms/a64_fp16_4x4_3x3.cpp",
1090 "src/core/NEON/kernels/convolution/winograd/output_transforms/arm_fp32_1x2_1x7.cpp",
1091 "src/core/NEON/kernels/convolution/winograd/output_transforms/arm_fp32_1x4_1x5.cpp",
1092 "src/core/NEON/kernels/convolution/winograd/output_transforms/arm_fp32_1x6_1x3.cpp",
1093 "src/core/NEON/kernels/convolution/winograd/output_transforms/arm_fp32_2x2_3x3.cpp",
1094 "src/core/NEON/kernels/convolution/winograd/output_transforms/arm_fp32_2x2_5x5.cpp",
1095 "src/core/NEON/kernels/convolution/winograd/output_transforms/arm_fp32_4x4_3x3.cpp",
1096 "src/core/NEON/kernels/convolution/winograd/weight_transforms/a64_fp16_4x4_3x3.cpp",
1097 "src/core/NEON/kernels/convolution/winograd/weight_transforms/arm_fp32_2x2_3x3.cpp",
1098 "src/core/NEON/kernels/convolution/winograd/weight_transforms/arm_fp32_2x2_5x5.cpp",
1099 "src/core/NEON/kernels/convolution/winograd/weight_transforms/arm_fp32_4x4_3x3.cpp",
1100 "src/core/NEON/kernels/convolution/winograd/weight_transforms/cpp_fp32_1x2_1x7.cpp",
1101 "src/core/NEON/kernels/convolution/winograd/weight_transforms/cpp_fp32_1x4_1x5.cpp",
1102 "src/core/NEON/kernels/convolution/winograd/weight_transforms/cpp_fp32_1x6_1x3.cpp",
alerah01c9e519d2022-01-31 19:04:10 +02001103 "src/cpu/kernels/directconv2d/nhwc/neon/impl.cpp",
1104 "src/cpu/kernels/directconv2d/nchw/all.cpp"
1105 ],
1106 "fp32": [
1107 "src/cpu/kernels/directconv2d/nhwc/neon/fp32.cpp"
Motti Gondabi9d9ad332022-01-23 12:42:24 +02001108 ]
ramelg0199c46472022-07-15 13:08:39 +01001109 },
1110 "sve": {
Viet-Hoa Do03b29712022-06-01 11:47:14 +01001111 "common": [
1112 "src/core/NEON/kernels/convolution/winograd/input_transforms/sve_fp32_6x6.cpp",
1113 "src/core/NEON/kernels/convolution/winograd/input_transforms/sme_fp32_mla_6x6.cpp",
1114 "src/core/NEON/kernels/convolution/winograd/output_transforms/sme_fp32_mopa_4x4_3x3.cpp"
1115 ]
Motti Gondabi9d9ad332022-01-23 12:42:24 +02001116 }
Michalis Spyroub55f8e82021-07-22 11:23:11 +01001117 }
1118 },
Michalis Spyrou20fca522021-06-07 14:23:57 +01001119 "Copy": {
1120 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001121 "common": [
1122 "src/cpu/operators/CpuCopy.cpp",
1123 "src/cpu/kernels/CpuCopyKernel.cpp",
1124 "src/runtime/NEON/functions/NECopy.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001125 ]
1126 }
1127 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001128 "CropResize": {
1129 "deps": [ "Scale" ],
Michalis Spyrou20fca522021-06-07 14:23:57 +01001130 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001131 "common": [
1132 "src/core/NEON/kernels/NECropKernel.cpp",
1133 "src/runtime/NEON/functions/NECropResize.cpp"
alerah0127619932021-11-24 17:21:43 +02001134 ],
1135 "neon": {
1136 "common": [ "src/cpu/kernels/crop/generic/neon/impl.cpp" ],
1137 "fp32": [ "src/cpu/kernels/crop/generic/neon/fp32.cpp" ],
1138 "fp16": [ "src/cpu/kernels/crop/generic/neon/fp16.cpp" ],
1139 "integer": [ "src/cpu/kernels/crop/generic/neon/integer.cpp" ]
Motti Gondabi9d9ad332022-01-23 12:42:24 +02001140 }
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001141 }
1142 },
1143 "Deconv2d": {
1144 "deps": [ "Conv2d", "Reverse", "Transpose"],
1145 "files": {
1146 "common": [
1147 "src/runtime/NEON/functions/NEDeconvolutionLayer.cpp"
1148 ]
1149 }
1150 },
1151 "DepthConvert": {
1152 "deps": [ "Cast"],
1153 "files": {
1154 "common": [
1155 "src/runtime/NEON/functions/NEDepthConvertLayer.cpp"
1156 ]
1157 }
1158 },
1159 "DepthToSpace": {
1160 "files": {
1161 "common": [
1162 "src/core/NEON/kernels/NEDepthToSpaceLayerKernel.cpp",
1163 "src/runtime/NEON/functions/NEDepthToSpaceLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001164 ]
1165 }
1166 },
1167 "DepthwiseConv2d": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001168 "deps": [ "Activation", "Permute" ],
Michalis Spyrou20fca522021-06-07 14:23:57 +01001169 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001170 "common": [
Georgios Pinitas7891a732021-08-20 21:39:25 +01001171 "src/cpu/operators/CpuDepthwiseConv2d.cpp",
1172 "src/cpu/operators/CpuDepthwiseConv2dAssemblyDispatch.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001173 "src/cpu/kernels/CpuDepthwiseConv2dNativeKernel.cpp",
1174 "src/cpu/kernels/internal/CpuDepthwiseConv2dAssemblyWrapperKernel.cpp",
Motti Gondabi9d9ad332022-01-23 12:42:24 +02001175 "src/runtime/NEON/functions/NEDepthwiseConvolutionLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001176 ],
Motti Gondabi9d9ad332022-01-23 12:42:24 +02001177 "neon": {
1178 "common": [
1179 "src/core/NEON/kernels/convolution/common/padding.cpp",
1180 "src/core/NEON/kernels/convolution/common/qasymm8.cpp",
1181 "src/core/NEON/kernels/convolution/common/qsymm8.cpp",
1182 "src/core/NEON/kernels/convolution/common/utils.cpp",
ramelg01c827e992022-04-08 03:52:28 +01001183 "src/core/NEON/kernels/arm_conv/addressing.cpp",
ramelg018a164882022-04-07 02:42:52 +01001184 "src/core/NEON/kernels/arm_conv/depthwise/depthwise_strategies_common.cpp",
Motti Gondabi9d9ad332022-01-23 12:42:24 +02001185 "src/core/NEON/kernels/arm_conv/depthwise/depthwise_u8q.cpp",
1186 "src/core/NEON/kernels/arm_conv/depthwise/depthwise_u8s8u8q.cpp",
1187 "src/core/NEON/kernels/arm_conv/depthwise/interleaves/8b_mla.cpp",
1188 "src/core/NEON/kernels/arm_conv/depthwise/depthwise_s8q.cpp",
1189 "src/core/NEON/kernels/arm_conv/depthwise/depthwise_fp32.cpp",
1190 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_packed_to_nhwc_generic_with_multiplier_output2x8_mla_depthfirst/generic.cpp",
1191 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_packed_to_nhwc_3x3_s2_with_multiplier_output3x3_mla_depthfirst/generic.cpp",
1192 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_packed_to_nhwc_5x5_s1_with_multiplier_output2x4_mla_depthfirst/generic.cpp",
1193 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_packed_to_nhwc_generic_with_multiplier_output2x8_mla_depthfirst/generic.cpp",
1194 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_s8q_packed_to_nhwc_3x3_s2_with_multiplier_output2x4_dot_depthfirst/generic.cpp",
1195 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_s8q_packed_to_nhwc_5x5_s1_with_multiplier_output4x2_dot_depthfirst/generic.cpp",
1196 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_s8q_packed_to_nhwc_generic_with_multiplier_output2x8_mla_depthfirst/generic.cpp",
1197 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8q_packed_to_nhwc_3x3_s2_with_multiplier_output2x4_dot_depthfirst/generic.cpp",
1198 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8q_packed_to_nhwc_5x5_s1_with_multiplier_output4x2_dot_depthfirst/generic.cpp",
1199 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8q_packed_to_nhwc_generic_with_multiplier_output2x8_mla_depthfirst/generic.cpp",
1200 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8s8u8q_packed_to_nhwc_generic_with_multiplier_output2x8_mla_depthfirst/generic.cpp",
ramelg018a164882022-04-07 02:42:52 +01001201 "src/core/NEON/kernels/arm_conv/depthwise/depthwise_fp16.cpp",
Motti Gondabi9d9ad332022-01-23 12:42:24 +02001202 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_nhwc_3x3_s1_output2x2_mla_depthfirst/generic_direct.cpp",
1203 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_nhwc_3x3_s1_output2x2_mla_depthfirst/generic_indirect.cpp",
1204 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_nhwc_3x3_s1_output3x3_mla_depthfirst/generic_direct.cpp",
1205 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_nhwc_3x3_s1_output3x3_mla_depthfirst/generic_indirect.cpp",
1206 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_nhwc_3x3_s1_output4x4_mla_depthfirst/generic_direct.cpp",
1207 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_nhwc_3x3_s1_output4x4_mla_depthfirst/generic_indirect.cpp",
1208 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_nhwc_3x3_s2_output2x2_mla_depthfirst/generic_direct.cpp",
1209 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_nhwc_3x3_s2_output2x2_mla_depthfirst/generic_indirect.cpp",
1210 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_nhwc_5x5_s1_output2x2_mla_depthfirst/generic_direct.cpp",
1211 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_nhwc_5x5_s1_output2x2_mla_depthfirst/generic_indirect.cpp",
1212 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_nhwc_generic_output9_mla_depthfirst/generic.cpp",
1213 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_nhwc_3x3_s1_output2x2_mla_depthfirst/generic_direct.cpp",
1214 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_nhwc_3x3_s1_output2x2_mla_depthfirst/generic_indirect.cpp",
1215 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_nhwc_3x3_s1_output3x3_mla_depthfirst/generic_direct.cpp",
1216 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_nhwc_3x3_s1_output3x3_mla_depthfirst/generic_indirect.cpp",
1217 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_nhwc_3x3_s1_output4x4_mla_depthfirst/generic_direct.cpp",
1218 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_nhwc_3x3_s1_output4x4_mla_depthfirst/generic_indirect.cpp",
1219 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_nhwc_3x3_s2_output2x2_mla_depthfirst/generic_direct.cpp",
1220 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_nhwc_3x3_s2_output2x2_mla_depthfirst/generic_indirect.cpp",
1221 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_nhwc_5x5_s1_output2x2_mla_depthfirst/generic_direct.cpp",
1222 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_nhwc_5x5_s1_output2x2_mla_depthfirst/generic_indirect.cpp",
1223 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_nhwc_generic_output9_mla_depthfirst/generic.cpp",
1224 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_s8q_nhwc_3x3_s1_output2x2_dot_depthfirst/generic.cpp",
1225 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_s8q_nhwc_3x3_s1_output2x2_mla_depthfirst/generic.cpp",
1226 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_s8q_nhwc_3x3_s2_output2x2_mla_depthfirst/generic.cpp",
1227 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_s8q_nhwc_5x5_s1_output2x2_mla_depthfirst/generic.cpp",
1228 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_s8q_nhwc_generic_output9_mla_depthfirst/generic.cpp",
1229 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_s8qs_nhwc_3x3_s1_output2x2_dot_depthfirst/generic.cpp",
1230 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8q_nhwc_3x3_s1_output2x2_dot_depthfirst/generic.cpp",
1231 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8q_nhwc_3x3_s1_output2x2_mla_depthfirst/generic.cpp",
1232 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8q_nhwc_3x3_s2_output2x2_mla_depthfirst/generic.cpp",
1233 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8q_nhwc_5x5_s1_output2x2_mla_depthfirst/generic.cpp",
1234 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8q_nhwc_generic_output9_mla_depthfirst/generic.cpp",
1235 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8s8u8q_nhwc_3x3_s1_output2x2_mla_depthfirst/generic.cpp",
1236 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8s8u8q_nhwc_3x3_s2_output2x2_mla_depthfirst/generic.cpp",
1237 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8s8u8q_nhwc_5x5_s1_output2x2_mla_depthfirst/generic.cpp",
1238 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8s8u8q_nhwc_generic_output9_mla_depthfirst/generic.cpp",
ramelg018a164882022-04-07 02:42:52 +01001239 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8qa_nhwc_3x3_s1_output2x2_mla_depthfirst/generic.cpp",
1240 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8qa_nhwc_3x3_s2_output2x2_mla_depthfirst/generic.cpp",
1241 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8qa_nhwc_5x5_s1_output2x2_mla_depthfirst/generic.cpp",
Motti Gondabi9d9ad332022-01-23 12:42:24 +02001242 "src/core/NEON/kernels/arm_conv/depthwise/interleaves/a64_s8q_3x3_dot.cpp",
ramelg01c827e992022-04-08 03:52:28 +01001243 "src/core/NEON/kernels/arm_conv/depthwise/interleaves/a64_u8q_3x3_dot.cpp",
ramelg018a164882022-04-07 02:42:52 +01001244 "src/core/NEON/kernels/arm_conv/depthwise/interleaves/generic.cpp",
1245 "src/core/NEON/kernels/arm_conv/depthwise/interleaves/generic_quantized_dot_product.cpp",
Dana Zlotnikebbae942022-02-03 12:52:15 +02001246 "src/cpu/kernels/depthwiseconv2d/generic/neon/impl.cpp"
ramelg01a1f78512022-06-29 16:28:10 +01001247 ],
Dana Zlotnikebbae942022-02-03 12:52:15 +02001248 "fp16":["src/cpu/kernels/depthwiseconv2d/generic/neon/fp16.cpp"],
ramelg01a1f78512022-06-29 16:28:10 +01001249 "fp32":["src/cpu/kernels/depthwiseconv2d/generic/neon/fp32.cpp"],
1250 "qasymm8":["src/cpu/kernels/depthwiseconv2d/generic/neon/qasymm8.cpp"],
Dana Zlotnikebbae942022-02-03 12:52:15 +02001251 "qasymm8_signed":["src/cpu/kernels/depthwiseconv2d/generic/neon/qasymm8_signed.cpp"]
Motti Gondabi9d9ad332022-01-23 12:42:24 +02001252 },
Michalis Spyrou20fca522021-06-07 14:23:57 +01001253 "sve": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001254 "common": [
Freddie Liardetd216f572021-08-03 15:57:32 +01001255 "src/core/NEON/kernels/arm_conv/depthwise/interleaves/sve_8b_mla.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +01001256 "src/core/NEON/kernels/arm_conv/depthwise/interleaves/sve_s8q_3x3_dot.cpp",
1257 "src/core/NEON/kernels/arm_conv/depthwise/interleaves/sve_u8q_3x3_dot.cpp",
1258 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp16_nhwc_3x3_s1_output2x2_mla_depthfirst/generic_direct.cpp",
1259 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp16_nhwc_3x3_s1_output2x2_mla_depthfirst/generic_indirect.cpp",
1260 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp16_nhwc_3x3_s1_output3x3_mla_depthfirst/generic_direct.cpp",
1261 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp16_nhwc_3x3_s1_output3x3_mla_depthfirst/generic_indirect.cpp",
1262 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp16_nhwc_3x3_s1_output4x4_mla_depthfirst/generic_direct.cpp",
1263 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp16_nhwc_3x3_s1_output4x4_mla_depthfirst/generic_indirect.cpp",
1264 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp16_nhwc_3x3_s2_output2x2_mla_depthfirst/generic_direct.cpp",
1265 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp16_nhwc_3x3_s2_output2x2_mla_depthfirst/generic_indirect.cpp",
1266 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp16_nhwc_5x5_s1_output2x2_mla_depthfirst/generic_direct.cpp",
1267 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp16_nhwc_5x5_s1_output2x2_mla_depthfirst/generic_indirect.cpp",
1268 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_nhwc_3x3_s1_output2x2_mla_depthfirst/generic.cpp",
1269 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_nhwc_3x3_s1_output2x2_mla_depthfirst/generic_direct.cpp",
1270 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_nhwc_3x3_s1_output2x2_mla_depthfirst/generic_indirect.cpp",
1271 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_nhwc_3x3_s1_output2x2_mla_depthfirst_strided/generic.cpp",
1272 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_nhwc_3x3_s1_output3x3_mla_depthfirst/generic_direct.cpp",
1273 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_nhwc_3x3_s1_output3x3_mla_depthfirst/generic_indirect.cpp",
1274 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_nhwc_3x3_s1_output4x4_mla_depthfirst/generic_direct.cpp",
1275 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_nhwc_3x3_s1_output4x4_mla_depthfirst/generic_indirect.cpp",
1276 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_nhwc_3x3_s2_output2x2_mla_depthfirst/generic_direct.cpp",
1277 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_nhwc_3x3_s2_output2x2_mla_depthfirst/generic_indirect.cpp",
1278 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_nhwc_5x5_s1_output2x2_mla_depthfirst/generic_direct.cpp",
1279 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_nhwc_5x5_s1_output2x2_mla_depthfirst/generic_indirect.cpp",
1280 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_nhwc_generic_output9_mla_depthfirst/generic.cpp",
1281 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_packed_to_nhwc_3x3_s2_with_multiplier_output3x3_mla_depthfirst/generic.cpp",
1282 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_packed_to_nhwc_5x5_s1_with_multiplier_output2x4_mla_depthfirst/generic.cpp",
1283 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_packed_to_nhwc_generic_with_multiplier_output2x8_mla_depthfirst/generic.cpp",
1284 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_s8q_nhwc_3x3_s1_output2x2_dot_depthfirst/generic.cpp",
1285 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_s8q_nhwc_3x3_s1_output2x2_mla_depthfirst/generic.cpp",
1286 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_s8q_nhwc_3x3_s2_output2x2_mla_depthfirst/generic.cpp",
1287 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_s8q_nhwc_5x5_s1_output2x2_mla_depthfirst/generic.cpp",
1288 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_s8q_packed_to_nhwc_3x3_s2_with_multiplier_output2x4_dot_depthfirst/generic.cpp",
1289 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_s8q_packed_to_nhwc_5x5_s1_with_multiplier_output4x2_dot_depthfirst/generic.cpp",
1290 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_s8qs_nhwc_3x3_s1_output2x2_dot_depthfirst/generic.cpp",
1291 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_u8q_nhwc_3x3_s1_output2x2_dot_depthfirst/generic.cpp",
1292 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_u8q_nhwc_3x3_s1_output2x2_mla_depthfirst/generic.cpp",
1293 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_u8q_nhwc_3x3_s2_output2x2_mla_depthfirst/generic.cpp",
1294 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_u8q_nhwc_5x5_s1_output2x2_mla_depthfirst/generic.cpp",
1295 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_u8q_packed_to_nhwc_3x3_s2_with_multiplier_output2x4_dot_depthfirst/generic.cpp",
1296 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_u8q_packed_to_nhwc_5x5_s1_with_multiplier_output4x2_dot_depthfirst/generic.cpp",
1297 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_u8s8u8q_nhwc_3x3_s1_output2x2_mla_depthfirst/generic.cpp",
1298 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_u8s8u8q_nhwc_3x3_s2_output2x2_mla_depthfirst/generic.cpp",
Viet-Hoa Do03b29712022-06-01 11:47:14 +01001299 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_u8s8u8q_nhwc_5x5_s1_output2x2_mla_depthfirst/generic.cpp",
1300 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32_nhwc_3x3_s1_output2x2_mla_depthfirst/generic_direct.cpp",
1301 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32_nhwc_3x3_s1_output2x2_mla_depthfirst/generic_indirect.cpp",
1302 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32_nhwc_3x3_s1_output3x3_mla_depthfirst/generic_direct.cpp",
1303 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32_nhwc_3x3_s1_output3x3_mla_depthfirst/generic_indirect.cpp",
1304 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32_nhwc_3x3_s1_output4x4_mla_depthfirst/generic_direct.cpp",
1305 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32_nhwc_3x3_s1_output4x4_mla_depthfirst/generic_indirect.cpp",
1306 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32_nhwc_3x3_s2_output2x2_mla_depthfirst/generic_direct.cpp",
1307 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32_nhwc_3x3_s2_output2x2_mla_depthfirst/generic_indirect.cpp",
1308 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32_planar_3x3_s1_4rows_mla_za/generic.cpp",
1309 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32_planar_3x3_s2_4rows_mla_za/generic.cpp",
1310 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32_planar_5x5_s1_4rows_mla_za/generic.cpp",
1311 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32_planar_5x5_s2_4rows_mla_za/generic.cpp",
1312 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32bf16fp32_planar_3x3_s1_4rows_dot_za/generic.cpp",
1313 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32bf16fp32_planar_3x3_s2_4rows_dot_za/generic.cpp",
1314 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32bf16fp32_planar_5x5_s1_4rows_dot_za/generic.cpp",
1315 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32bf16fp32_planar_5x5_s2_4rows_dot_za/generic.cpp",
1316 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_s8q_planar_3x3_s1_4rows_dot_za/generic.cpp",
1317 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_s8q_planar_3x3_s2_2rows_dot_za/generic.cpp",
1318 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_s8q_planar_3x3_s2_4rows_dot_za/generic.cpp",
1319 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_s8q_planar_5x5_s1_4rows_dot_za/generic.cpp",
1320 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_s8q_planar_5x5_s2_4rows_dot_za/generic.cpp",
1321 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_u8q_planar_3x3_s1_4rows_dot_za/generic.cpp",
1322 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_u8q_planar_3x3_s2_2rows_dot_za/generic.cpp",
1323 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_u8q_planar_3x3_s2_4rows_dot_za/generic.cpp",
1324 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_u8q_planar_5x5_s1_4rows_dot_za/generic.cpp",
1325 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_u8q_planar_5x5_s2_4rows_dot_za/generic.cpp",
1326 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_u8s8u8q_planar_3x3_s1_4rows_dot_za/generic.cpp",
1327 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_u8s8u8q_planar_3x3_s2_2rows_dot_za/generic.cpp",
1328 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_u8s8u8q_planar_3x3_s2_4rows_dot_za/generic.cpp",
1329 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_u8s8u8q_planar_5x5_s1_4rows_dot_za/generic.cpp",
1330 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_u8s8u8q_planar_5x5_s2_4rows_dot_za/generic.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001331 ]
1332 }
1333 }
1334 },
Michalis Spyrou20fca522021-06-07 14:23:57 +01001335 "Dequantize": {
1336 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001337 "common": [
1338 "src/cpu/operators/CpuDequantize.cpp",
1339 "src/cpu/kernels/CpuDequantizeKernel.cpp",
1340 "src/runtime/NEON/functions/NEDequantizationLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001341 ]
1342 }
1343 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001344 "DetectionPostProcess": {
1345 "deps": [ "Dequantize" ],
Michalis Spyrou20fca522021-06-07 14:23:57 +01001346 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001347 "common" : [ "src/runtime/NEON/functions/NEDetectionPostProcessLayer.cpp" ]
Michalis Spyrou20fca522021-06-07 14:23:57 +01001348 }
1349 },
Sheri Zhang6d9c9822021-09-24 16:02:57 +01001350 "Conv3d": {
1351 "deps": [
1352 "Activation"
1353 ],
1354 "files": {
1355 "common": [
1356 "src/cpu/operators/CpuDirectConv3d.cpp",
1357 "src/cpu/kernels/CpuDirectConv3dKernel.cpp",
1358 "src/runtime/NEON/functions/NEConv3D.cpp"
1359 ]
1360 }
1361 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001362 "ElementwiseBinary": {
Michalis Spyrou20fca522021-06-07 14:23:57 +01001363 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001364 "common": [
1365 "src/cpu/operators/CpuElementwise.cpp",
1366 "src/cpu/kernels/CpuElementwiseKernel.cpp",
Dana Zlotnik6a2df882022-01-17 09:54:26 +02001367 "src/runtime/NEON/functions/NEElementwiseOperations.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001368 ],
Dana Zlotnikd5c496d2021-11-28 14:46:12 +02001369 "neon":{
1370 "fp32": ["src/cpu/kernels/elementwise_binary/generic/neon/fp32.cpp"],
1371 "fp16": ["src/cpu/kernels/elementwise_binary/generic/neon/fp16.cpp"],
Dana Zlotnik6a2df882022-01-17 09:54:26 +02001372 "integer": ["src/cpu/kernels/elementwise_binary/generic/neon/integer.cpp"],
1373 "qasymm8": ["src/cpu/kernels/elementwise_binary/generic/neon/qasymm8.cpp"],
1374 "qasymm8_signed": ["src/cpu/kernels/elementwise_binary/generic/neon/qasymm8_signed.cpp"]
Dana Zlotnikd5c496d2021-11-28 14:46:12 +02001375 },
Michalis Spyrou20fca522021-06-07 14:23:57 +01001376 "sve": {
Dana Zlotnikd5c496d2021-11-28 14:46:12 +02001377 "common": ["src/cpu/kernels/elementwise_binary/generic/sve/impl.cpp" ],
1378 "integer": ["src/cpu/kernels/elementwise_binary/generic/sve/integer.cpp"],
1379 "fp32": ["src/cpu/kernels/elementwise_binary/generic/sve/fp32.cpp"],
Dana Zlotnik6a2df882022-01-17 09:54:26 +02001380 "fp16": ["src/cpu/kernels/elementwise_binary/generic/sve/fp16.cpp"]
1381
ramelg01a1f78512022-06-29 16:28:10 +01001382 },
Dana Zlotnik6a2df882022-01-17 09:54:26 +02001383 "sve2":{
Dana Zlotnikd5c496d2021-11-28 14:46:12 +02001384 "qasymm8": ["src/cpu/kernels/elementwise_binary/generic/sve2/qasymm8.cpp"],
1385 "qasymm8_signed": ["src/cpu/kernels/elementwise_binary/generic/sve2/qasymm8_signed.cpp"]
Michalis Spyrou20fca522021-06-07 14:23:57 +01001386 }
1387 }
1388 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001389 "ElementwiseUnary":{
Michalis Spyrou20fca522021-06-07 14:23:57 +01001390 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001391 "common": [
1392 "src/cpu/operators/CpuElementwiseUnary.cpp",
1393 "src/cpu/kernels/CpuElementwiseUnaryKernel.cpp",
1394 "src/runtime/NEON/functions/NEElementwiseUnaryLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001395 ],
Dana Zlotnikd5c496d2021-11-28 14:46:12 +02001396 "neon": {
Dana Zlotnika538ae52022-02-21 13:12:41 +02001397 "common":["src/cpu/kernels/elementwise_unary/generic/neon/impl.cpp"],
Dana Zlotnikd5c496d2021-11-28 14:46:12 +02001398 "integer": ["src/cpu/kernels/elementwise_unary/generic/neon/integer.cpp"],
1399 "fp32": ["src/cpu/kernels/elementwise_unary/generic/neon/fp32.cpp"],
1400 "fp16": ["src/cpu/kernels/elementwise_unary/generic/neon/fp16.cpp"]
1401 },
Michalis Spyrou20fca522021-06-07 14:23:57 +01001402 "sve": {
Dana Zlotnikd5c496d2021-11-28 14:46:12 +02001403 "common": ["src/cpu/kernels/elementwise_unary/generic/sve/impl.cpp" ],
1404 "integer": ["src/cpu/kernels/elementwise_unary/generic/sve/integer.cpp"],
1405 "fp32": ["src/cpu/kernels/elementwise_unary/generic/sve/fp32.cpp"],
1406 "fp16": ["src/cpu/kernels/elementwise_unary/generic/sve/fp16.cpp"]
Michalis Spyrou20fca522021-06-07 14:23:57 +01001407 }
1408 }
1409 },
1410 "FFT1D": {
Freddie Liardet487d3902021-09-21 12:36:43 +01001411 "deps": [ "Reduction" ],
Michalis Spyrou20fca522021-06-07 14:23:57 +01001412 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001413 "common": [
Michalis Spyrou20fca522021-06-07 14:23:57 +01001414 "src/core/NEON/kernels/NEFFTDigitReverseKernel.cpp",
1415 "src/core/NEON/kernels/NEFFTRadixStageKernel.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001416 "src/core/NEON/kernels/NEFFTScaleKernel.cpp",
1417 "src/runtime/NEON/functions/NEFFT1D.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001418 ]
1419 }
1420 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001421 "FFT2D": {
1422 "deps": [ "FFT1D" ],
Michalis Spyrou20fca522021-06-07 14:23:57 +01001423 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001424 "common": [
1425 "src/runtime/NEON/functions/NEFFT2D.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001426 ]
1427 }
1428 },
1429 "Fill": {
1430 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001431 "common": [
1432 "src/cpu/operators/CpuFill.cpp",
1433 "src/cpu/kernels/CpuFillKernel.cpp",
1434 "src/runtime/NEON/functions/NEFill.cpp"
1435 ]
1436 }
1437 },
1438 "Flatten": {
1439 "deps": [ "Reshape" ],
1440 "files": {
1441 "common": [
1442 "src/cpu/operators/CpuFlatten.cpp",
1443 "src/runtime/NEON/functions/NEFlattenLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001444 ]
1445 }
1446 },
1447 "Floor": {
1448 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001449 "common": [
1450 "src/cpu/operators/CpuFloor.cpp",
1451 "src/cpu/kernels/CpuFloorKernel.cpp",
1452 "src/runtime/NEON/functions/NEFloor.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001453 ],
1454 "neon": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001455 "fp32": [ "src/cpu/kernels/floor/neon/fp32.cpp" ],
1456 "fp16": [ "src/cpu/kernels/floor/neon/fp16.cpp" ]
Michalis Spyrou20fca522021-06-07 14:23:57 +01001457 }
1458 }
1459 },
Michele Di Giorgiod9cdf142021-07-02 15:17:08 +01001460 "FullyConnected": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001461 "deps": [ "Flatten", "Gemm", "Transpose"],
Michele Di Giorgiod9cdf142021-07-02 15:17:08 +01001462 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001463 "common": [
1464 "src/cpu/kernels/CpuConvertFullyConnectedWeightsKernel.cpp",
1465 "src/cpu/operators/CpuConvertFullyConnectedWeights.cpp",
1466 "src/cpu/operators/CpuFullyConnected.cpp",
1467 "src/runtime/NEON/functions/NEConvertFullyConnectedWeights.cpp",
1468 "src/runtime/NEON/functions/NEFullyConnectedLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001469 ]
1470 }
1471 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001472 "Gather": {
Michalis Spyrou20fca522021-06-07 14:23:57 +01001473 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001474 "common": [
1475 "src/core/NEON/kernels/NEGatherKernel.cpp",
1476 "src/runtime/NEON/functions/NEGather.cpp"
1477 ]
1478 }
1479 },
1480 "Gemm": {
Freddie Liardet487d3902021-09-21 12:36:43 +01001481 "deps": [ "Quantize", "Add"],
Francesco.Petrogalli@arm.com5fcf22d2022-04-05 10:31:08 +00001482 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001483 "common": [
1484 "src/cpu/kernels/CpuConvertQuantizedSignednessKernel.cpp",
Georgios Pinitas7891a732021-08-20 21:39:25 +01001485 "src/cpu/kernels/CpuGemmMatrixAdditionKernel.cpp",
1486 "src/cpu/kernels/CpuGemmMatrixMultiplyKernel.cpp",
1487 "src/cpu/kernels/CpuGemmTranspose1xWKernel.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001488 "src/cpu/kernels/CpuGemmInterleave4x4Kernel.cpp",
Georgios Pinitas7891a732021-08-20 21:39:25 +01001489 "src/cpu/kernels/CpuGemmLowpQuantizeDownInt32ScaleKernel.cpp",
1490 "src/cpu/kernels/CpuGemmLowpQuantizeDownInt32ToInt16ScaleByFixedPointKernel.cpp",
1491 "src/cpu/kernels/CpuGemmLowpQuantizeDownInt32ToInt8ScaleByFixedPointKernel.cpp",
1492 "src/cpu/kernels/CpuGemmLowpQuantizeDownInt32ToUint8ScaleByFixedPointKernel.cpp",
1493 "src/cpu/kernels/CpuGemmLowpMatrixMultiplyKernel.cpp",
1494 "src/cpu/kernels/CpuGemmLowpMatrixReductionKernel.cpp",
1495 "src/cpu/kernels/CpuGemmLowpOffsetContributionOutputStageKernel.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001496 "src/cpu/kernels/CpuGemmLowpOffsetContributionKernel.cpp",
1497 "src/cpu/operators/CpuGemm.cpp",
1498 "src/cpu/operators/CpuGemmLowpOutputStage.cpp",
1499 "src/cpu/operators/CpuGemmLowpMatrixMultiplyCore.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001500 "src/runtime/NEON/functions/NEGEMM.cpp",
1501 "src/runtime/NEON/functions/NEGEMMLowpMatrixMultiplyCore.cpp",
Motti Gondabi9d9ad332022-01-23 12:42:24 +02001502 "src/runtime/NEON/functions/NEGEMMLowpOutputStage.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001503 ],
1504 "neon": {
Motti Gondabi9d9ad332022-01-23 12:42:24 +02001505 "common": [
1506 "src/core/NEON/kernels/arm_gemm/gemm_bf16.cpp",
1507 "src/core/NEON/kernels/arm_gemm/gemm_fp16.cpp",
1508 "src/core/NEON/kernels/arm_gemm/gemm_fp32.cpp",
1509 "src/core/NEON/kernels/arm_gemm/gemm_int16.cpp",
1510 "src/core/NEON/kernels/arm_gemm/gemm_int8.cpp",
1511 "src/core/NEON/kernels/arm_gemm/gemm_qint8.cpp",
1512 "src/core/NEON/kernels/arm_gemm/gemm_quint8.cpp",
1513 "src/core/NEON/kernels/arm_gemm/gemm_uint16.cpp",
1514 "src/core/NEON/kernels/arm_gemm/gemm_uint8.cpp",
1515 "src/core/NEON/kernels/arm_gemm/interleave_indirect.cpp",
1516 "src/core/NEON/kernels/arm_gemm/mergeresults-fp16.cpp",
1517 "src/core/NEON/kernels/arm_gemm/mergeresults.cpp",
1518 "src/core/NEON/kernels/arm_gemm/misc.cpp",
1519 "src/core/NEON/kernels/arm_gemm/quantized.cpp",
1520 "src/core/NEON/kernels/arm_gemm/rowsum_indirect_s8.cpp",
1521 "src/core/NEON/kernels/arm_gemm/rowsum_indirect_u8.cpp",
1522 "src/core/NEON/kernels/arm_gemm/transform.cpp",
1523 "src/core/NEON/kernels/arm_gemm/kernels/a64_gemm_s16_8x12/generic.cpp",
1524 "src/core/NEON/kernels/arm_gemm/kernels/a64_gemm_s8_4x4/generic.cpp",
1525 "src/core/NEON/kernels/arm_gemm/kernels/a64_gemm_s8_8x12/a55r1.cpp",
1526 "src/core/NEON/kernels/arm_gemm/kernels/a64_gemm_s8_8x12/generic.cpp",
1527 "src/core/NEON/kernels/arm_gemm/kernels/a64_gemm_s8_8x12/x1.cpp",
1528 "src/core/NEON/kernels/arm_gemm/kernels/a64_gemm_u16_8x12/generic.cpp",
1529 "src/core/NEON/kernels/arm_gemm/kernels/a64_gemm_u8_4x4/generic.cpp",
1530 "src/core/NEON/kernels/arm_gemm/kernels/a64_gemm_u8_8x12/a55r1.cpp",
1531 "src/core/NEON/kernels/arm_gemm/kernels/a64_gemm_u8_8x12/generic.cpp",
1532 "src/core/NEON/kernels/arm_gemm/kernels/a64_gemm_u8_8x12/x1.cpp",
1533 "src/core/NEON/kernels/arm_gemm/kernels/a64_hgemm_8x24/a55r1.cpp",
1534 "src/core/NEON/kernels/arm_gemm/kernels/a64_hgemm_8x24/generic.cpp",
1535 "src/core/NEON/kernels/arm_gemm/kernels/a64_hgemm_8x24/x1.cpp",
1536 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_bf16fp32_dot_6x16/generic.cpp",
1537 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_bf16fp32_mmla_6x16/generic.cpp",
1538 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_fp16_mla_6x32/a55.cpp",
1539 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_fp16_mla_6x32/generic.cpp",
1540 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_fp32_mla_4x24/a55.cpp",
1541 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_fp32_mla_4x24/generic.cpp",
1542 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_fp32_mla_6x16/a55.cpp",
1543 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_fp32_mla_6x16/generic.cpp",
1544 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_fp32_mla_8x4/a55.cpp",
1545 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_fp32_mla_8x4/generic.cpp",
1546 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_fp32bf16fp32_mmla_4x24/generic.cpp",
1547 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_fp32bf16fp32_mmla_6x16/generic.cpp",
1548 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_s8qa_dot_4x16/a55.cpp",
1549 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_s8qa_dot_4x16/generic.cpp",
1550 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_s8qa_mmla_4x16/generic.cpp",
1551 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_s8qs_dot_6x16/a55.cpp",
1552 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_s8qs_dot_6x16/generic.cpp",
1553 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_s8qs_mmla_6x16/generic.cpp",
1554 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_s8s32_dot_6x16/a55.cpp",
1555 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_s8s32_dot_6x16/generic.cpp",
1556 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_s8s32_mmla_6x16/generic.cpp",
1557 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_u8qa_dot_4x16/a55.cpp",
1558 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_u8qa_dot_4x16/generic.cpp",
1559 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_u8qa_mmla_4x16/generic.cpp",
1560 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_u8u32_dot_6x16/a55.cpp",
1561 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_u8u32_dot_6x16/generic.cpp",
1562 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_u8u32_mmla_6x16/generic.cpp",
1563 "src/core/NEON/kernels/arm_gemm/kernels/a64_interleaved_bf16fp32_dot_8x12/generic.cpp",
1564 "src/core/NEON/kernels/arm_gemm/kernels/a64_interleaved_bf16fp32_dot_8x12/x1.cpp",
1565 "src/core/NEON/kernels/arm_gemm/kernels/a64_interleaved_bf16fp32_mmla_8x12/generic.cpp",
1566 "src/core/NEON/kernels/arm_gemm/kernels/a64_interleaved_bf16fp32_mmla_8x12/a510.cpp",
1567 "src/core/NEON/kernels/arm_gemm/kernels/a64_interleaved_s8s32_mmla_8x12/generic.cpp",
1568 "src/core/NEON/kernels/arm_gemm/kernels/a64_interleaved_s8s32_mmla_8x12/a510.cpp",
1569 "src/core/NEON/kernels/arm_gemm/kernels/a64_interleaved_u8u32_mmla_8x12/generic.cpp",
1570 "src/core/NEON/kernels/arm_gemm/kernels/a64_interleaved_u8u32_mmla_8x12/a510.cpp",
1571 "src/core/NEON/kernels/arm_gemm/kernels/a64_sgemm_8x12/a53.cpp",
1572 "src/core/NEON/kernels/arm_gemm/kernels/a64_sgemm_8x12/a55.cpp",
1573 "src/core/NEON/kernels/arm_gemm/kernels/a64_sgemm_8x12/a55r1.cpp",
1574 "src/core/NEON/kernels/arm_gemm/kernels/a64_sgemm_8x12/generic.cpp",
1575 "src/core/NEON/kernels/arm_gemm/kernels/a64_sgemm_8x12/x1.cpp",
1576 "src/core/NEON/kernels/arm_gemm/kernels/a64_sgemm_8x6/generic.cpp",
1577 "src/core/NEON/kernels/arm_gemm/kernels/a64_smallK_hybrid_fp32_mla_6x4/generic.cpp",
1578 "src/core/NEON/kernels/arm_gemm/kernels/a64_smallK_hybrid_fp32_mla_8x4/generic.cpp",
1579 "src/core/NEON/kernels/arm_gemm/kernels/a64_smallK_hybrid_s8s32_dot_6x4/a55.cpp",
1580 "src/core/NEON/kernels/arm_gemm/kernels/a64_smallK_hybrid_s8s32_dot_6x4/generic.cpp",
1581 "src/core/NEON/kernels/arm_gemm/kernels/a64_smallK_hybrid_s8s32_dot_8x4/a55.cpp",
1582 "src/core/NEON/kernels/arm_gemm/kernels/a64_smallK_hybrid_s8s32_dot_8x4/generic.cpp",
1583 "src/core/NEON/kernels/arm_gemm/kernels/a64_smallK_hybrid_u8u32_dot_6x4/a55.cpp",
1584 "src/core/NEON/kernels/arm_gemm/kernels/a64_smallK_hybrid_u8u32_dot_6x4/generic.cpp",
1585 "src/core/NEON/kernels/arm_gemm/kernels/a64_smallK_hybrid_u8u32_dot_8x4/a55.cpp",
ramelg01a1f78512022-06-29 16:28:10 +01001586 "src/core/NEON/kernels/arm_gemm/kernels/a64_smallK_hybrid_u8u32_dot_8x4/generic.cpp",
Dana Zlotnik256ac622022-02-02 15:06:11 +02001587 "src/cpu/kernels/gemm_matrix_mul/generic/neon/impl.cpp",
1588 "src/cpu/kernels/gemm_matrix_add/generic/neon/impl.cpp"
Motti Gondabi9d9ad332022-01-23 12:42:24 +02001589 ],
Dana Zlotnik256ac622022-02-02 15:06:11 +02001590 "fp32":["src/cpu/kernels/gemm_matrix_mul/generic/neon/fp32.cpp",
1591 "src/cpu/kernels/gemm_matrix_add/generic/neon/fp32.cpp"],
1592 "fp16":["src/cpu/kernels/gemm_matrix_mul/generic/neon/fp16.cpp",
1593 "src/cpu/kernels/gemm_matrix_add/generic/neon/fp16.cpp"],
Michalis Spyrou20fca522021-06-07 14:23:57 +01001594 "estate32": [
1595 "src/core/NEON/kernels/arm_gemm/kernels/a32_sgemm_8x6/a53.cpp",
1596 "src/core/NEON/kernels/arm_gemm/kernels/a32_sgemm_8x6/a55r1.cpp",
1597 "src/core/NEON/kernels/arm_gemm/kernels/a32_sgemm_8x6/generic.cpp"
1598 ],
1599 "estate64": [
Freddie Liardet487d3902021-09-21 12:36:43 +01001600 "src/core/NEON/kernels/arm_gemm/kernels/a64_sgemv_pretransposed/generic.cpp"
Francesco.Petrogalli@arm.com5fcf22d2022-04-05 10:31:08 +00001601 ],
1602 "experimental_fixed_format_kernels": [
1603 "src/core/NEON/kernels/arm_gemm/kernels/a64_ffhybrid_bf16fp32_mmla_6x16/generic.cpp",
1604 "src/core/NEON/kernels/arm_gemm/kernels/a64_ffhybrid_fp16_mla_6x32/generic.cpp",
1605 "src/core/NEON/kernels/arm_gemm/kernels/a64_ffhybrid_fp32_mla_6x16/generic.cpp",
1606 "src/core/NEON/kernels/arm_gemm/kernels/a64_ffhybrid_fp32bf16fp32_mmla_4x24/generic.cpp",
1607 "src/core/NEON/kernels/arm_gemm/kernels/a64_ffinterleaved_bf16fp32_dot_8x12/generic.cpp",
1608 "src/core/NEON/kernels/arm_gemm/kernels/a64_ffinterleaved_bf16fp32_mmla_8x12/generic.cpp",
1609 "src/core/NEON/kernels/arm_gemm/kernels/a64_ffinterleaved_fp16_mla_8x24/generic.cpp",
1610 "src/core/NEON/kernels/arm_gemm/kernels/a64_ffinterleaved_fp32_mla_8x12/generic.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001611 ]
1612 },
1613 "sve": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001614 "common": [
Viet-Hoa Do03b29712022-06-01 11:47:14 +01001615 "src/core/NEON/kernels/arm_gemm/interleave_indirect-sve.cpp",
1616 "src/core/NEON/kernels/arm_gemm/kernels/sme2_gemv_bf16fp32_dot_16VL/generic.cpp",
1617 "src/core/NEON/kernels/arm_gemm/kernels/sme2_gemv_fp32_mla_16VL/generic.cpp",
1618 "src/core/NEON/kernels/arm_gemm/kernels/sme2_gemv_fp32bf16fp32_dot_16VL/generic.cpp",
1619 "src/core/NEON/kernels/arm_gemm/kernels/sme2_gemv_s8qa_dot_16VL/generic.cpp",
1620 "src/core/NEON/kernels/arm_gemm/kernels/sme2_gemv_u8qa_dot_16VL/generic.cpp",
1621 "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_bf16fp32_mopa_1VLx4VL/generic.cpp",
1622 "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_bf16fp32_mopa_2VLx2VL/generic.cpp",
1623 "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_bf16fp32_mopa_4VLx1VL/generic.cpp",
1624 "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_fp32_mopa_1VLx4VL/generic.cpp",
1625 "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_fp32_mopa_2VLx2VL/generic.cpp",
1626 "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_fp32_mopa_4VLx1VL/generic.cpp",
1627 "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_s8q_mopa_1VLx4VL/generic.cpp",
1628 "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_s8q_mopa_2VLx2VL/generic.cpp",
1629 "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_s8q_mopa_4VLx1VL/generic.cpp",
1630 "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_s8s32_mopa_1VLx4VL/generic.cpp",
1631 "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_s8s32_mopa_2VLx2VL/generic.cpp",
1632 "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_s8s32_mopa_4VLx1VL/generic.cpp",
1633 "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_u8q_mopa_1VLx4VL/generic.cpp",
1634 "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_u8q_mopa_2VLx2VL/generic.cpp",
1635 "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_u8q_mopa_4VLx1VL/generic.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +01001636 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_bf16fp32_dot_6x4VL/generic.cpp",
Georgios Pinitas4ee8b152021-07-16 16:16:43 +01001637 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_bf16fp32_mmla_6x4VL/generic.cpp",
1638 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_fp16_mla_6x4VL/a64fx.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +01001639 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_fp16_mla_6x4VL/generic.cpp",
Georgios Pinitas4ee8b152021-07-16 16:16:43 +01001640 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_fp32_mla_6x4VL/a64fx.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +01001641 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_fp32_mla_6x4VL/generic.cpp",
Georgios Pinitas4ee8b152021-07-16 16:16:43 +01001642 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_fp32_mla_8x1VL/a64fx.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +01001643 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_fp32_mla_8x1VL/generic.cpp",
Georgios Pinitas4ee8b152021-07-16 16:16:43 +01001644 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_fp32bf16fp32_mmla_4x6VL/generic.cpp",
1645 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_fp32bf16fp32_mmla_6x4VL/generic.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +01001646 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_s8qa_dot_4x4VL/generic.cpp",
Georgios Pinitas4ee8b152021-07-16 16:16:43 +01001647 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_s8qa_mmla_4x4VL/generic.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +01001648 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_s8qs_dot_6x4VL/generic.cpp",
Georgios Pinitas4ee8b152021-07-16 16:16:43 +01001649 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_s8qs_mmla_6x4VL/generic.cpp",
1650 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_s8s32_dot_6x4VL/a64fx.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +01001651 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_s8s32_dot_6x4VL/generic.cpp",
Georgios Pinitas4ee8b152021-07-16 16:16:43 +01001652 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_s8s32_mmla_6x4VL/generic.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +01001653 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_u8qa_dot_4x4VL/generic.cpp",
Georgios Pinitas4ee8b152021-07-16 16:16:43 +01001654 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_u8qa_mmla_4x4VL/generic.cpp",
1655 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_u8u32_dot_6x4VL/a64fx.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +01001656 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_u8u32_dot_6x4VL/generic.cpp",
Georgios Pinitas4ee8b152021-07-16 16:16:43 +01001657 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_u8u32_mmla_6x4VL/generic.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +01001658 "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_bf16fp32_dot_8x3VL/generic.cpp",
1659 "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_bf16fp32_mmla_8x3VL/generic.cpp",
Georgios Pinitas4ee8b152021-07-16 16:16:43 +01001660 "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_fp16_mla_8x3VL/a64fx.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +01001661 "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_fp16_mla_8x3VL/generic.cpp",
Georgios Pinitas4ee8b152021-07-16 16:16:43 +01001662 "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_fp32_mla_8x3VL/a64fx.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +01001663 "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_fp32_mla_8x3VL/generic.cpp",
1664 "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_fp32_mmla_8x3VL/generic.cpp",
Georgios Pinitas4ee8b152021-07-16 16:16:43 +01001665 "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_s8s32_dot_8x3VL/a64fx.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +01001666 "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_s8s32_dot_8x3VL/generic.cpp",
1667 "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_s8s32_mmla_8x3VL/generic.cpp",
Georgios Pinitas4ee8b152021-07-16 16:16:43 +01001668 "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_u8u32_dot_8x3VL/a64fx.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +01001669 "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_u8u32_dot_8x3VL/generic.cpp",
1670 "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_u8u32_mmla_8x3VL/generic.cpp",
1671 "src/core/NEON/kernels/arm_gemm/kernels/sve_smallK_hybrid_fp32_mla_8x1VL/generic.cpp",
1672 "src/core/NEON/kernels/arm_gemm/kernels/sve_smallK_hybrid_s8s32_dot_8x1VL/generic.cpp",
Georgios Pinitas4ee8b152021-07-16 16:16:43 +01001673 "src/core/NEON/kernels/arm_gemm/kernels/sve_smallK_hybrid_u8u32_dot_8x1VL/generic.cpp",
1674 "src/core/NEON/kernels/arm_gemm/mergeresults-sve.cpp",
Viet-Hoa Do03b29712022-06-01 11:47:14 +01001675 "src/core/NEON/kernels/arm_gemm/transform-sve.cpp",
1676 "src/core/NEON/kernels/arm_gemm/misc-sve.cpp"
Francesco.Petrogalli@arm.com5fcf22d2022-04-05 10:31:08 +00001677 ],
1678 "experimental_fixed_format_kernels": [
1679 "src/core/NEON/kernels/arm_gemm/kernels/sve_ffhybrid_bf16fp32_mmla_6x4VL/generic.cpp",
1680 "src/core/NEON/kernels/arm_gemm/kernels/sve_ffhybrid_fp16_mla_6x4VL/a64fx.cpp",
1681 "src/core/NEON/kernels/arm_gemm/kernels/sve_ffhybrid_fp16_mla_6x4VL/generic.cpp",
1682 "src/core/NEON/kernels/arm_gemm/kernels/sve_ffhybrid_fp32_mla_6x4VL/a64fx.cpp",
1683 "src/core/NEON/kernels/arm_gemm/kernels/sve_ffhybrid_fp32_mla_6x4VL/generic.cpp",
1684 "src/core/NEON/kernels/arm_gemm/kernels/sve_ffhybrid_fp32bf16fp32_mmla_4x6VL/generic.cpp",
1685 "src/core/NEON/kernels/arm_gemm/kernels/sve_ffinterleaved_bf16fp32_mmla_8x3VL/generic.cpp",
1686 "src/core/NEON/kernels/arm_gemm/kernels/sve_ffinterleaved_fp16_mla_8x3VL/a64fx.cpp",
1687 "src/core/NEON/kernels/arm_gemm/kernels/sve_ffinterleaved_fp16_mla_8x3VL/generic.cpp",
1688 "src/core/NEON/kernels/arm_gemm/kernels/sve_ffinterleaved_fp32_mla_8x3VL/a64fx.cpp",
1689 "src/core/NEON/kernels/arm_gemm/kernels/sve_ffinterleaved_fp32_mla_8x3VL/generic.cpp"
1690 ]
Michalis Spyrou20fca522021-06-07 14:23:57 +01001691 }
1692 }
1693 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001694 "GenerateProposals": {
1695 "deps": [ "BoundingBoxTransform", "Dequantize", "Pad", "Permute", "Quantize", "Reshape" ],
Michalis Spyrou20fca522021-06-07 14:23:57 +01001696 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001697 "common": [
1698 "src/core/NEON/kernels/NEGenerateProposalsLayerKernel.cpp",
1699 "src/runtime/NEON/functions/NEGenerateProposalsLayer.cpp"
Dana Zlotnik50ce2772021-12-29 13:55:56 +02001700 ],
1701 "neon":{
1702 "common":["src/cpu/kernels/genproposals/generic/neon/impl.cpp"],
1703 "fp16":["src/cpu/kernels/genproposals/generic/neon/fp16.cpp"],
1704 "fp32":["src/cpu/kernels/genproposals/generic/neon/fp32.cpp"],
1705 "qsymm16":["src/cpu/kernels/genproposals/generic/neon/qsymm16.cpp"]
1706 }
Michalis Spyrou20fca522021-06-07 14:23:57 +01001707 }
1708 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001709 "InstanceNormalize": {
1710 "deps": [ "Permute", "Reduction" ],
Michalis Spyrou20fca522021-06-07 14:23:57 +01001711 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001712 "common": [
1713 "src/core/NEON/kernels/NEInstanceNormalizationLayerKernel.cpp",
1714 "src/runtime/NEON/functions/NEInstanceNormalizationLayer.cpp"
ramelg01a1f78512022-06-29 16:28:10 +01001715 ],
Dana Zlotnikd7e2ec52022-01-03 10:59:41 +02001716 "neon":{
1717 "common":["src/cpu/kernels/instancenorm/generic/neon/impl.cpp"],
1718 "fp16":["src/cpu/kernels/instancenorm/generic/neon/fp16.cpp"],
1719 "fp32":["src/cpu/kernels/instancenorm/generic/neon/fp32.cpp"]
1720 }
Michalis Spyrou20fca522021-06-07 14:23:57 +01001721 }
1722 },
1723 "L2Normalize": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001724 "deps": [ "Reduction" ],
Michalis Spyrou20fca522021-06-07 14:23:57 +01001725 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001726 "common": [
1727 "src/core/NEON/kernels/NEL2NormalizeLayerKernel.cpp",
1728 "src/runtime/NEON/functions/NEL2NormalizeLayer.cpp"
Yair Schwarzbaum5e993182022-01-10 15:11:07 +02001729 ],
1730 "neon":{
1731 "common":["src/cpu/kernels/l2normlayer/generic/neon/impl.cpp"],
1732 "fp32":["src/cpu/kernels/l2normlayer/generic/neon/fp32.cpp"],
1733 "fp16":["src/cpu/kernels/l2normlayer/generic/neon/fp16.cpp"]
1734 }
Michalis Spyrou20fca522021-06-07 14:23:57 +01001735 }
1736 },
1737 "Logical": {
1738 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001739 "common": [
1740 "src/core/NEON/kernels/NELogicalKernel.cpp",
1741 "src/runtime/NEON/functions/NELogical.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001742 ]
1743 }
1744 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001745 "LSTM": {
Michalis Spyrou20fca522021-06-07 14:23:57 +01001746 "deps": [
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001747 "Activation",
1748 "Concatenate",
1749 "Copy",
1750 "Dequantize",
1751 "ElementwiseBinary",
1752 "Fill",
1753 "FullyConnected",
1754 "Gemm",
1755 "MeanStdDevNormalize",
1756 "Mul",
1757 "Quantize",
1758 "Slice",
1759 "Transpose"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001760 ],
1761 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001762 "common": [
1763 "src/core/NEON/kernels/NEQLSTMLayerNormalizationKernel.cpp",
1764 "src/runtime/NEON/functions/NELSTMLayer.cpp",
1765 "src/runtime/NEON/functions/NELSTMLayerQuantized.cpp",
1766 "src/runtime/NEON/functions/NEQLSTMLayer.cpp"
1767 ]
1768 }
1769 },
1770 "MaxUnpool2d": {
1771 "deps": [ "Fill" ],
1772 "files": {
1773 "common": [
Dana Zlotnik149203b2022-01-26 12:38:03 +02001774 "src/cpu/kernels/CpuMaxUnpoolingLayerKernel.cpp",
ramelg01a1f78512022-06-29 16:28:10 +01001775 "src/runtime/NEON/functions/NEMaxUnpoolingLayer.cpp",
Dana Zlotnik149203b2022-01-26 12:38:03 +02001776 "src/cpu/operators/CpuMaxUnpooling.cpp"
Dana Zlotnik143310c2021-12-30 13:24:52 +02001777 ],
1778 "neon":{
Dana Zlotnik143310c2021-12-30 13:24:52 +02001779 "fp32":["src/cpu/kernels/maxunpool/generic/neon/fp32.cpp"],
1780 "fp16":["src/cpu/kernels/maxunpool/generic/neon/fp16.cpp"],
1781 "qasymm8":["src/cpu/kernels/maxunpool/generic/neon/qasymm8.cpp"],
Dana Zlotnik149203b2022-01-26 12:38:03 +02001782 "qasymm8_signed":[ "src/cpu/kernels/maxunpool/generic/neon/qasymm8_signed.cpp"],
1783 "common":["src/cpu/kernels/maxunpool/generic/neon/impl.cpp"]
Dana Zlotnik143310c2021-12-30 13:24:52 +02001784 }
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001785 }
1786 },
1787 "Mean": {
1788 "deps" : [ "Reduction" ],
1789 "files": {
1790 "common": [ "src/runtime/NEON/functions/NEReduceMean.cpp" ]
1791 }
1792 },
1793 "MeanStdDevNormalize": {
1794 "files": {
1795 "common": [
1796 "src/core/NEON/kernels/NEMeanStdDevNormalizationKernel.cpp",
1797 "src/runtime/NEON/functions/NEMeanStdDevNormalizationLayer.cpp"
Dana Zlotnik027bcef2021-12-27 17:35:00 +02001798 ],
1799 "neon":{
1800 "common":["src/cpu/kernels/meanstddevnorm/generic/neon/impl.cpp"],
1801 "fp32":["src/cpu/kernels/meanstddevnorm/generic/neon/fp32.cpp"],
Murray Kornelsen6e09e142022-07-13 21:40:26 -04001802 "fp16":["src/cpu/kernels/meanstddevnorm/generic/neon/fp16.cpp"],
1803 "qasymm8":["src/cpu/kernels/meanstddevnorm/generic/neon/qasymm8.cpp"]
Dana Zlotnik027bcef2021-12-27 17:35:00 +02001804 }
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001805 }
1806 },
1807 "Mul": {
1808 "files": {
1809 "common": [
1810 "src/cpu/operators/CpuMul.cpp",
1811 "src/cpu/kernels/CpuMulKernel.cpp",
1812 "src/runtime/NEON/functions/NEPixelWiseMultiplication.cpp"
1813 ]
1814 }
1815 },
1816 "Normalize": {
1817 "deps": [ "Mul" ],
1818 "files": {
1819 "common": [
1820 "src/core/NEON/kernels/NENormalizationLayerKernel.cpp",
1821 "src/runtime/NEON/functions/NENormalizationLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001822 ]
1823 }
1824 },
1825 "Pad": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001826 "deps": [ "Concatenate", "Copy", "StridedSlice" ],
Michalis Spyrou20fca522021-06-07 14:23:57 +01001827 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001828 "common": [
1829 "src/core/NEON/kernels/NEPadLayerKernel.cpp",
1830 "src/runtime/NEON/functions/NEPadLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001831 ]
1832 }
1833 },
1834 "Permute": {
1835 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001836 "common": [
1837 "src/cpu/operators/CpuPermute.cpp",
1838 "src/cpu/kernels/CpuPermuteKernel.cpp",
1839 "src/runtime/NEON/functions/NEPermute.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001840 ]
1841 }
1842 },
1843 "Pool2d": {
1844 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001845 "common": [
1846 "src/cpu/operators/CpuPool2d.cpp",
Georgios Pinitas7891a732021-08-20 21:39:25 +01001847 "src/cpu/kernels/CpuPool2dKernel.cpp",
1848 "src/cpu/kernels/internal/CpuPool2dAssemblyWrapperKernel.cpp",
Motti Gondabi9d9ad332022-01-23 12:42:24 +02001849 "src/runtime/NEON/functions/NEPoolingLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001850 ],
1851 "neon": {
Motti Gondabi9d9ad332022-01-23 12:42:24 +02001852 "common": [
1853 "src/core/NEON/kernels/arm_conv/pooling/kernels/cpp_nhwc_1x1_stride_any_depthfirst/generic.cpp",
1854 "src/core/NEON/kernels/arm_conv/pooling/pooling_fp16.cpp",
1855 "src/core/NEON/kernels/arm_conv/pooling/pooling_fp32.cpp",
1856 "src/core/NEON/kernels/arm_conv/pooling/pooling_s8.cpp",
1857 "src/core/NEON/kernels/arm_conv/pooling/pooling_s8q.cpp",
1858 "src/core/NEON/kernels/arm_conv/pooling/pooling_u8.cpp",
1859 "src/core/NEON/kernels/arm_conv/pooling/pooling_u8q.cpp",
1860 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_fp16_nhwc_avg_3x3_s1_output2x2_depthfirst/generic.cpp",
1861 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_fp16_nhwc_avg_generic_depthfirst/generic.cpp",
1862 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_fp16_nhwc_max_2x2_s1_output2x2_depthfirst/generic.cpp",
1863 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_fp16_nhwc_max_generic_depthfirst/generic.cpp",
1864 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_fp32_nhwc_avg_3x3_s1_output2x2_depthfirst/generic.cpp",
1865 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_fp32_nhwc_avg_generic_depthfirst/generic.cpp",
1866 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_fp32_nhwc_max_2x2_s1_output2x2_depthfirst/generic.cpp",
1867 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_fp32_nhwc_max_generic_depthfirst/generic.cpp",
1868 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_s8_nhwc_avg_generic_depthfirst/generic.cpp",
1869 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_s8_nhwc_max_2x2_s1_output2x2_depthfirst/generic.cpp",
1870 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_s8_nhwc_max_generic_depthfirst/generic.cpp",
1871 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_s8q_nhwc_avg_generic_depthfirst/generic.cpp",
1872 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_s8q_nhwc_max_generic_depthfirst/generic.cpp",
1873 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_u8_nhwc_avg_generic_depthfirst/generic.cpp",
1874 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_u8_nhwc_max_2x2_s1_output2x2_depthfirst/generic.cpp",
1875 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_u8_nhwc_max_generic_depthfirst/generic.cpp",
1876 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_u8q_nhwc_avg_generic_depthfirst/generic.cpp",
ramelg01a1f78512022-06-29 16:28:10 +01001877 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_u8q_nhwc_max_generic_depthfirst/generic.cpp"
Motti Gondabi9d9ad332022-01-23 12:42:24 +02001878 ],
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001879 "nchw": [ "src/cpu/kernels/pool2d/neon/nchw/all.cpp" ],
1880 "fp16": [ "src/cpu/kernels/pool2d/neon/fp16.cpp" ],
ramelg01a1f78512022-06-29 16:28:10 +01001881 "fp32": [ "src/cpu/kernels/pool2d/neon/fp32.cpp" ],
1882 "qasymm8":[ "src/cpu/kernels/pool2d/neon/qasymm8.cpp" ],
Dana Zlotnika538ae52022-02-21 13:12:41 +02001883 "qasymm8_signed":["src/cpu/kernels/pool2d/neon/qasymm8_signed.cpp"]
Michalis Spyrou20fca522021-06-07 14:23:57 +01001884 },
1885 "sve": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001886 "common": [
Michalis Spyrou20fca522021-06-07 14:23:57 +01001887 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_fp16_nhwc_avg_3x3_s1_output2x2_depthfirst/generic.cpp",
1888 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_fp16_nhwc_avg_generic_depthfirst/generic.cpp",
1889 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_fp16_nhwc_max_2x2_s1_output2x2_depthfirst/generic.cpp",
1890 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_fp16_nhwc_max_generic_depthfirst/generic.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001891 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_fp32_nhwc_avg_3x3_s1_output2x2_depthfirst/generic.cpp",
1892 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_fp32_nhwc_avg_generic_depthfirst/generic.cpp",
1893 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_fp32_nhwc_max_2x2_s1_output2x2_depthfirst/generic.cpp",
1894 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_fp32_nhwc_max_generic_depthfirst/generic.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +01001895 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_s8_nhwc_avg_generic_depthfirst/generic.cpp",
1896 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_s8_nhwc_max_2x2_s1_output2x2_depthfirst/generic.cpp",
1897 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_s8_nhwc_max_generic_depthfirst/generic.cpp",
1898 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_s8q_nhwc_avg_generic_depthfirst/generic.cpp",
1899 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_s8q_nhwc_max_generic_depthfirst/generic.cpp",
1900 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_u8_nhwc_avg_generic_depthfirst/generic.cpp",
1901 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_u8_nhwc_max_2x2_s1_output2x2_depthfirst/generic.cpp",
1902 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_u8_nhwc_max_generic_depthfirst/generic.cpp",
1903 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_u8q_nhwc_avg_generic_depthfirst/generic.cpp",
Viet-Hoa Do03b29712022-06-01 11:47:14 +01001904 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_u8q_nhwc_max_generic_depthfirst/generic.cpp",
1905 "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_fp16_nhwc_avg_3x3_s1_output2x2_depthfirst/generic.cpp",
1906 "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_fp16_nhwc_avg_generic_depthfirst/generic.cpp",
1907 "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_fp16_nhwc_max_2x2_s1_output2x2_depthfirst/generic.cpp",
1908 "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_fp16_nhwc_max_generic_depthfirst/generic.cpp",
1909 "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_fp32_nhwc_avg_3x3_s1_output2x2_depthfirst/generic.cpp",
1910 "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_fp32_nhwc_avg_generic_depthfirst/generic.cpp",
1911 "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_fp32_nhwc_max_2x2_s1_output2x2_depthfirst/generic.cpp",
1912 "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_fp32_nhwc_max_generic_depthfirst/generic.cpp",
1913 "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_s8_nhwc_avg_generic_depthfirst/generic.cpp",
1914 "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_s8_nhwc_max_2x2_s1_output2x2_depthfirst/generic.cpp",
1915 "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_s8_nhwc_max_generic_depthfirst/generic.cpp",
1916 "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_s8q_nhwc_avg_generic_depthfirst/generic.cpp",
1917 "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_s8q_nhwc_max_generic_depthfirst/generic.cpp",
1918 "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_u8_nhwc_avg_generic_depthfirst/generic.cpp",
1919 "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_u8_nhwc_max_2x2_s1_output2x2_depthfirst/generic.cpp",
1920 "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_u8_nhwc_max_generic_depthfirst/generic.cpp",
1921 "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_u8q_nhwc_avg_generic_depthfirst/generic.cpp",
1922 "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_u8q_nhwc_max_generic_depthfirst/generic.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001923 ]
1924 }
1925 }
1926 },
Adnan AlSinan171fc3d2022-03-15 18:46:42 +00001927 "Pool3d": {
1928 "files": {
1929 "common": [
1930 "src/cpu/operators/CpuPool3d.cpp",
1931 "src/cpu/kernels/CpuPool3dKernel.cpp",
1932 "src/runtime/NEON/functions/NEPooling3dLayer.cpp"
1933 ],
1934 "neon": {
Adnan AlSinan9104cd52022-04-06 16:19:31 +01001935 "common": [ "src/cpu/kernels/pool3d/neon/impl.cpp" ],
1936 "fp16": [ "src/cpu/kernels/pool3d/neon/fp16.cpp" ],
1937 "fp32": [ "src/cpu/kernels/pool3d/neon/fp32.cpp" ],
1938 "qasymm8": [ "src/cpu/kernels/pool3d/neon/qasymm8.cpp" ],
1939 "qasymm8_signed": [ "src/cpu/kernels/pool3d/neon/qasymm8_signed.cpp" ]
Adnan AlSinan171fc3d2022-03-15 18:46:42 +00001940 }
1941 }
1942 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001943 "PRelu": {
1944 "deps": [ "ElementwiseBinary" ],
Michalis Spyrou20fca522021-06-07 14:23:57 +01001945 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001946 "common": [
1947 "src/runtime/NEON/functions/NEPReluLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001948 ]
1949 }
1950 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001951 "PriorBox": {
Michalis Spyrou20fca522021-06-07 14:23:57 +01001952 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001953 "common": [
1954 "src/core/NEON/kernels/NEPriorBoxLayerKernel.cpp",
1955 "src/runtime/NEON/functions/NEPriorBoxLayer.cpp"
1956 ]
1957 }
1958 },
1959 "Quantize": {
1960 "files": {
1961 "common": [
1962 "src/cpu/operators/CpuQuantize.cpp",
1963 "src/cpu/kernels/CpuQuantizeKernel.cpp",
1964 "src/runtime/NEON/functions/NEQuantizationLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001965 ]
1966 }
1967 },
1968 "Range": {
1969 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001970 "common": [
1971 "src/core/NEON/kernels/NERangeKernel.cpp",
1972 "src/runtime/NEON/functions/NERange.cpp"
Yair Schwarzbaum9e8a7702021-11-08 10:58:06 +02001973 ],
1974 "neon": {
1975 "common": [ "src/cpu/kernels/range/generic/neon/impl.cpp" ],
1976 "fp32": [ "src/cpu/kernels/range/generic/neon/fp32.cpp" ],
1977 "fp16": [ "src/cpu/kernels/range/generic/neon/fp16.cpp" ],
1978 "integer": [ "src/cpu/kernels/range/generic/neon/integer.cpp" ]
1979 }
Michalis Spyrou20fca522021-06-07 14:23:57 +01001980 }
1981 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001982 "Reduction":{
1983 "deps": [ "Reshape" ],
Michalis Spyrou20fca522021-06-07 14:23:57 +01001984 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001985 "common": [
1986 "src/core/NEON/kernels/NEReductionOperationKernel.cpp",
1987 "src/runtime/NEON/functions/NEReductionOperation.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001988 ]
1989 }
1990 },
Michalis Spyrou20fca522021-06-07 14:23:57 +01001991 "Reorg": {
1992 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001993 "common": [
1994 "src/core/NEON/kernels/NEReorgLayerKernel.cpp",
1995 "src/runtime/NEON/functions/NEReorgLayer.cpp"
1996 ]
1997 }
1998 },
1999 "Reshape": {
2000 "files": {
2001 "common": [
2002 "src/cpu/operators/CpuReshape.cpp",
2003 "src/cpu/kernels/CpuReshapeKernel.cpp",
2004 "src/runtime/NEON/functions/NEReshapeLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01002005 ]
2006 }
2007 },
2008 "Reverse": {
2009 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002010 "common": [
2011 "src/core/NEON/kernels/NEReverseKernel.cpp",
2012 "src/runtime/NEON/functions/NEReverse.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01002013 ]
2014 }
2015 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002016 "RNN": {
2017 "deps": [ "Activation", "Add", "FullyConnected", "Gemm"],
2018 "files": {
2019 "common": [ "src/runtime/NEON/functions/NERNNLayer.cpp" ]
2020 }
2021 },
Michalis Spyrou20fca522021-06-07 14:23:57 +01002022 "ROIAlign": {
2023 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002024 "common": [
2025 "src/core/NEON/kernels/NEROIAlignLayerKernel.cpp",
2026 "src/runtime/NEON/functions/NEROIAlignLayer.cpp"
Dana Zlotnik9ae5a4e2022-01-03 16:22:47 +02002027 ],
2028 "neon":{
2029 "common":["src/cpu/kernels/roialign/generic/neon/impl.cpp"],
2030 "fp32":["src/cpu/kernels/roialign/generic/neon/fp32.cpp"],
2031 "fp16":["src/cpu/kernels/roialign/generic/neon/fp16.cpp"],
2032 "qasymm8":["src/cpu/kernels/roialign/generic/neon/qasymm8.cpp"],
2033 "qasymm8_signed":["src/cpu/kernels/roialign/generic/neon/qasymm8_signed.cpp"]
2034 }
Michalis Spyrou20fca522021-06-07 14:23:57 +01002035 }
2036 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002037 "ROIPool2d": {
Michalis Spyrou20fca522021-06-07 14:23:57 +01002038 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002039 "common": [
2040 "src/core/NEON/kernels/NEROIPoolingLayerKernel.cpp",
2041 "src/runtime/NEON/functions/NEROIPoolingLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01002042 ]
2043 }
2044 },
2045 "Scale": {
2046 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002047 "common": [
2048 "src/cpu/operators/CpuScale.cpp",
2049 "src/cpu/kernels/CpuScaleKernel.cpp",
2050 "src/runtime/NEON/functions/NEScale.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01002051 ],
2052 "sve": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002053 "fp16": [ "src/cpu/kernels/scale/sve/fp16.cpp" ],
2054 "fp32": [ "src/cpu/kernels/scale/sve/fp32.cpp" ],
2055 "integer": [ "src/cpu/kernels/scale/sve/integer.cpp" ],
2056 "qasymm8": [ "src/cpu/kernels/scale/sve/qasymm8.cpp" ],
2057 "qasymm8_signed": [ "src/cpu/kernels/scale/sve/qasymm8_signed.cpp" ]
Michalis Spyrou20fca522021-06-07 14:23:57 +01002058 },
2059 "neon": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002060 "fp16": [ "src/cpu/kernels/scale/neon/fp16.cpp" ],
2061 "integer": [ "src/cpu/kernels/scale/neon/integer.cpp" ],
Gunes Bayirc4f27432022-09-11 15:59:19 +01002062 "qasymm8": [ "src/cpu/kernels/scale/neon/qasymm8.cpp", "src/cpu/kernels/scale/neon/integer.cpp" ],
2063 "qasymm8_signed": [ "src/cpu/kernels/scale/neon/qasymm8_signed.cpp", "src/cpu/kernels/scale/neon/integer.cpp" ]
Michalis Spyrou20fca522021-06-07 14:23:57 +01002064 }
2065 }
2066 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002067 "Select": {
2068 "files": {
2069 "common": [
2070 "src/core/NEON/kernels/NESelectKernel.cpp",
2071 "src/runtime/NEON/functions/NESelect.cpp"
Anton Vainer8a9a0fb2022-01-09 14:37:12 +02002072 ],
2073 "neon": {
2074 "common": [ "src/cpu/kernels/select/generic/neon/impl.cpp" ],
2075 "fp32": [ "src/cpu/kernels/select/generic/neon/fp32.cpp" ],
2076 "fp16": [ "src/cpu/kernels/select/generic/neon/fp16.cpp" ],
2077 "integer": [ "src/cpu/kernels/select/generic/neon/integer.cpp" ]
2078 }
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002079 }
2080 },
2081 "Slice": {
2082 "deps": [ "StridedSlice" ],
2083 "files": {
2084 "common": [ "src/runtime/NEON/functions/NESlice.cpp" ]
2085 }
2086 },
Michalis Spyrou20fca522021-06-07 14:23:57 +01002087 "Softmax": {
2088 "deps": [
2089 "Permute"
2090 ],
2091 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002092 "common": [
2093 "src/cpu/operators/CpuSoftmax.cpp",
2094 "src/cpu/kernels/CpuSoftmaxKernel.cpp",
2095 "src/runtime/NEON/functions/NESoftmaxLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01002096 ],
Dana Zlotnikc48a3e52021-12-21 13:34:42 +02002097 "neon":{
Dana Zlotnika538ae52022-02-21 13:12:41 +02002098 "common":["src/cpu/kernels/softmax/generic/neon/impl.cpp"],
Dana Zlotnikc48a3e52021-12-21 13:34:42 +02002099 "fp32": ["src/cpu/kernels/softmax/generic/neon/fp32.cpp"],
ramelg01a1f78512022-06-29 16:28:10 +01002100 "fp16": ["src/cpu/kernels/softmax/generic/neon/fp16.cpp"],
2101 "qasymm8":[ "src/cpu/kernels/softmax/generic/neon/qasymm8.cpp"],
Dana Zlotnik6a2df882022-01-17 09:54:26 +02002102 "qasymm8_signed":["src/cpu/kernels/softmax/generic/neon/qasymm8_signed.cpp"]
Dana Zlotnikc48a3e52021-12-21 13:34:42 +02002103 },
Michalis Spyrou20fca522021-06-07 14:23:57 +01002104 "sve": {
Dana Zlotnikc48a3e52021-12-21 13:34:42 +02002105 "common": [ "src/cpu/kernels/softmax/generic/sve/impl.cpp" ],
2106 "fp32": ["src/cpu/kernels/softmax/generic/sve/fp32.cpp"],
2107 "fp16": ["src/cpu/kernels/softmax/generic/sve/fp16.cpp"],
Dana Zlotnik6a2df882022-01-17 09:54:26 +02002108 "qasymm8": ["src/cpu/kernels/softmax/generic/sve/qasymm8.cpp" ],
2109 "qasymm8_signed": ["src/cpu/kernels/softmax/generic/sve/qasymm8_signed.cpp"]
2110 },
2111 "sve2":{
Dana Zlotnika538ae52022-02-21 13:12:41 +02002112 "common" :["src/cpu/kernels/softmax/generic/sve2/impl.cpp"],
ramelg01a1f78512022-06-29 16:28:10 +01002113 "qasymm8":[ "src/cpu/kernels/softmax/generic/sve2/qasymm8.cpp"],
Dana Zlotnik6a2df882022-01-17 09:54:26 +02002114 "qasymm8_signed":["src/cpu/kernels/softmax/generic/sve2/qasymm8_signed.cpp"]
Michalis Spyrou20fca522021-06-07 14:23:57 +01002115 }
2116 }
2117 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002118 "SpaceToBatch": {
2119 "files": {
2120 "common": [
2121 "src/core/NEON/kernels/NESpaceToBatchLayerKernel.cpp",
2122 "src/runtime/NEON/functions/NESpaceToBatchLayer.cpp"
2123 ]
2124 }
2125 },
2126 "SpaceToDepth": {
2127 "files": {
2128 "common": [
2129 "src/core/NEON/kernels/NESpaceToDepthLayerKernel.cpp",
2130 "src/runtime/NEON/functions/NESpaceToDepthLayer.cpp"
2131 ]
2132 }
2133 },
2134 "Split": {
2135 "deps": [ "StridedSlice" ],
2136 "files": {
2137 "common": [
2138 "src/runtime/NEON/functions/NESplit.cpp"
2139 ]
2140 }
2141 },
2142 "Stack": {
2143 "files": {
2144 "common": [
2145 "src/core/NEON/kernels/NEStackLayerKernel.cpp",
2146 "src/runtime/NEON/functions/NEStackLayer.cpp"
2147 ]
2148 }
2149 },
2150 "StridedSlice": {
2151 "files": {
2152 "common": [
2153 "src/core/NEON/kernels/NEStridedSliceKernel.cpp",
2154 "src/runtime/NEON/functions/NEStridedSlice.cpp"
2155 ]
2156 }
2157 },
Michalis Spyrou20fca522021-06-07 14:23:57 +01002158 "Sub": {
2159 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002160 "common": [
2161 "src/cpu/operators/CpuSub.cpp",
2162 "src/cpu/kernels/CpuSubKernel.cpp",
Freddie Liardet487d3902021-09-21 12:36:43 +01002163 "src/runtime/NEON/functions/NEArithmeticSubtraction.cpp",
2164 "src/cpu/kernels/sub/neon/qasymm8.cpp",
2165 "src/cpu/kernels/sub/neon/qasymm8_signed.cpp",
2166 "src/cpu/kernels/sub/neon/qsymm16.cpp"
2167 ]
Michalis Spyrou20fca522021-06-07 14:23:57 +01002168 }
2169 },
Michalis Spyrou20fca522021-06-07 14:23:57 +01002170 "Tile": {
2171 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002172 "common": [
2173 "src/core/NEON/kernels/NETileKernel.cpp",
2174 "src/runtime/NEON/functions/NETile.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01002175 ]
2176 }
2177 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002178 "Transpose": {
Michalis Spyrou20fca522021-06-07 14:23:57 +01002179 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002180 "common": [
2181 "src/cpu/kernels/CpuTransposeKernel.cpp",
2182 "src/cpu/operators/CpuTranspose.cpp",
2183 "src/runtime/NEON/functions/NETranspose.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01002184 ]
2185 }
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002186 },
2187 "Unstack": {
2188 "deps": [ "StridedSlice" ],
2189 "files": {
2190 "common": [ "src/runtime/NEON/functions/NEUnstack.cpp" ]
2191 }
Michalis Spyrou20fca522021-06-07 14:23:57 +01002192 }
2193 }
Giorgio Arena232c4522022-03-03 10:09:01 +00002194 },
2195 "experimental": {
2196 "dynamic_fusion": [
SiCong Lif44bbc52022-08-29 18:25:51 +01002197 "src/dynamic_fusion/runtime/gpu/cl/ClKernelRuntime.cpp",
2198 "src/dynamic_fusion/runtime/gpu/cl/ClWorkloadRuntime.cpp",
Gunes Bayir7dc02342022-11-21 21:46:50 +00002199
2200 "src/dynamic_fusion/sketch/attributes/DepthwiseConv2dAttributes.cpp",
SiCong Lif44bbc52022-08-29 18:25:51 +01002201 "src/dynamic_fusion/sketch/OperatorAttributes.cpp",
2202 "src/dynamic_fusion/sketch/gpu/GpuKernelArgument.cpp",
2203 "src/dynamic_fusion/sketch/gpu/GpuKernelComponentGraph.cpp",
2204 "src/dynamic_fusion/sketch/gpu/GpuKernelComponentGroup.cpp",
2205 "src/dynamic_fusion/sketch/gpu/GpuKernelComponentStream.cpp",
2206 "src/dynamic_fusion/sketch/gpu/GpuLogicalKernel.cpp",
2207 "src/dynamic_fusion/sketch/gpu/GpuOperatorGroup.cpp",
2208 "src/dynamic_fusion/sketch/gpu/GpuWorkloadContext.cpp",
2209 "src/dynamic_fusion/sketch/gpu/GpuWorkloadSketch.cpp",
Gunes Bayir7dc02342022-11-21 21:46:50 +00002210 "src/dynamic_fusion/sketch/gpu/components/cl/ClComponentDepthwiseConv2d.cpp",
SiCong Lif44bbc52022-08-29 18:25:51 +01002211 "src/dynamic_fusion/sketch/gpu/components/cl/ClComponentDirectConv2d.cpp",
2212 "src/dynamic_fusion/sketch/gpu/components/cl/ClComponentStore.cpp",
2213 "src/dynamic_fusion/sketch/gpu/operators/GpuConv2d.cpp",
Gunes Bayir7dc02342022-11-21 21:46:50 +00002214 "src/dynamic_fusion/sketch/gpu/operators/GpuDepthwiseConv2d.cpp",
2215 "src/dynamic_fusion/sketch/gpu/template_writer/cl/ClTemplateDepthwiseConv2d.cpp",
SiCong Lif44bbc52022-08-29 18:25:51 +01002216 "src/dynamic_fusion/sketch/gpu/template_writer/cl/ClTemplateDirectConv2d.cpp",
2217 "src/dynamic_fusion/sketch/gpu/template_writer/cl/ClTemplateStore.cpp",
2218 "src/dynamic_fusion/sketch/gpu/template_writer/cl/ClTemplateWriter.cpp",
2219 "src/dynamic_fusion/sketch/gpu/template_writer/GpuKernelVariableTable.cpp"
Giorgio Arena232c4522022-03-03 10:09:01 +00002220 ]
Michalis Spyrou20fca522021-06-07 14:23:57 +01002221 }
ramelg018a164882022-04-07 02:42:52 +01002222}