blob: 3fd48e669cdcf2e29d92c5f9dbf26bd21a194d66 [file] [log] [blame]
Georgios Pinitasbdcdc392021-04-22 16:42:03 +01001{
Michalis Spyrou20fca522021-06-07 14:23:57 +01002 "common": [
3 "src/common/cpuinfo/CpuInfo.cpp",
4 "src/common/cpuinfo/CpuModel.cpp",
5 "src/common/cpuinfo/CpuIsaInfo.cpp",
6 "src/common/utils/LegacySupport.cpp",
7 "src/common/AllocatorWrapper.cpp",
8 "src/common/ITensorV2.cpp",
Georgios Pinitas41648142021-08-03 08:24:00 +01009 "src/common/TensorPack.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +010010 "src/common/IOperator.cpp",
11 "src/core/AccessWindowAutoPadding.cpp",
12 "src/core/AccessWindowStatic.cpp",
13 "src/core/AccessWindowTranspose.cpp",
14 "src/core/Error.cpp",
15 "src/core/GPUTarget.cpp",
16 "src/core/Helpers.cpp",
17 "src/core/IAccessWindow.cpp",
18 "src/core/IKernel.cpp",
19 "src/core/ITensor.cpp",
20 "src/core/ITensorPack.cpp",
21 "src/core/Rounding.cpp",
22 "src/core/Size2D.cpp",
23 "src/core/SubTensorInfo.cpp",
24 "src/core/TensorInfo.cpp",
25 "src/core/Utils.cpp",
26 "src/core/Validate.cpp",
27 "src/core/Version.cpp",
28 "src/core/helpers/SoftmaxHelpers.cpp",
Anitha Rajb566b6e2023-08-23 11:40:06 +010029 "src/core/helpers/Utils.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +010030 "src/core/helpers/WindowHelpers.cpp",
Matthew Bentham314d3e22023-06-23 10:53:52 +000031 "src/core/utils/ActivationFunctionUtils.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +010032 "src/core/utils/AssemblyUtils.cpp",
Matthew Bentham314d3e22023-06-23 10:53:52 +000033 "src/core/utils/DataTypeUtils.cpp",
34 "src/core/utils/DataLayoutUtils.cpp",
35 "src/core/utils/InterpolationPolicyUtils.cpp",
36 "src/core/utils/FormatUtils.cpp",
Viet-Hoa Doef9da002023-09-27 16:39:05 +010037 "src/core/utils/Math.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +010038 "src/core/utils/ScaleUtils.cpp",
Matthew Bentham314d3e22023-06-23 10:53:52 +000039 "src/core/utils/StringUtils.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +010040 "src/core/utils/helpers/fft.cpp",
41 "src/core/utils/helpers/tensor_transform.cpp",
42 "src/core/utils/io/FileHandler.cpp",
43 "src/core/utils/misc/MMappedFile.cpp",
44 "src/core/utils/quantization/AsymmHelpers.cpp",
45 "src/core/CPP/CPPTypes.cpp",
46 "src/core/CPP/kernels/CPPBoxWithNonMaximaSuppressionLimitKernel.cpp",
47 "src/core/CPP/kernels/CPPNonMaximumSuppressionKernel.cpp",
48 "src/core/CPP/kernels/CPPPermuteKernel.cpp",
49 "src/core/CPP/kernels/CPPTopKVKernel.cpp",
50 "src/core/CPP/kernels/CPPUpsampleKernel.cpp",
51 "src/runtime/Allocator.cpp",
52 "src/runtime/BlobLifetimeManager.cpp",
53 "src/runtime/BlobMemoryPool.cpp",
54 "src/runtime/ISimpleLifetimeManager.cpp",
55 "src/runtime/ITensorAllocator.cpp",
56 "src/runtime/IWeightsManager.cpp",
57 "src/runtime/IScheduler.cpp",
58 "src/runtime/Memory.cpp",
59 "src/runtime/MemoryManagerOnDemand.cpp",
60 "src/runtime/OffsetLifetimeManager.cpp",
61 "src/runtime/OffsetMemoryPool.cpp",
62 "src/runtime/OperatorTensor.cpp",
63 "src/runtime/PoolManager.cpp",
64 "src/runtime/RuntimeContext.cpp",
65 "src/runtime/Scheduler.cpp",
66 "src/runtime/SchedulerFactory.cpp",
67 "src/runtime/SchedulerUtils.cpp",
68 "src/runtime/SubTensor.cpp",
69 "src/runtime/Tensor.cpp",
70 "src/runtime/TensorAllocator.cpp",
71 "src/runtime/Utils.cpp",
72 "src/runtime/CPP/ICPPSimpleFunction.cpp",
73 "src/runtime/CPP/functions/CPPBoxWithNonMaximaSuppressionLimit.cpp",
74 "src/runtime/CPP/functions/CPPDetectionOutputLayer.cpp",
75 "src/runtime/CPP/functions/CPPDetectionPostProcessLayer.cpp",
76 "src/runtime/CPP/functions/CPPNonMaximumSuppression.cpp",
77 "src/runtime/CPP/functions/CPPPermute.cpp",
78 "src/runtime/CPP/functions/CPPTopKV.cpp",
79 "src/runtime/CPP/functions/CPPUpsample.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +010080 ],
Georgios Pinitasb6af4822021-09-14 12:33:34 +010081 "logging": [
82 "src/core/utils/logging/FilePrinter.cpp",
83 "src/core/utils/logging/Helpers.cpp",
84 "src/core/utils/logging/Logger.cpp",
85 "src/core/utils/logging/LoggerRegistry.cpp"
86 ],
87 "scheduler": {
88 "single": [ "src/runtime/CPP/SingleThreadScheduler.cpp" ],
89 "threads": [ "src/runtime/CPP/CPPScheduler.cpp" ],
90 "omp": [ "src/runtime/OMP/OMPScheduler.cpp"]
91 },
Michalis Spyrou20fca522021-06-07 14:23:57 +010092 "c_api": {
Georgios Pinitas13ef1762021-07-14 17:14:43 +010093 "common": [
Michalis Spyrou20fca522021-06-07 14:23:57 +010094 "src/c/AclContext.cpp",
Georgios Pinitas06ac6e42021-07-05 08:08:52 +010095 "src/c/AclOperator.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +010096 "src/c/AclQueue.cpp",
97 "src/c/AclTensor.cpp",
98 "src/c/AclTensorPack.cpp",
99 "src/c/AclVersion.cpp"
Georgios Pinitasbdcdc392021-04-22 16:42:03 +0100100 ],
Georgios Pinitas13ef1762021-07-14 17:14:43 +0100101 "cpu": [
102 ],
Michalis Spyrou20fca522021-06-07 14:23:57 +0100103 "gpu": [
104 "src/c/cl/AclOpenClExt.cpp"
Georgios Pinitas41648142021-08-03 08:24:00 +0100105 ],
106 "operators":
107 [
108 "src/c/operators/AclActivation.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +0100109 ]
110 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100111 "high_priority": [
112 "Activation",
113 "DepthwiseConv2d",
114 "Conv2d",
115 "Permute",
116 "Pool2d",
SiCong Li83d06742023-05-11 11:54:22 +0100117 "Reshape",
118 "MatMul"
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100119 ],
Michalis Spyrou20fca522021-06-07 14:23:57 +0100120 "gpu": {
Georgios Pinitas13ef1762021-07-14 17:14:43 +0100121 "common": [
Viet-Hoa Do500e10b2023-09-12 17:49:38 +0100122 "src/core/CL/CLCommandBuffer.cpp",
123 "src/core/CL/CLCompatCommandBuffer.cpp",
Georgios Pinitas13ef1762021-07-14 17:14:43 +0100124 "src/core/CL/CLCompileContext.cpp",
Viet-Hoa Do500e10b2023-09-12 17:49:38 +0100125 "src/core/CL/CLMutableCommandBuffer.cpp",
Giorgio Arenaba2dd822021-07-28 16:10:03 +0100126 "src/core/CL/DefaultLWSHeuristics.cpp",
Georgios Pinitas13ef1762021-07-14 17:14:43 +0100127 "src/core/CL/CLHelpers.cpp",
128 "src/core/CL/CLKernelLibrary.cpp",
129 "src/core/CL/CLUtils.cpp",
130 "src/core/CL/ICLKernel.cpp",
131 "src/core/CL/ICLSimple2DKernel.cpp",
132 "src/core/CL/ICLSimple3DKernel.cpp",
133 "src/core/CL/ICLSimpleKernel.cpp",
134 "src/core/CL/ICLTensor.cpp",
135 "src/core/CL/OpenCL.cpp",
Georgios Pinitas13ef1762021-07-14 17:14:43 +0100136 "src/gpu/cl/ClContext.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100137 "src/gpu/cl/ClKernelLibrary.cpp",
Georgios Pinitas13ef1762021-07-14 17:14:43 +0100138 "src/gpu/cl/ClQueue.cpp",
139 "src/gpu/cl/ClTensor.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100140 "src/core/CL/kernels/CLFillBorderKernel.cpp",
Georgios Pinitas13ef1762021-07-14 17:14:43 +0100141 "src/runtime/CL/CLBufferAllocator.cpp",
142 "src/runtime/CL/CLGEMMHeuristicsHandle.cpp",
143 "src/runtime/CL/CLHelpers.cpp",
144 "src/runtime/CL/CLMemory.cpp",
145 "src/runtime/CL/CLMemoryRegion.cpp",
146 "src/runtime/CL/CLOperator.cpp",
147 "src/runtime/CL/CLRuntimeContext.cpp",
148 "src/runtime/CL/CLScheduler.cpp",
149 "src/runtime/CL/CLSubTensor.cpp",
150 "src/runtime/CL/CLTensor.cpp",
151 "src/runtime/CL/CLTensorAllocator.cpp",
152 "src/runtime/CL/CLTuner.cpp",
153 "src/runtime/CL/ICLSimpleFunction.cpp",
154 "src/runtime/CL/Utils.cpp",
Georgios Pinitas13ef1762021-07-14 17:14:43 +0100155 "src/runtime/CL/mlgo/HeuristicTree.cpp",
156 "src/runtime/CL/mlgo/MLGOHeuristics.cpp",
157 "src/runtime/CL/mlgo/MLGOParser.cpp",
158 "src/runtime/CL/mlgo/Utils.cpp",
159 "src/runtime/CL/tuners/CLTuningParametersList.cpp"
160 ],
Michalis Spyrou20fca522021-06-07 14:23:57 +0100161 "operators": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100162 "Activation":{
163 "files": {
164 "common": [
165 "src/gpu/cl/kernels/ClActivationKernel.cpp",
166 "src/gpu/cl/operators/ClActivation.cpp",
167 "src/runtime/CL/functions/CLActivationLayer.cpp"
168 ]
169 }
170 },
171 "ArgMinMax": {
172 "deps": [ "Reshape" ],
173 "files": {
174 "common": [
175 "src/core/CL/kernels/CLArgMinMaxLayerKernel.cpp",
176 "src/runtime/CL/functions/CLArgMinMaxLayer.cpp"
177 ]
178 }
179 },
180 "Add": {
181 "files": {
182 "common": [
183 "src/gpu/cl/kernels/ClElementwiseKernel.cpp",
184 "src/gpu/cl/operators/ClAdd.cpp"
185 ]
186 }
187 },
188 "BatchNormalization": {
189 "files": {
190 "common": [
191 "src/core/CL/kernels/CLBatchNormalizationLayerKernel.cpp",
192 "src/core/CL/kernels/CLFuseBatchNormalizationKernel.cpp",
193 "src/runtime/CL/functions/CLBatchNormalizationLayer.cpp",
194 "src/runtime/CL/functions/CLFuseBatchNormalization.cpp"
195 ]
196 }
197 },
198 "BatchToSpace": {
199 "files": {
200 "common": [
201 "src/core/CL/kernels/CLBatchToSpaceLayerKernel.cpp",
202 "src/runtime/CL/functions/CLBatchToSpaceLayer.cpp"
203 ]
204 }
205 },
206 "Bitwise": {
207 "files": {
208 "common": [ "src/core/CL/kernels/CLBitwiseKernel.cpp" ]
209 }
210 },
211 "BitwiseAnd": {
212 "deps": [ "Bitwise" ],
213 "files": {
214 "common": [ "src/runtime/CL/functions/CLBitwiseAnd.cpp" ]
215 }
216 },
217 "BitwiseNot": {
218 "deps": [ "Bitwise" ],
219 "files": {
220 "common": [ "src/runtime/CL/functions/CLBitwiseNot.cpp" ]
221 }
222 },
223 "BitwiseOr": {
224 "deps": [ "Bitwise" ],
225 "files": {
226 "common": [ "src/runtime/CL/functions/CLBitwiseOr.cpp" ]
227 }
228 },
229 "BitwiseXor": {
230 "deps": [ "Bitwise" ],
231 "files": {
232 "common": [ "src/runtime/CL/functions/CLBitwiseXor.cpp" ]
233 }
234 },
235 "BoundingBoxTransform": {
236 "files": {
237 "common": [
238 "src/core/CL/kernels/CLBoundingBoxTransformKernel.cpp",
239 "src/runtime/CL/functions/CLBoundingBoxTransform.cpp"
240 ]
241 }
242 },
243 "Cast": {
244 "files": {
245 "common": [
246 "src/gpu/cl/kernels/ClCastKernel.cpp",
247 "src/gpu/cl/operators/ClCast.cpp",
248 "src/runtime/CL/functions/CLCast.cpp"
249 ]
250 }
251 },
252 "ChannelShuffle": {
253 "files": {
254 "common": [
255 "src/core/CL/kernels/CLChannelShuffleLayerKernel.cpp",
256 "src/runtime/CL/functions/CLChannelShuffleLayer.cpp"
257 ]
258 }
259 },
260 "Comparison": {
261 "files": {
262 "common": [
263 "src/core/CL/kernels/CLComparisonKernel.cpp",
264 "src/runtime/CL/functions/CLComparison.cpp"
265 ]
266 }
267 },
268 "Concatenate": {
269 "files": {
270 "common": [
271 "src/gpu/cl/kernels/ClBatchConcatenateKernel.cpp",
272 "src/gpu/cl/kernels/ClDepthConcatenateKernel.cpp",
273 "src/gpu/cl/kernels/ClHeightConcatenateKernel.cpp",
274 "src/gpu/cl/kernels/ClWidthConcatenate2TensorsKernel.cpp",
275 "src/gpu/cl/kernels/ClWidthConcatenate4TensorsKernel.cpp",
276 "src/gpu/cl/kernels/ClWidthConcatenateKernel.cpp",
277 "src/gpu/cl/operators/ClConcatenate.cpp",
278 "src/runtime/CL/functions/CLConcatenateLayer.cpp"
279 ]
280 }
281 },
282 "Conv2d": {
283 "deps": [
284 "Activation",
285 "ElementwiseBinary",
286 "FFT2D",
287 "Gemm",
288 "Mul",
289 "Pad",
290 "Permute",
291 "Reduction",
292 "Reshape",
293 "Reverse",
294 "Slice"
295 ],
296 "files": {
297 "common": [
298 "src/gpu/cl/kernels/ClDirectConv2dKernel.cpp",
299 "src/gpu/cl/kernels/ClWinogradFilterTransformKernel.cpp",
300 "src/gpu/cl/kernels/ClWinogradInputTransformKernel.cpp",
301 "src/gpu/cl/kernels/ClWinogradOutputTransformKernel.cpp",
302 "src/gpu/cl/kernels/ClIm2ColKernel.cpp",
Gian Marco Iodice76335eb2022-11-17 11:03:39 +0000303 "src/gpu/cl/kernels/ClIndirectConv2dKernel.cpp",
Gian Marco Iodice5d016812022-11-17 11:03:39 +0000304 "src/gpu/cl/kernels/ClIndirectConv2dAddressPrecalculationKernel.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100305 "src/gpu/cl/kernels/ClCol2ImKernel.cpp",
306 "src/gpu/cl/operators/ClConv2d.cpp",
307 "src/gpu/cl/operators/ClDirectConv2d.cpp",
308 "src/gpu/cl/operators/ClGemmConv2d.cpp",
Gian Marco Iodice76335eb2022-11-17 11:03:39 +0000309 "src/gpu/cl/operators/ClIndirectConv2d.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100310 "src/gpu/cl/operators/ClWinogradConv2d.cpp",
311 "src/gpu/cl/kernels/ClWeightsReshapeKernel.cpp",
312 "src/runtime/CL/functions/CLConvolutionLayer.cpp",
313 "src/runtime/CL/functions/CLDirectConvolutionLayer.cpp",
314 "src/runtime/CL/functions/CLFFTConvolutionLayer.cpp",
315 "src/runtime/CL/functions/CLGEMMConvolutionLayer.cpp",
Gian Marco Iodice76335eb2022-11-17 11:03:39 +0000316 "src/runtime/CL/functions/CLIndirectConvolutionLayer.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100317 "src/runtime/CL/functions/CLWinogradConvolutionLayer.cpp"
318 ]
319 }
320 },
Giorgio Arena273c28c2021-10-14 15:59:15 +0100321 "Conv3d": {
322 "files": {
323 "common": [
324 "src/gpu/cl/kernels/ClDirectConv3dKernel.cpp",
325 "src/gpu/cl/operators/ClDirectConv3d.cpp",
326 "src/runtime/CL/functions/CLConv3D.cpp"
327 ]
328 }
329 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100330 "Copy": {
331 "files": {
332 "common": [
333 "src/gpu/cl/kernels/ClCopyKernel.cpp",
334 "src/gpu/cl/operators/ClCopy.cpp",
335 "src/runtime/CL/functions/CLCopy.cpp"
336 ]
337 }
338 },
339 "CropResize": {
340 "deps": [ "Copy", "Fill", "Scale" ],
341 "files": {
342 "common": [
343 "src/gpu/cl/kernels/ClCropKernel.cpp",
344 "src/gpu/cl/operators/ClCrop.cpp",
345 "src/runtime/CL/functions/CLCrop.cpp",
346 "src/runtime/CL/functions/CLCropResize.cpp"
347 ]
348 }
349 },
350 "Deconv2d": {
351 "deps": [ "Conv2d", "Reverse", "Transpose"],
352 "files": {
353 "common": [
354 "src/core/CL/kernels/CLDeconvolutionLayerUpsampleKernel.cpp",
355 "src/core/CL/kernels/CLDeconvolutionReshapeOutputKernel.cpp",
Gunes Bayirec0113d2022-11-09 09:26:27 +0000356 "src/gpu/cl/kernels/ClTransposedConvolutionKernel.cpp",
357 "src/gpu/cl/operators/ClTransposedConvolution.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100358 "src/runtime/CL/functions/CLDeconvolutionLayer.cpp",
359 "src/runtime/CL/functions/CLDeconvolutionLayerUpsample.cpp",
360 "src/runtime/CL/functions/CLDirectDeconvolutionLayer.cpp",
361 "src/runtime/CL/functions/CLGEMMDeconvolutionLayer.cpp"
362 ]
363 }
364 },
365 "DepthConvert": {
366 "deps": [ "Cast"],
367 "files": {
368 "common": [ "src/runtime/CL/functions/CLDepthConvertLayer.cpp" ]
369 }
370 },
371 "DepthToSpace": {
372 "files": {
373 "common": [
374 "src/core/CL/kernels/CLDepthToSpaceLayerKernel.cpp",
375 "src/runtime/CL/functions/CLDepthToSpaceLayer.cpp"
376 ]
377 }
378 },
379 "DepthwiseConv2d": {
380 "deps": [ "Permute" ],
381 "files": {
382 "common": [
383 "src/core/CL/kernels/CLDepthwiseConvolutionLayerNativeKernel.cpp",
384 "src/runtime/CL/functions/CLDepthwiseConvolutionLayer.cpp"
385 ]
386 }
387 },
388 "Dequantize": {
389 "files": {
390 "common": [
391 "src/gpu/cl/kernels/ClDequantizeKernel.cpp",
392 "src/gpu/cl/operators/ClDequantize.cpp",
393 "src/runtime/CL/functions/CLDequantizationLayer.cpp"
394 ]
395 }
396 },
397 "ElementwiseBinary": {
398 "deps": ["Add", "Sub"],
399 "files": {
400 "common": [
401 "src/gpu/cl/kernels/ClElementwiseKernel.cpp",
402 "src/gpu/cl/operators/ClElementwiseOperations.cpp",
403 "src/runtime/CL/functions/CLElementwiseOperations.cpp"
404 ]
405 }
406 },
407 "ElementwiseUnary":{
408 "files": {
409 "common": [
410 "src/gpu/cl/kernels/ClElementwiseUnaryKernel.cpp",
411 "src/gpu/cl/operators/ClElementwiseUnary.cpp",
412 "src/runtime/CL/functions/CLElementwiseUnaryLayer.cpp"
413 ]
414 }
415 },
416 "FFT1D": {
417 "files": {
418 "common": [
419 "src/core/CL/kernels/CLFFTDigitReverseKernel.cpp",
420 "src/core/CL/kernels/CLFFTRadixStageKernel.cpp",
421 "src/core/CL/kernels/CLFFTScaleKernel.cpp",
422 "src/runtime/CL/functions/CLFFT1D.cpp"
423 ]
424 }
425 },
426 "FFT2D": {
427 "deps": [ "FFT1D" ],
428 "files": {
429 "common": [ "src/runtime/CL/functions/CLFFT2D.cpp" ]
430 }
431 },
432 "Fill": {
433 "files": {
434 "common": [
435 "src/gpu/cl/kernels/ClFillKernel.cpp",
436 "src/gpu/cl/operators/ClFill.cpp",
437 "src/runtime/CL/functions/CLFill.cpp"
438 ]
439 }
440 },
441 "Flatten": {
442 "files": {
443 "common": [
444 "src/gpu/cl/operators/ClFlatten.cpp",
445 "src/runtime/CL/functions/CLFlattenLayer.cpp"
446 ]
447 }
448 },
449 "Floor": {
450 "files": {
451 "common": [
452 "src/gpu/cl/kernels/ClFloorKernel.cpp",
453 "src/gpu/cl/operators/ClFloor.cpp",
454 "src/runtime/CL/functions/CLFloor.cpp"
455 ]
456 }
457 },
458 "FullyConnected": {
459 "deps": [ "Flatten", "Gemm", "Transpose"],
460 "files": {
461 "common": [
462 "src/gpu/cl/kernels/ClConvertFullyConnectedWeightsKernel.cpp",
463 "src/gpu/cl/operators/ClConvertFullyConnectedWeights.cpp",
464 "src/gpu/cl/operators/ClFullyConnected.cpp",
465 "src/runtime/CL/functions/CLConvertFullyConnectedWeights.cpp",
466 "src/runtime/CL/functions/CLFullyConnectedLayer.cpp"
467 ]
468 }
469 },
470 "Gather": {
471 "files": {
472 "common": [
473 "src/core/CL/kernels/CLGatherKernel.cpp",
474 "src/runtime/CL/functions/CLGather.cpp"]
475 }
476 },
477 "Gemm": {
478 "deps": [ "Cast" ],
479 "files": {
480 "common": [
481 "src/gpu/cl/kernels/gemm/ClGemmHelpers.cpp",
482 "src/gpu/cl/kernels/gemm/native/ClGemmDefaultConfigNativeBifrost.cpp",
483 "src/gpu/cl/kernels/gemm/native/ClGemmDefaultConfigNativeMidgard.cpp",
484 "src/gpu/cl/kernels/gemm/native/ClGemmDefaultConfigNativeValhall.cpp",
485 "src/gpu/cl/kernels/gemm/reshaped/ClGemmDefaultConfigReshapedBifrost.cpp",
486 "src/gpu/cl/kernels/gemm/reshaped/ClGemmDefaultConfigReshapedValhall.cpp",
487 "src/gpu/cl/kernels/gemm/reshaped_only_rhs/ClGemmDefaultConfigReshapedRhsOnlyBifrost.cpp",
488 "src/gpu/cl/kernels/gemm/reshaped_only_rhs/ClGemmDefaultConfigReshapedRhsOnlyValhall.cpp",
489 "src/gpu/cl/kernels/ClGemmLowpMatrixMultiplyNativeKernel.cpp",
490 "src/gpu/cl/kernels/ClGemmLowpMatrixMultiplyReshapedKernel.cpp",
491 "src/gpu/cl/kernels/ClGemmLowpMatrixMultiplyReshapedOnlyRhsKernel.cpp",
Freddie Liardete572dff2022-05-16 14:09:10 +0100492 "src/gpu/cl/kernels/ClGemmLowpMatrixMultiplyReshapedOnlyRhsMMULKernel.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100493 "src/gpu/cl/kernels/ClGemmLowpOffsetContributionKernel.cpp",
494 "src/gpu/cl/kernels/ClGemmLowpOffsetContributionOutputStageKernel.cpp",
495 "src/gpu/cl/kernels/ClGemmLowpQuantizeDownInt32ScaleByFixedPointKernel.cpp",
496 "src/gpu/cl/kernels/ClGemmLowpQuantizeDownInt32ScaleByFloatKernel.cpp",
497 "src/gpu/cl/kernels/ClGemmLowpQuantizeDownInt32ScaleKernel.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100498 "src/gpu/cl/kernels/ClGemmMatrixMultiplyNativeKernel.cpp",
Gunes Bayir4bfc70e2021-12-10 16:17:56 +0000499 "src/gpu/cl/kernels/ClGemmMatrixMultiplyReshapedOnlyRhsMMULKernel.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100500 "src/gpu/cl/kernels/ClGemmMatrixMultiplyReshapedKernel.cpp",
501 "src/gpu/cl/kernels/ClGemmMatrixMultiplyReshapedOnlyRhsKernel.cpp",
502 "src/gpu/cl/kernels/ClGemmReshapeLhsMatrixKernel.cpp",
503 "src/gpu/cl/kernels/ClGemmReshapeRhsMatrixKernel.cpp",
504 "src/gpu/cl/kernels/ClGemmLowpReductionKernel.cpp",
505 "src/gpu/cl/operators/ClGemm.cpp",
506 "src/gpu/cl/operators/ClGemmLowpMatrixMultiplyCore.cpp",
507 "src/gpu/cl/operators/ClGemmLowpOutputStage.cpp",
508 "src/runtime/CL/gemm/CLGEMMDefaultTypeBifrost.cpp",
509 "src/runtime/CL/gemm/CLGEMMDefaultTypeMidgard.cpp",
510 "src/runtime/CL/gemm/CLGEMMDefaultTypeValhall.cpp",
511 "src/runtime/CL/gemm_auto_heuristics/CLGEMMAutoHeuristics.cpp",
512 "src/runtime/CL/functions/CLGEMM.cpp",
513 "src/runtime/CL/functions/CLGEMMLowpMatrixMultiplyCore.cpp",
Ramy Elgammaldf6a3b02022-11-30 16:23:10 +0000514 "src/runtime/CL/functions/CLGEMMLowpOutputStage.cpp",
515 "src/runtime/heuristics/direct_conv/ClDirectConvDefaultConfigBifrost.cpp",
Gian Marco Iodicea5cb79f2022-12-28 13:53:51 +0000516 "src/runtime/heuristics/direct_conv/ClDirectConvDefaultConfigValhall.cpp",
Gian Marco Iodice9d3bd412022-12-30 09:45:00 +0000517 "src/runtime/heuristics/dwc_native/ClDWCNativeDefaultConfigBifrost.cpp",
518 "src/runtime/heuristics/dwc_native/ClDWCNativeDefaultConfigValhall.cpp",
519 "src/runtime/heuristics/dwc_native/ClDWCNativeHeuristicsHelpers.cpp",
Ramy Elgammal34a95d12023-05-11 18:23:44 +0100520 "src/runtime/heuristics/indirect_conv/ClIndirectConvDefaultConfigValhall.cpp"
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100521 ]
522 }
523 },
Ramy Elgammal2b6ebfe2023-03-09 21:15:37 +0000524 "MatMul": {
525 "files": {
526 "common": [
Gunes Bayir9d0c4de2023-04-13 18:22:58 +0100527 "src/gpu/cl/kernels/ClMatMulLowpNativeKernel.cpp",
Gunes Bayire87fa662023-09-07 12:20:33 +0100528 "src/gpu/cl/kernels/ClMatMulLowpNativeMMULKernel.cpp",
Jakub Sujak1ed6a142023-04-13 21:14:42 +0100529 "src/gpu/cl/kernels/ClMatMulNativeKernel.cpp",
SiCong Lia8d80582023-05-19 14:23:37 +0100530 "src/gpu/cl/kernels/ClMatMulNativeMMULKernel.cpp",
Gunes Bayire87fa662023-09-07 12:20:33 +0100531 "src/gpu/cl/kernels/helpers/MatMulKernelHelpers.cpp",
Ramy Elgammalf26ea2f2023-03-24 11:42:03 +0000532 "src/gpu/cl/operators/ClMatMul.cpp",
Ramy Elgammal34a95d12023-05-11 18:23:44 +0100533 "src/runtime/CL/functions/CLMatMul.cpp",
534 "src/runtime/heuristics/matmul_native/ClMatMulNativeDefaultConfigValhall.cpp",
535 "src/runtime/heuristics/matmul_native/ClMatMulNativeHelpers.cpp"
Ramy Elgammal2b6ebfe2023-03-09 21:15:37 +0000536 ]
537 }
538 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100539 "GenerateProposals": {
540 "deps": [ "BoundingBoxTransform", "Dequantize", "Pad", "Permute", "Quantize", "Reshape" ],
541 "files": {
542 "common": [
543 "src/core/CL/kernels/CLGenerateProposalsLayerKernel.cpp",
544 "src/runtime/CL/functions/CLGenerateProposalsLayer.cpp"
545 ]
546 }
547 },
548 "InstanceNormalize": {
549 "files": {
550 "common": [
551 "src/core/CL/kernels/CLInstanceNormalizationLayerKernel.cpp",
552 "src/runtime/CL/functions/CLInstanceNormalizationLayer.cpp"
553 ]
554 }
555 },
556 "L2Normalize": {
557 "deps": [ "Reduction" ],
558 "files": {
559 "common": [
560 "src/core/CL/kernels/CLL2NormalizeLayerKernel.cpp",
561 "src/runtime/CL/functions/CLL2NormalizeLayer.cpp"
562 ]
563 }
564 },
565 "Logical": {
566 "files": {
567 "common": [
568 "src/gpu/cl/operators/ClLogicalNot.cpp",
569 "src/runtime/CL/functions/CLLogicalAnd.cpp",
570 "src/runtime/CL/functions/CLLogicalNot.cpp",
571 "src/runtime/CL/functions/CLLogicalOr.cpp"
572 ]
573 }
574 },
575 "LSTM": {
576 "deps": [
577 "Activation",
578 "Concatenate",
579 "Copy",
580 "Dequantize",
581 "ElementwiseBinary",
582 "Fill",
583 "FullyConnected",
584 "Gemm",
585 "MeanStdDevNormalize",
586 "Mul",
587 "Quantize",
588 "Slice",
589 "Transpose"
590 ],
591 "files": {
592 "common": [
593 "src/core/CL/kernels/CLQLSTMLayerNormalizationKernel.cpp",
594 "src/runtime/CL/functions/CLQLSTMLayer.cpp",
595 "src/runtime/CL/functions/CLLSTMLayer.cpp",
596 "src/runtime/CL/functions/CLLSTMLayerQuantized.cpp"
597 ]
598 }
599 },
600 "MaxUnpool2d": {
601 "deps": [ "Fill" ],
602 "files": {
603 "common": [
604 "src/core/CL/kernels/CLMaxUnpoolingLayerKernel.cpp",
605 "src/runtime/CL/functions/CLMaxUnpoolingLayer.cpp"
606 ]
607 }
608 },
609 "MeanStdDevNormalize": {
610 "deps": [ "Reduction" ],
611 "files": {
612 "common": [
613 "src/core/CL/kernels/CLMeanStdDevNormalizationKernel.cpp",
614 "src/runtime/CL/functions/CLMeanStdDevNormalizationLayer.cpp",
615 "src/runtime/CL/functions/CLReduceMean.cpp"
616 ]
617 }
618 },
619 "Mul": {
620 "files": {
621 "common": [
622 "src/gpu/cl/kernels/ClMulKernel.cpp",
623 "src/gpu/cl/operators/ClMul.cpp",
624 "src/runtime/CL/functions/CLPixelWiseMultiplication.cpp"
625 ]
626 }
627 },
628 "Normalize": {
629 "files": {
630 "common": [
631 "src/core/CL/kernels/CLNormalizationLayerKernel.cpp",
632 "src/runtime/CL/functions/CLNormalizationLayer.cpp"
633 ]
634 }
635 },
636 "Pad": {
637 "deps": [ "Copy" ],
638 "files": {
639 "common": [
640 "src/core/CL/kernels/CLPadLayerKernel.cpp",
641 "src/runtime/CL/functions/CLPadLayer.cpp"
642 ]
643 }
644 },
645 "Permute": {
646 "files": {
647 "common": [
648 "src/gpu/cl/kernels/ClPermuteKernel.cpp",
649 "src/gpu/cl/operators/ClPermute.cpp",
650 "src/runtime/CL/functions/CLPermute.cpp"
651 ]
652 }
653 },
654 "Pool2d": {
655 "files": {
656 "common": [
657 "src/gpu/cl/kernels/ClPool2dKernel.cpp",
658 "src/gpu/cl/operators/ClPool2d.cpp",
659 "src/runtime/CL/functions/CLPoolingLayer.cpp"
660 ]
661 }
662 },
ramelg0137515692022-02-26 22:06:20 +0000663 "Pool3d": {
664 "files": {
665 "common": [
666 "src/gpu/cl/kernels/ClPool3dKernel.cpp",
667 "src/gpu/cl/operators/ClPool3d.cpp",
668 "src/runtime/CL/functions/CLPooling3dLayer.cpp"
669 ]
670 }
671 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100672 "PRelu": {
673 "deps": [ "ElementwiseBinary" ],
674 "files": {
675 "common": [
676 "src/gpu/cl/operators/ClPRelu.cpp",
677 "src/runtime/CL/functions/CLPReluLayer.cpp"
678 ]
679 }
680 },
681 "PriorBox": {
682 "files": {
683 "common": [
684 "src/core/CL/kernels/CLPriorBoxLayerKernel.cpp",
685 "src/runtime/CL/functions/CLPriorBoxLayer.cpp"
686 ]
687 }
688 },
689 "Quantize": {
690 "files": {
691 "common": [
692 "src/gpu/cl/kernels/ClQuantizeKernel.cpp",
693 "src/gpu/cl/operators/ClQuantize.cpp",
694 "src/runtime/CL/functions/CLQuantizationLayer.cpp"
695 ]
696 }
697 },
698 "Range": {
699 "files": {
700 "common": [
701 "src/core/CL/kernels/CLRangeKernel.cpp",
702 "src/runtime/CL/functions/CLRange.cpp"
703 ]
704 }
705 },
706 "Reduction": {
707 "deps": [ "Reshape" ],
708 "files": {
ramelg01a1f78512022-06-29 16:28:10 +0100709 "common": [
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100710 "src/core/CL/kernels/CLReductionOperationKernel.cpp",
711 "src/runtime/CL/functions/CLReductionOperation.cpp"
712 ]
713 }
714 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100715 "Reorg": {
716 "files": {
717 "common": [
718 "src/core/CL/kernels/CLReorgLayerKernel.cpp",
719 "src/runtime/CL/functions/CLReorgLayer.cpp"
720 ]
721 }
722 },
723 "Reshape": {
724 "files": {
725 "common": [
726 "src/gpu/cl/kernels/ClReshapeKernel.cpp",
727 "src/gpu/cl/operators/ClReshape.cpp",
728 "src/runtime/CL/functions/CLReshapeLayer.cpp"
729 ]
730 }
731 },
732 "Reverse": {
733 "files": {
734 "common": [
735 "src/core/CL/kernels/CLReverseKernel.cpp",
736 "src/runtime/CL/functions/CLReverse.cpp"
737 ]
738 }
739 },
740 "RNN": {
741 "deps": [ "Activation", "Cast", "ElementwiseBinary", "FullyConnected", "Gemm"],
742 "files": {
743 "common": [ "src/runtime/CL/functions/CLRNNLayer.cpp" ]
744 }
745 },
746 "ROIAlign": {
747 "files": {
748 "common": [
749 "src/core/CL/kernels/CLROIAlignLayerKernel.cpp",
750 "src/runtime/CL/functions/CLROIAlignLayer.cpp"
751 ]
752 }
753 },
754 "ROIPool2d": {
755 "files": {
756 "common": [
757 "src/core/CL/kernels/CLROIPoolingLayerKernel.cpp",
758 "src/runtime/CL/functions/CLROIPoolingLayer.cpp"
759 ]
760 }
761 },
762 "Scale": {
763 "files": {
764 "common": [
765 "src/gpu/cl/kernels/ClScaleKernel.cpp",
766 "src/gpu/cl/operators/ClScale.cpp",
767 "src/runtime/CL/functions/CLScale.cpp"
768 ]
769 }
770 },
771 "Select": {
772 "files": {
773 "common": [
774 "src/core/CL/kernels/CLSelectKernel.cpp",
775 "src/runtime/CL/functions/CLSelect.cpp"
776 ]
777 }
778 },
779 "Slice": {
780 "deps": [ "StridedSlice" ],
781 "files": {
782 "common": [ "src/runtime/CL/functions/CLSlice.cpp" ]
783 }
784 },
785 "Softmax": {
786 "deps": [ "Permute" ],
787 "files": {
788 "common": [
789 "src/gpu/cl/kernels/ClSoftmaxKernel.cpp",
790 "src/gpu/cl/operators/ClSoftmax.cpp",
791 "src/runtime/CL/functions/CLSoftmaxLayer.cpp"
792 ]
793 }
794 },
795 "SpaceToBatch": {
796 "files": {
797 "common": [
798 "src/core/CL/kernels/CLSpaceToBatchLayerKernel.cpp",
799 "src/runtime/CL/functions/CLSpaceToBatchLayer.cpp"
800 ]
801 }
802 },
803 "SpaceToDepth": {
804 "files": {
805 "common": [
806 "src/core/CL/kernels/CLSpaceToDepthLayerKernel.cpp",
807 "src/runtime/CL/functions/CLSpaceToDepthLayer.cpp"
808 ]
809 }
810 },
811 "Split": {
812 "deps": [ "StridedSlice" ],
813 "files": {
814 "common": [ "src/runtime/CL/functions/CLSplit.cpp" ]
815 }
816 },
817 "Stack": {
818 "files": {
819 "common": [
820 "src/core/CL/kernels/CLStackLayerKernel.cpp",
821 "src/runtime/CL/functions/CLStackLayer.cpp"
822 ]
823 }
824 },
825 "StridedSlice": {
826 "files": {
827 "common": [
828 "src/core/CL/kernels/CLStridedSliceKernel.cpp",
829 "src/runtime/CL/functions/CLStridedSlice.cpp"
830 ]
831 }
832 },
833 "Sub": {
834 "files": {
835 "common": [
836 "src/gpu/cl/kernels/ClElementwiseKernel.cpp",
837 "src/gpu/cl/operators/ClSub.cpp"
838 ]
839 }
840 },
841 "Tile": {
842 "files": {
843 "common": [
844 "src/core/CL/kernels/CLTileKernel.cpp",
845 "src/runtime/CL/functions/CLTile.cpp"
846 ]
847 }
848 },
849 "Transpose": {
850 "files": {
851 "common": [
852 "src/gpu/cl/kernels/ClTransposeKernel.cpp",
853 "src/gpu/cl/operators/ClTranspose.cpp",
854 "src/runtime/CL/functions/CLTranspose.cpp"
855 ]
856 }
857 },
858 "Unstack": {
859 "deps": [ "StridedSlice" ],
860 "files": {
861 "common": [ "src/runtime/CL/functions/CLUnstack.cpp" ]
862 }
863 },
864 "YUVNormalize": {
865 "files": {
866 "common": [
867 "src/core/CL/kernels/CLNormalizePlanarYUVLayerKernel.cpp",
868 "src/runtime/CL/functions/CLNormalizePlanarYUVLayer.cpp"
869 ]
Michalis Spyrou20fca522021-06-07 14:23:57 +0100870 }
Georgios Pinitasbdcdc392021-04-22 16:42:03 +0100871 }
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100872 }
873},
Michalis Spyrou20fca522021-06-07 14:23:57 +0100874 "cpu": {
Georgios Pinitas13ef1762021-07-14 17:14:43 +0100875 "common": [
Michalis Spyrou20fca522021-06-07 14:23:57 +0100876 "src/cpu/CpuContext.cpp",
877 "src/cpu/CpuQueue.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100878 "src/cpu/CpuTensor.cpp",
879 "src/core/NEON/kernels/NEFillBorderKernel.cpp",
880 "src/runtime/NEON/INEOperator.cpp",
881 "src/runtime/NEON/INESimpleFunction.cpp",
882 "src/runtime/NEON/INESimpleFunctionNoBorder.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +0100883 ],
884 "operators": {
885 "Activation": {
Viet-Hoa Dofd472f02023-03-15 14:05:06 +0000886 "deps": [ "LUT" ],
Michalis Spyrou20fca522021-06-07 14:23:57 +0100887 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100888 "common": [
889 "src/cpu/operators/CpuActivation.cpp",
890 "src/cpu/kernels/CpuActivationKernel.cpp",
Dana Zlotnika538ae52022-02-21 13:12:41 +0200891 "src/runtime/NEON/functions/NEActivationLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +0100892 ],
Michalis Spyrou20fca522021-06-07 14:23:57 +0100893 "neon": {
Dana Zlotnik32291712021-11-25 09:58:27 +0200894 "fp16": [ "src/cpu/kernels/activation/generic/neon/fp16.cpp" ],
ramelg01c827e992022-04-08 03:52:28 +0100895 "fp32": [ "src/cpu/kernels/activation/generic/neon/fp32.cpp" ],
Viet-Hoa Do29db3d22022-08-10 11:56:49 +0100896 "qasymm8": [
897 "src/cpu/kernels/activation/generic/neon/qasymm8.cpp",
898 "src/cpu/kernels/activation/generic/neon/lut.cpp"
899 ],
900 "qasymm8_signed": [
901 "src/cpu/kernels/activation/generic/neon/qasymm8_signed.cpp",
902 "src/cpu/kernels/activation/generic/neon/lut.cpp"
903 ],
Dana Zlotnika538ae52022-02-21 13:12:41 +0200904 "qsymm16": [ "src/cpu/kernels/activation/generic/neon/qsymm16.cpp" ]
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100905 },
906 "sve": {
Dana Zlotnik32291712021-11-25 09:58:27 +0200907 "fp16": [ "src/cpu/kernels/activation/generic/sve/fp16.cpp" ],
SiCong Lic0463a22023-05-17 13:46:13 +0100908 "fp32": [ "src/cpu/kernels/activation/generic/sve/fp32.cpp" ]
ramelg01c827e992022-04-08 03:52:28 +0100909 },
alerah01c9e519d2022-01-31 19:04:10 +0200910 "sve2":{
SiCong Lic0463a22023-05-17 13:46:13 +0100911 "qasymm8": [
912 "src/cpu/kernels/activation/generic/sve2/qasymm8.cpp",
913 "src/cpu/kernels/activation/generic/sve2/lut.cpp"
914 ],
Dana Zlotnik32291712021-11-25 09:58:27 +0200915 "qasymm8_signed": [ "src/cpu/kernels/activation/generic/sve2/qasymm8_signed.cpp" ],
916 "qsymm16": [ "src/cpu/kernels/activation/generic/sve2/qsymm16.cpp" ]
Michalis Spyrou20fca522021-06-07 14:23:57 +0100917 }
918 }
919 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100920 "ArgMinMax": {
921 "deps": [ "Reduction" ],
922 "files": {
923 "common": [ "src/runtime/NEON/functions/NEArgMinMaxLayer.cpp" ]
924 }
925 },
Michalis Spyrou20fca522021-06-07 14:23:57 +0100926 "Add": {
927 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100928 "common": [
929 "src/cpu/operators/CpuAdd.cpp",
930 "src/cpu/kernels/CpuAddKernel.cpp",
Motti Gondabi9d9ad332022-01-23 12:42:24 +0200931 "src/runtime/NEON/functions/NEArithmeticAddition.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +0100932 ],
Dana Zlotnikbd2942d2021-11-15 08:46:04 +0200933 "neon": {
Motti Gondabi9d9ad332022-01-23 12:42:24 +0200934 "common": ["src/cpu/kernels/add/generic/neon/impl.cpp"],
Dana Zlotnikbd2942d2021-11-15 08:46:04 +0200935 "fp32":["src/cpu/kernels/add/generic/neon/fp32.cpp"],
936 "fp16":["src/cpu/kernels/add/generic/neon/fp16.cpp"],
Motti Gondabi9d9ad332022-01-23 12:42:24 +0200937 "integer":["src/cpu/kernels/add/generic/neon/integer.cpp"],
938 "qasymm8": ["src/cpu/kernels/add/generic/neon/qasymm8.cpp"],
939 "qasymm8_signed": ["src/cpu/kernels/add/generic/neon/qasymm8_signed.cpp"],
940 "qsymm16": ["src/cpu/kernels/add/generic/neon/qsymm16.cpp"]
Dana Zlotnikbd2942d2021-11-15 08:46:04 +0200941 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100942 "sve": {
Dana Zlotnikbd2942d2021-11-15 08:46:04 +0200943 "common": [ "src/cpu/kernels/add/generic/sve/impl.cpp" ],
Dana Zlotnikbd2942d2021-11-15 08:46:04 +0200944 "integer":["src/cpu/kernels/add/generic/sve/integer.cpp"],
Motti Gondabi9d9ad332022-01-23 12:42:24 +0200945 "fp32":["src/cpu/kernels/add/generic/sve/fp32.cpp"],
946 "fp16":["src/cpu/kernels/add/generic/sve/fp16.cpp"]
947 },
948 "sve2": {
Dana Zlotnikbd2942d2021-11-15 08:46:04 +0200949 "qasymm8": [ "src/cpu/kernels/add/generic/sve2/qasymm8.cpp" ],
950 "qasymm8_signed": [ "src/cpu/kernels/add/generic/sve2/qasymm8_signed.cpp" ],
951 "qsymm16": [ "src/cpu/kernels/add/generic/sve2/qsymm16.cpp" ]
Michalis Spyrou20fca522021-06-07 14:23:57 +0100952 }
953 }
954 },
Gunes Bayirae72a462023-01-29 13:24:24 +0000955 "AddMulAdd": {
956 "files": {
957 "common": [
958 "src/cpu/operators/CpuAddMulAdd.cpp",
959 "src/cpu/kernels/CpuAddMulAddKernel.cpp",
960 "src/runtime/NEON/functions/NEAddMulAdd.cpp"
961 ],
962 "neon": {
963 "fp32":["src/cpu/kernels/addmuladd/generic/neon/fp32.cpp"],
964 "fp16":["src/cpu/kernels/addmuladd/generic/neon/fp16.cpp"],
965 "qasymm8": ["src/cpu/kernels/addmuladd/generic/neon/qasymm8.cpp"],
966 "qasymm8_signed": ["src/cpu/kernels/addmuladd/generic/neon/qasymm8_signed.cpp"]
967 }
968 }
969 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100970 "BatchNormalize": {
Michalis Spyrou20fca522021-06-07 14:23:57 +0100971 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100972 "common": [
973 "src/core/NEON/kernels/NEBatchNormalizationLayerKernel.cpp",
974 "src/core/NEON/kernels/NEFuseBatchNormalizationKernel.cpp",
975 "src/runtime/NEON/functions/NEBatchNormalizationLayer.cpp",
976 "src/runtime/NEON/functions/NEFuseBatchNormalization.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +0100977 ],
Michalis Spyrou20fca522021-06-07 14:23:57 +0100978 "neon": {
Yair Schwarzbaum41a729e2021-11-15 20:42:47 +0200979 "common": [
Pablo Marquez Tello7e589802023-09-14 09:41:37 +0100980 "src/cpu/kernels/fuse_batch_normalization/nchw/all.cpp"
Yair Schwarzbaum41a729e2021-11-15 20:42:47 +0200981 ],
982 "fp16": [
983 "src/cpu/kernels/fuse_batch_normalization/generic/fp16.cpp",
984 "src/core/NEON/kernels/batchnormalization/impl/NEON/fp16.cpp",
Pablo Marquez Tello8d4cdd42023-11-21 10:10:01 +0000985 "src/cpu/kernels/fuse_batch_normalization/nhwc/neon/fp16.cpp",
986 "src/cpu/kernels/fuse_batch_normalization/nchw/neon/fp16.cpp"
987
Yair Schwarzbaum41a729e2021-11-15 20:42:47 +0200988 ],
989 "fp32": [
990 "src/cpu/kernels/fuse_batch_normalization/generic/fp32.cpp",
991 "src/core/NEON/kernels/batchnormalization/impl/NEON/fp32.cpp",
Pablo Marquez Tello8d4cdd42023-11-21 10:10:01 +0000992 "src/cpu/kernels/fuse_batch_normalization/nhwc/neon/fp32.cpp",
993 "src/cpu/kernels/fuse_batch_normalization/nchw/neon/fp32.cpp"
Yair Schwarzbaum41a729e2021-11-15 20:42:47 +0200994 ]
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100995 },
996 "sve": {
997 "fp16": [ "src/core/NEON/kernels/batchnormalization/impl/SVE/fp16.cpp" ],
998 "fp32": [ "src/core/NEON/kernels/batchnormalization/impl/SVE/fp32.cpp" ]
Michalis Spyrou20fca522021-06-07 14:23:57 +0100999 }
1000 }
1001 },
1002 "BatchToSpace": {
1003 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001004 "common": [
1005 "src/core/NEON/kernels/NEBatchToSpaceLayerKernel.cpp",
1006 "src/runtime/NEON/functions/NEBatchToSpaceLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001007 ]
1008 }
1009 },
1010 "BitwiseAnd": {
1011 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001012 "common": [
1013 "src/core/NEON/kernels/NEBitwiseAndKernel.cpp",
1014 "src/runtime/NEON/functions/NEBitwiseAnd.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001015 ]
1016 }
1017 },
1018 "BitwiseNot": {
1019 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001020 "common": [
1021 "src/core/NEON/kernels/NEBitwiseNotKernel.cpp",
1022 "src/runtime/NEON/functions/NEBitwiseNot.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001023 ]
1024 }
1025 },
1026 "BitwiseOr": {
1027 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001028 "common": [
1029 "src/core/NEON/kernels/NEBitwiseOrKernel.cpp",
1030 "src/runtime/NEON/functions/NEBitwiseOr.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001031 ]
1032 }
1033 },
1034 "BitwiseXor": {
1035 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001036 "common": [
1037 "src/core/NEON/kernels/NEBitwiseXorKernel.cpp",
1038 "src/runtime/NEON/functions/NEBitwiseXor.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001039 ]
1040 }
1041 },
1042 "BoundingBoxTransform": {
1043 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001044 "common": [
1045 "src/core/NEON/kernels/NEBoundingBoxTransformKernel.cpp",
1046 "src/runtime/NEON/functions/NEBoundingBoxTransform.cpp"
Dana Zlotnik3475ffe2022-01-03 14:37:10 +02001047 ],
1048 "neon":{
1049 "common":["src/cpu/kernels/boundingboxtransform/generic/neon/impl.cpp"],
1050 "fp32":["src/cpu/kernels/boundingboxtransform/generic/neon/fp32.cpp"],
1051 "fp16":["src/cpu/kernels/boundingboxtransform/generic/neon/fp16.cpp"],
1052 "qsymm16":["src/cpu/kernels/boundingboxtransform/generic/neon/qsymm16.cpp"]
Dana Zlotnik3475ffe2022-01-03 14:37:10 +02001053 }
Michalis Spyrou20fca522021-06-07 14:23:57 +01001054 }
1055 },
1056 "Cast": {
1057 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001058 "common": [
1059 "src/cpu/operators/CpuCast.cpp",
1060 "src/cpu/kernels/CpuCastKernel.cpp",
Adnan AlSinan40a9d3e2023-09-15 13:46:17 +01001061 "src/runtime/NEON/functions/NECast.cpp"
Yair Schwarzbaum298b2c02022-02-01 08:55:56 +02001062 ],
1063 "neon":{
1064 "fp16":["src/cpu/kernels/cast/generic/neon/fp16.cpp"]
1065 }
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001066 }
1067 },
1068 "ChannelShuffle": {
1069 "files": {
1070 "common": [
1071 "src/core/NEON/kernels/NEChannelShuffleLayerKernel.cpp",
1072 "src/runtime/NEON/functions/NEChannelShuffleLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001073 ]
1074 }
1075 },
1076 "Concatenate": {
1077 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001078 "common": [
1079 "src/cpu/operators/CpuConcatenate.cpp",
Georgios Pinitas7891a732021-08-20 21:39:25 +01001080 "src/cpu/kernels/CpuConcatenateWidthKernel.cpp",
1081 "src/cpu/kernels/CpuConcatenateBatchKernel.cpp",
1082 "src/cpu/kernels/CpuConcatenateDepthKernel.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001083 "src/cpu/kernels/CpuConcatenateHeightKernel.cpp",
1084 "src/runtime/NEON/functions/NEConcatenateLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001085 ]
1086 }
1087 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001088 "Conv2d": {
1089 "deps": [
1090 "Activation",
1091 "ElementwiseBinary",
1092 "FFT2D",
1093 "Gemm",
1094 "Mul",
1095 "Pad",
1096 "Permute",
1097 "Reshape",
1098 "Reverse",
1099 "Slice"
1100 ],
Michalis Spyrou20fca522021-06-07 14:23:57 +01001101 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001102 "common": [
1103 "src/cpu/operators/CpuConv2d.cpp",
1104 "src/cpu/operators/CpuDirectConv2d.cpp",
1105 "src/cpu/operators/CpuGemmDirectConv2d.cpp",
1106 "src/cpu/operators/CpuGemmConv2d.cpp",
1107 "src/cpu/operators/CpuWinogradConv2d.cpp",
1108 "src/cpu/operators/internal/CpuGemmAssemblyDispatch.cpp",
1109 "src/cpu/kernels/CpuDirectConv2dKernel.cpp",
1110 "src/cpu/kernels/CpuDirectConv2dOutputStageKernel.cpp",
1111 "src/cpu/kernels/CpuWinogradConv2dKernel.cpp",
1112 "src/cpu/kernels/CpuCol2ImKernel.cpp",
1113 "src/cpu/kernels/CpuIm2ColKernel.cpp",
1114 "src/cpu/kernels/CpuWeightsReshapeKernel.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001115 "src/runtime/NEON/functions/NEConvolutionLayer.cpp",
1116 "src/runtime/NEON/functions/NEDirectConvolutionLayer.cpp",
1117 "src/runtime/NEON/functions/NEFFTConvolutionLayer.cpp",
1118 "src/runtime/NEON/functions/NEGEMMConv2d.cpp",
1119 "src/runtime/NEON/functions/NEGEMMConvolutionLayer.cpp",
1120 "src/runtime/NEON/functions/NEWinogradConvolutionLayer.cpp"
Motti Gondabi9d9ad332022-01-23 12:42:24 +02001121 ],
1122 "neon": {
1123 "common": [
1124 "src/core/NEON/kernels/convolution/common/padding.cpp",
1125 "src/core/NEON/kernels/convolution/common/qasymm8.cpp",
1126 "src/core/NEON/kernels/convolution/common/qsymm8.cpp",
1127 "src/core/NEON/kernels/convolution/common/utils.cpp",
ramelg01a1f78512022-06-29 16:28:10 +01001128 "src/core/NEON/kernels/convolution/winograd/input_transforms_fp16.cpp",
1129 "src/core/NEON/kernels/convolution/winograd/input_transforms_fp32.cpp",
1130 "src/core/NEON/kernels/convolution/winograd/output_transforms_fp16.cpp",
1131 "src/core/NEON/kernels/convolution/winograd/output_transforms_fp32.cpp",
1132 "src/core/NEON/kernels/convolution/winograd/weight_transforms_fp16.cpp",
1133 "src/core/NEON/kernels/convolution/winograd/weight_transforms_fp32.cpp",
1134 "src/core/NEON/kernels/convolution/winograd/winograd_fp16.cpp",
1135 "src/core/NEON/kernels/convolution/winograd/winograd_fp32.cpp",
1136 "src/core/NEON/kernels/convolution/winograd/input_transforms/a64_fp16_6x6.cpp",
1137 "src/core/NEON/kernels/convolution/winograd/input_transforms/a64_fp32_6x6.cpp",
1138 "src/core/NEON/kernels/convolution/winograd/input_transforms/arm_fp32_1x8.cpp",
1139 "src/core/NEON/kernels/convolution/winograd/input_transforms/arm_fp32_4x4.cpp",
1140 "src/core/NEON/kernels/convolution/winograd/input_transforms/arm_fp32_6x6.cpp",
ramelg01a1f78512022-06-29 16:28:10 +01001141 "src/core/NEON/kernels/convolution/winograd/output_transforms/a64_fp16_4x4_3x3.cpp",
1142 "src/core/NEON/kernels/convolution/winograd/output_transforms/arm_fp32_1x2_1x7.cpp",
1143 "src/core/NEON/kernels/convolution/winograd/output_transforms/arm_fp32_1x4_1x5.cpp",
1144 "src/core/NEON/kernels/convolution/winograd/output_transforms/arm_fp32_1x6_1x3.cpp",
1145 "src/core/NEON/kernels/convolution/winograd/output_transforms/arm_fp32_2x2_3x3.cpp",
1146 "src/core/NEON/kernels/convolution/winograd/output_transforms/arm_fp32_2x2_5x5.cpp",
1147 "src/core/NEON/kernels/convolution/winograd/output_transforms/arm_fp32_4x4_3x3.cpp",
1148 "src/core/NEON/kernels/convolution/winograd/weight_transforms/a64_fp16_4x4_3x3.cpp",
1149 "src/core/NEON/kernels/convolution/winograd/weight_transforms/arm_fp32_2x2_3x3.cpp",
1150 "src/core/NEON/kernels/convolution/winograd/weight_transforms/arm_fp32_2x2_5x5.cpp",
1151 "src/core/NEON/kernels/convolution/winograd/weight_transforms/arm_fp32_4x4_3x3.cpp",
1152 "src/core/NEON/kernels/convolution/winograd/weight_transforms/cpp_fp32_1x2_1x7.cpp",
1153 "src/core/NEON/kernels/convolution/winograd/weight_transforms/cpp_fp32_1x4_1x5.cpp",
1154 "src/core/NEON/kernels/convolution/winograd/weight_transforms/cpp_fp32_1x6_1x3.cpp",
alerah01c9e519d2022-01-31 19:04:10 +02001155 "src/cpu/kernels/directconv2d/nhwc/neon/impl.cpp",
Pablo Marquez Telloe5362e72023-10-16 14:14:14 +01001156 "src/cpu/kernels/directconv2d/nhwc/neon/qasymm8.cpp",
alerah01c9e519d2022-01-31 19:04:10 +02001157 "src/cpu/kernels/directconv2d/nchw/all.cpp"
Pablo Marquez Telloe5362e72023-10-16 14:14:14 +01001158
alerah01c9e519d2022-01-31 19:04:10 +02001159 ],
1160 "fp32": [
1161 "src/cpu/kernels/directconv2d/nhwc/neon/fp32.cpp"
Pablo Marquez Telloe5362e72023-10-16 14:14:14 +01001162 ],
1163 "fp16": [
1164 "src/cpu/kernels/directconv2d/nchw/fp16.cpp",
1165 "src/cpu/kernels/directconv2d/nhwc/neon/fp16.cpp"
Motti Gondabi9d9ad332022-01-23 12:42:24 +02001166 ]
ramelg0199c46472022-07-15 13:08:39 +01001167 },
1168 "sve": {
Viet-Hoa Do03b29712022-06-01 11:47:14 +01001169 "common": [
1170 "src/core/NEON/kernels/convolution/winograd/input_transforms/sve_fp32_6x6.cpp",
1171 "src/core/NEON/kernels/convolution/winograd/input_transforms/sme_fp32_mla_6x6.cpp",
1172 "src/core/NEON/kernels/convolution/winograd/output_transforms/sme_fp32_mopa_4x4_3x3.cpp"
1173 ]
Motti Gondabi9d9ad332022-01-23 12:42:24 +02001174 }
Michalis Spyroub55f8e82021-07-22 11:23:11 +01001175 }
1176 },
Michalis Spyrou20fca522021-06-07 14:23:57 +01001177 "Copy": {
1178 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001179 "common": [
1180 "src/cpu/operators/CpuCopy.cpp",
1181 "src/cpu/kernels/CpuCopyKernel.cpp",
1182 "src/runtime/NEON/functions/NECopy.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001183 ]
1184 }
1185 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001186 "CropResize": {
1187 "deps": [ "Scale" ],
Michalis Spyrou20fca522021-06-07 14:23:57 +01001188 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001189 "common": [
1190 "src/core/NEON/kernels/NECropKernel.cpp",
1191 "src/runtime/NEON/functions/NECropResize.cpp"
alerah0127619932021-11-24 17:21:43 +02001192 ],
1193 "neon": {
alerah0127619932021-11-24 17:21:43 +02001194 "fp32": [ "src/cpu/kernels/crop/generic/neon/fp32.cpp" ],
1195 "fp16": [ "src/cpu/kernels/crop/generic/neon/fp16.cpp" ],
1196 "integer": [ "src/cpu/kernels/crop/generic/neon/integer.cpp" ]
Motti Gondabi9d9ad332022-01-23 12:42:24 +02001197 }
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001198 }
1199 },
1200 "Deconv2d": {
1201 "deps": [ "Conv2d", "Reverse", "Transpose"],
1202 "files": {
1203 "common": [
1204 "src/runtime/NEON/functions/NEDeconvolutionLayer.cpp"
1205 ]
1206 }
1207 },
1208 "DepthConvert": {
1209 "deps": [ "Cast"],
1210 "files": {
1211 "common": [
1212 "src/runtime/NEON/functions/NEDepthConvertLayer.cpp"
1213 ]
1214 }
1215 },
1216 "DepthToSpace": {
1217 "files": {
1218 "common": [
1219 "src/core/NEON/kernels/NEDepthToSpaceLayerKernel.cpp",
Viet-Hoa Do47370942023-11-13 17:20:45 +00001220 "src/runtime/NEON/functions/NEDepthToSpaceLayer.cpp",
1221 "src/cpu/kernels/depth_to_space/nhwc/any/impl.cpp",
1222 "src/cpu/kernels/depth_to_space/nchw/any/impl.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001223 ]
1224 }
1225 },
1226 "DepthwiseConv2d": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001227 "deps": [ "Activation", "Permute" ],
Michalis Spyrou20fca522021-06-07 14:23:57 +01001228 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001229 "common": [
Georgios Pinitas7891a732021-08-20 21:39:25 +01001230 "src/cpu/operators/CpuDepthwiseConv2d.cpp",
1231 "src/cpu/operators/CpuDepthwiseConv2dAssemblyDispatch.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001232 "src/cpu/kernels/CpuDepthwiseConv2dNativeKernel.cpp",
1233 "src/cpu/kernels/internal/CpuDepthwiseConv2dAssemblyWrapperKernel.cpp",
Motti Gondabi9d9ad332022-01-23 12:42:24 +02001234 "src/runtime/NEON/functions/NEDepthwiseConvolutionLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001235 ],
Motti Gondabi9d9ad332022-01-23 12:42:24 +02001236 "neon": {
1237 "common": [
1238 "src/core/NEON/kernels/convolution/common/padding.cpp",
1239 "src/core/NEON/kernels/convolution/common/qasymm8.cpp",
1240 "src/core/NEON/kernels/convolution/common/qsymm8.cpp",
1241 "src/core/NEON/kernels/convolution/common/utils.cpp",
ramelg01c827e992022-04-08 03:52:28 +01001242 "src/core/NEON/kernels/arm_conv/addressing.cpp",
Pablo Marquez Tello4e2bbbb2023-01-09 17:21:01 +00001243 "src/core/NEON/kernels/arm_conv/depthwise/depthwise_common.cpp",
ramelg018a164882022-04-07 02:42:52 +01001244 "src/core/NEON/kernels/arm_conv/depthwise/depthwise_strategies_common.cpp",
Motti Gondabi9d9ad332022-01-23 12:42:24 +02001245 "src/core/NEON/kernels/arm_conv/depthwise/depthwise_u8q.cpp",
1246 "src/core/NEON/kernels/arm_conv/depthwise/depthwise_u8s8u8q.cpp",
Motti Gondabi9d9ad332022-01-23 12:42:24 +02001247 "src/core/NEON/kernels/arm_conv/depthwise/depthwise_s8q.cpp",
1248 "src/core/NEON/kernels/arm_conv/depthwise/depthwise_fp32.cpp",
Motti Gondabi9d9ad332022-01-23 12:42:24 +02001249 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_packed_to_nhwc_3x3_s2_with_multiplier_output3x3_mla_depthfirst/generic.cpp",
1250 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_packed_to_nhwc_5x5_s1_with_multiplier_output2x4_mla_depthfirst/generic.cpp",
1251 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_packed_to_nhwc_generic_with_multiplier_output2x8_mla_depthfirst/generic.cpp",
1252 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_s8q_packed_to_nhwc_3x3_s2_with_multiplier_output2x4_dot_depthfirst/generic.cpp",
1253 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_s8q_packed_to_nhwc_5x5_s1_with_multiplier_output4x2_dot_depthfirst/generic.cpp",
1254 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_s8q_packed_to_nhwc_generic_with_multiplier_output2x8_mla_depthfirst/generic.cpp",
1255 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8q_packed_to_nhwc_3x3_s2_with_multiplier_output2x4_dot_depthfirst/generic.cpp",
1256 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8q_packed_to_nhwc_5x5_s1_with_multiplier_output4x2_dot_depthfirst/generic.cpp",
1257 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8q_packed_to_nhwc_generic_with_multiplier_output2x8_mla_depthfirst/generic.cpp",
1258 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8s8u8q_packed_to_nhwc_generic_with_multiplier_output2x8_mla_depthfirst/generic.cpp",
Motti Gondabi9d9ad332022-01-23 12:42:24 +02001259 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_nhwc_3x3_s1_output2x2_mla_depthfirst/generic_direct.cpp",
1260 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_nhwc_3x3_s1_output2x2_mla_depthfirst/generic_indirect.cpp",
1261 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_nhwc_3x3_s1_output3x3_mla_depthfirst/generic_direct.cpp",
1262 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_nhwc_3x3_s1_output3x3_mla_depthfirst/generic_indirect.cpp",
1263 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_nhwc_3x3_s1_output4x4_mla_depthfirst/generic_direct.cpp",
1264 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_nhwc_3x3_s1_output4x4_mla_depthfirst/generic_indirect.cpp",
1265 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_nhwc_3x3_s2_output2x2_mla_depthfirst/generic_direct.cpp",
1266 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_nhwc_3x3_s2_output2x2_mla_depthfirst/generic_indirect.cpp",
1267 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_nhwc_5x5_s1_output2x2_mla_depthfirst/generic_direct.cpp",
1268 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_nhwc_5x5_s1_output2x2_mla_depthfirst/generic_indirect.cpp",
1269 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_nhwc_generic_output9_mla_depthfirst/generic.cpp",
1270 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_s8q_nhwc_3x3_s1_output2x2_dot_depthfirst/generic.cpp",
1271 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_s8q_nhwc_3x3_s1_output2x2_mla_depthfirst/generic.cpp",
1272 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_s8q_nhwc_3x3_s2_output2x2_mla_depthfirst/generic.cpp",
1273 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_s8q_nhwc_5x5_s1_output2x2_mla_depthfirst/generic.cpp",
1274 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_s8q_nhwc_generic_output9_mla_depthfirst/generic.cpp",
1275 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_s8qs_nhwc_3x3_s1_output2x2_dot_depthfirst/generic.cpp",
1276 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8q_nhwc_3x3_s1_output2x2_dot_depthfirst/generic.cpp",
1277 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8q_nhwc_3x3_s1_output2x2_mla_depthfirst/generic.cpp",
1278 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8q_nhwc_3x3_s2_output2x2_mla_depthfirst/generic.cpp",
1279 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8q_nhwc_5x5_s1_output2x2_mla_depthfirst/generic.cpp",
1280 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8q_nhwc_generic_output9_mla_depthfirst/generic.cpp",
1281 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8s8u8q_nhwc_3x3_s1_output2x2_mla_depthfirst/generic.cpp",
1282 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8s8u8q_nhwc_3x3_s2_output2x2_mla_depthfirst/generic.cpp",
1283 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8s8u8q_nhwc_5x5_s1_output2x2_mla_depthfirst/generic.cpp",
1284 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8s8u8q_nhwc_generic_output9_mla_depthfirst/generic.cpp",
ramelg018a164882022-04-07 02:42:52 +01001285 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8qa_nhwc_3x3_s1_output2x2_mla_depthfirst/generic.cpp",
1286 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8qa_nhwc_3x3_s2_output2x2_mla_depthfirst/generic.cpp",
1287 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8qa_nhwc_5x5_s1_output2x2_mla_depthfirst/generic.cpp",
Motti Gondabi9d9ad332022-01-23 12:42:24 +02001288 "src/core/NEON/kernels/arm_conv/depthwise/interleaves/a64_s8q_3x3_dot.cpp",
ramelg01c827e992022-04-08 03:52:28 +01001289 "src/core/NEON/kernels/arm_conv/depthwise/interleaves/a64_u8q_3x3_dot.cpp",
ramelg018a164882022-04-07 02:42:52 +01001290 "src/core/NEON/kernels/arm_conv/depthwise/interleaves/generic.cpp",
1291 "src/core/NEON/kernels/arm_conv/depthwise/interleaves/generic_quantized_dot_product.cpp",
Michael Tyler8deee9b2023-06-30 11:26:05 +01001292 "src/core/NEON/kernels/arm_conv/depthwise/premultiply.cpp",
Dana Zlotnikebbae942022-02-03 12:52:15 +02001293 "src/cpu/kernels/depthwiseconv2d/generic/neon/impl.cpp"
ramelg01a1f78512022-06-29 16:28:10 +01001294 ],
Pablo Marquez Tello64f4a302023-11-06 15:15:53 +00001295 "fp16":[
1296 "src/cpu/kernels/depthwiseconv2d/generic/neon/fp16.cpp",
1297 "src/core/NEON/kernels/arm_conv/depthwise/depthwise_fp16.cpp",
1298 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_nhwc_3x3_s1_output2x2_mla_depthfirst/generic_direct.cpp",
1299 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_nhwc_3x3_s1_output2x2_mla_depthfirst/generic_indirect.cpp",
1300 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_nhwc_3x3_s1_output3x3_mla_depthfirst/generic_direct.cpp",
1301 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_nhwc_3x3_s1_output3x3_mla_depthfirst/generic_indirect.cpp",
1302 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_nhwc_3x3_s1_output4x4_mla_depthfirst/generic_direct.cpp",
1303 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_nhwc_3x3_s1_output4x4_mla_depthfirst/generic_indirect.cpp",
1304 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_nhwc_3x3_s2_output2x2_mla_depthfirst/generic_direct.cpp",
1305 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_packed_to_nhwc_generic_with_multiplier_output2x8_mla_depthfirst/generic.cpp",
1306 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_nhwc_3x3_s2_output2x2_mla_depthfirst/generic_indirect.cpp",
1307 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_nhwc_5x5_s1_output2x2_mla_depthfirst/generic_direct.cpp",
1308 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_nhwc_5x5_s1_output2x2_mla_depthfirst/generic_indirect.cpp",
1309 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_nhwc_generic_output9_mla_depthfirst/generic.cpp"
1310 ],
ramelg01a1f78512022-06-29 16:28:10 +01001311 "fp32":["src/cpu/kernels/depthwiseconv2d/generic/neon/fp32.cpp"],
1312 "qasymm8":["src/cpu/kernels/depthwiseconv2d/generic/neon/qasymm8.cpp"],
Dana Zlotnikebbae942022-02-03 12:52:15 +02001313 "qasymm8_signed":["src/cpu/kernels/depthwiseconv2d/generic/neon/qasymm8_signed.cpp"]
Motti Gondabi9d9ad332022-01-23 12:42:24 +02001314 },
Michalis Spyrou20fca522021-06-07 14:23:57 +01001315 "sve": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001316 "common": [
Michalis Spyrou20fca522021-06-07 14:23:57 +01001317 "src/core/NEON/kernels/arm_conv/depthwise/interleaves/sve_s8q_3x3_dot.cpp",
1318 "src/core/NEON/kernels/arm_conv/depthwise/interleaves/sve_u8q_3x3_dot.cpp",
1319 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp16_nhwc_3x3_s1_output2x2_mla_depthfirst/generic_direct.cpp",
1320 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp16_nhwc_3x3_s1_output2x2_mla_depthfirst/generic_indirect.cpp",
1321 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp16_nhwc_3x3_s1_output3x3_mla_depthfirst/generic_direct.cpp",
1322 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp16_nhwc_3x3_s1_output3x3_mla_depthfirst/generic_indirect.cpp",
1323 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp16_nhwc_3x3_s1_output4x4_mla_depthfirst/generic_direct.cpp",
1324 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp16_nhwc_3x3_s1_output4x4_mla_depthfirst/generic_indirect.cpp",
1325 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp16_nhwc_3x3_s2_output2x2_mla_depthfirst/generic_direct.cpp",
1326 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp16_nhwc_3x3_s2_output2x2_mla_depthfirst/generic_indirect.cpp",
1327 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp16_nhwc_5x5_s1_output2x2_mla_depthfirst/generic_direct.cpp",
1328 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp16_nhwc_5x5_s1_output2x2_mla_depthfirst/generic_indirect.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +01001329 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_nhwc_3x3_s1_output2x2_mla_depthfirst/generic_direct.cpp",
1330 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_nhwc_3x3_s1_output2x2_mla_depthfirst/generic_indirect.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +01001331 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_nhwc_3x3_s1_output3x3_mla_depthfirst/generic_direct.cpp",
1332 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_nhwc_3x3_s1_output3x3_mla_depthfirst/generic_indirect.cpp",
1333 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_nhwc_3x3_s1_output4x4_mla_depthfirst/generic_direct.cpp",
1334 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_nhwc_3x3_s1_output4x4_mla_depthfirst/generic_indirect.cpp",
1335 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_nhwc_3x3_s2_output2x2_mla_depthfirst/generic_direct.cpp",
1336 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_nhwc_3x3_s2_output2x2_mla_depthfirst/generic_indirect.cpp",
1337 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_nhwc_5x5_s1_output2x2_mla_depthfirst/generic_direct.cpp",
1338 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_nhwc_5x5_s1_output2x2_mla_depthfirst/generic_indirect.cpp",
1339 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_nhwc_generic_output9_mla_depthfirst/generic.cpp",
1340 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_packed_to_nhwc_3x3_s2_with_multiplier_output3x3_mla_depthfirst/generic.cpp",
1341 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_packed_to_nhwc_5x5_s1_with_multiplier_output2x4_mla_depthfirst/generic.cpp",
1342 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_packed_to_nhwc_generic_with_multiplier_output2x8_mla_depthfirst/generic.cpp",
1343 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_s8q_nhwc_3x3_s1_output2x2_dot_depthfirst/generic.cpp",
1344 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_s8q_nhwc_3x3_s1_output2x2_mla_depthfirst/generic.cpp",
1345 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_s8q_nhwc_3x3_s2_output2x2_mla_depthfirst/generic.cpp",
1346 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_s8q_nhwc_5x5_s1_output2x2_mla_depthfirst/generic.cpp",
1347 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_s8q_packed_to_nhwc_3x3_s2_with_multiplier_output2x4_dot_depthfirst/generic.cpp",
1348 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_s8q_packed_to_nhwc_5x5_s1_with_multiplier_output4x2_dot_depthfirst/generic.cpp",
1349 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_s8qs_nhwc_3x3_s1_output2x2_dot_depthfirst/generic.cpp",
1350 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_u8q_nhwc_3x3_s1_output2x2_dot_depthfirst/generic.cpp",
1351 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_u8q_nhwc_3x3_s1_output2x2_mla_depthfirst/generic.cpp",
1352 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_u8q_nhwc_3x3_s2_output2x2_mla_depthfirst/generic.cpp",
1353 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_u8q_nhwc_5x5_s1_output2x2_mla_depthfirst/generic.cpp",
1354 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_u8q_packed_to_nhwc_3x3_s2_with_multiplier_output2x4_dot_depthfirst/generic.cpp",
1355 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_u8q_packed_to_nhwc_5x5_s1_with_multiplier_output4x2_dot_depthfirst/generic.cpp",
1356 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_u8s8u8q_nhwc_3x3_s1_output2x2_mla_depthfirst/generic.cpp",
1357 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_u8s8u8q_nhwc_3x3_s2_output2x2_mla_depthfirst/generic.cpp",
Viet-Hoa Do03b29712022-06-01 11:47:14 +01001358 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_u8s8u8q_nhwc_5x5_s1_output2x2_mla_depthfirst/generic.cpp",
David Mansellb2758f32023-03-30 19:10:52 +01001359 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp16_nhwc_3x3_s1_output2x2_mla_depthfirst/generic_direct.cpp",
1360 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp16_nhwc_3x3_s1_output2x2_mla_depthfirst/generic_indirect.cpp",
1361 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp16_nhwc_3x3_s1_output3x3_mla_depthfirst/generic_direct.cpp",
1362 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp16_nhwc_3x3_s1_output3x3_mla_depthfirst/generic_indirect.cpp",
1363 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp16_nhwc_3x3_s1_output4x4_mla_depthfirst/generic_direct.cpp",
1364 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp16_nhwc_3x3_s1_output4x4_mla_depthfirst/generic_indirect.cpp",
1365 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp16_nhwc_3x3_s2_output2x2_mla_depthfirst/generic_direct.cpp",
1366 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp16_nhwc_3x3_s2_output2x2_mla_depthfirst/generic_indirect.cpp",
1367 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp16_nhwc_5x5_s1_output2x2_mla_depthfirst/generic_direct.cpp",
1368 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp16_nhwc_5x5_s1_output2x2_mla_depthfirst/generic_indirect.cpp",
Viet-Hoa Do03b29712022-06-01 11:47:14 +01001369 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32_nhwc_3x3_s1_output2x2_mla_depthfirst/generic_direct.cpp",
1370 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32_nhwc_3x3_s1_output2x2_mla_depthfirst/generic_indirect.cpp",
1371 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32_nhwc_3x3_s1_output3x3_mla_depthfirst/generic_direct.cpp",
1372 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32_nhwc_3x3_s1_output3x3_mla_depthfirst/generic_indirect.cpp",
1373 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32_nhwc_3x3_s1_output4x4_mla_depthfirst/generic_direct.cpp",
1374 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32_nhwc_3x3_s1_output4x4_mla_depthfirst/generic_indirect.cpp",
1375 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32_nhwc_3x3_s2_output2x2_mla_depthfirst/generic_direct.cpp",
1376 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32_nhwc_3x3_s2_output2x2_mla_depthfirst/generic_indirect.cpp",
1377 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32_planar_3x3_s1_4rows_mla_za/generic.cpp",
1378 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32_planar_3x3_s2_4rows_mla_za/generic.cpp",
1379 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32_planar_5x5_s1_4rows_mla_za/generic.cpp",
1380 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32_planar_5x5_s2_4rows_mla_za/generic.cpp",
1381 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32bf16fp32_planar_3x3_s1_4rows_dot_za/generic.cpp",
1382 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32bf16fp32_planar_3x3_s2_4rows_dot_za/generic.cpp",
1383 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32bf16fp32_planar_5x5_s1_4rows_dot_za/generic.cpp",
1384 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32bf16fp32_planar_5x5_s2_4rows_dot_za/generic.cpp",
1385 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_s8q_planar_3x3_s1_4rows_dot_za/generic.cpp",
Viet-Hoa Do03b29712022-06-01 11:47:14 +01001386 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_s8q_planar_3x3_s2_4rows_dot_za/generic.cpp",
1387 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_s8q_planar_5x5_s1_4rows_dot_za/generic.cpp",
1388 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_s8q_planar_5x5_s2_4rows_dot_za/generic.cpp",
1389 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_u8q_planar_3x3_s1_4rows_dot_za/generic.cpp",
Viet-Hoa Do03b29712022-06-01 11:47:14 +01001390 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_u8q_planar_3x3_s2_4rows_dot_za/generic.cpp",
1391 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_u8q_planar_5x5_s1_4rows_dot_za/generic.cpp",
1392 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_u8q_planar_5x5_s2_4rows_dot_za/generic.cpp",
1393 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_u8s8u8q_planar_3x3_s1_4rows_dot_za/generic.cpp",
Viet-Hoa Do03b29712022-06-01 11:47:14 +01001394 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_u8s8u8q_planar_3x3_s2_4rows_dot_za/generic.cpp",
1395 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_u8s8u8q_planar_5x5_s1_4rows_dot_za/generic.cpp",
1396 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_u8s8u8q_planar_5x5_s2_4rows_dot_za/generic.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001397 ]
1398 }
1399 }
1400 },
Michalis Spyrou20fca522021-06-07 14:23:57 +01001401 "Dequantize": {
1402 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001403 "common": [
1404 "src/cpu/operators/CpuDequantize.cpp",
1405 "src/cpu/kernels/CpuDequantizeKernel.cpp",
1406 "src/runtime/NEON/functions/NEDequantizationLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001407 ]
1408 }
1409 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001410 "DetectionPostProcess": {
1411 "deps": [ "Dequantize" ],
Michalis Spyrou20fca522021-06-07 14:23:57 +01001412 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001413 "common" : [ "src/runtime/NEON/functions/NEDetectionPostProcessLayer.cpp" ]
Michalis Spyrou20fca522021-06-07 14:23:57 +01001414 }
1415 },
Sheri Zhang6d9c9822021-09-24 16:02:57 +01001416 "Conv3d": {
1417 "deps": [
1418 "Activation"
1419 ],
1420 "files": {
1421 "common": [
1422 "src/cpu/operators/CpuDirectConv3d.cpp",
1423 "src/cpu/kernels/CpuDirectConv3dKernel.cpp",
1424 "src/runtime/NEON/functions/NEConv3D.cpp"
1425 ]
1426 }
1427 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001428 "ElementwiseBinary": {
Michalis Spyrou20fca522021-06-07 14:23:57 +01001429 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001430 "common": [
1431 "src/cpu/operators/CpuElementwise.cpp",
1432 "src/cpu/kernels/CpuElementwiseKernel.cpp",
Dana Zlotnik6a2df882022-01-17 09:54:26 +02001433 "src/runtime/NEON/functions/NEElementwiseOperations.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001434 ],
Dana Zlotnikd5c496d2021-11-28 14:46:12 +02001435 "neon":{
1436 "fp32": ["src/cpu/kernels/elementwise_binary/generic/neon/fp32.cpp"],
1437 "fp16": ["src/cpu/kernels/elementwise_binary/generic/neon/fp16.cpp"],
Dana Zlotnik6a2df882022-01-17 09:54:26 +02001438 "integer": ["src/cpu/kernels/elementwise_binary/generic/neon/integer.cpp"],
1439 "qasymm8": ["src/cpu/kernels/elementwise_binary/generic/neon/qasymm8.cpp"],
1440 "qasymm8_signed": ["src/cpu/kernels/elementwise_binary/generic/neon/qasymm8_signed.cpp"]
Dana Zlotnikd5c496d2021-11-28 14:46:12 +02001441 },
Michalis Spyrou20fca522021-06-07 14:23:57 +01001442 "sve": {
Dana Zlotnikd5c496d2021-11-28 14:46:12 +02001443 "common": ["src/cpu/kernels/elementwise_binary/generic/sve/impl.cpp" ],
1444 "integer": ["src/cpu/kernels/elementwise_binary/generic/sve/integer.cpp"],
1445 "fp32": ["src/cpu/kernels/elementwise_binary/generic/sve/fp32.cpp"],
Dana Zlotnik6a2df882022-01-17 09:54:26 +02001446 "fp16": ["src/cpu/kernels/elementwise_binary/generic/sve/fp16.cpp"]
1447
ramelg01a1f78512022-06-29 16:28:10 +01001448 },
Dana Zlotnik6a2df882022-01-17 09:54:26 +02001449 "sve2":{
Dana Zlotnikd5c496d2021-11-28 14:46:12 +02001450 "qasymm8": ["src/cpu/kernels/elementwise_binary/generic/sve2/qasymm8.cpp"],
1451 "qasymm8_signed": ["src/cpu/kernels/elementwise_binary/generic/sve2/qasymm8_signed.cpp"]
Michalis Spyrou20fca522021-06-07 14:23:57 +01001452 }
1453 }
1454 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001455 "ElementwiseUnary":{
Viet-Hoa Dofd472f02023-03-15 14:05:06 +00001456 "deps": [ "LUT" ],
Michalis Spyrou20fca522021-06-07 14:23:57 +01001457 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001458 "common": [
1459 "src/cpu/operators/CpuElementwiseUnary.cpp",
1460 "src/cpu/kernels/CpuElementwiseUnaryKernel.cpp",
1461 "src/runtime/NEON/functions/NEElementwiseUnaryLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001462 ],
Dana Zlotnikd5c496d2021-11-28 14:46:12 +02001463 "neon": {
1464 "integer": ["src/cpu/kernels/elementwise_unary/generic/neon/integer.cpp"],
1465 "fp32": ["src/cpu/kernels/elementwise_unary/generic/neon/fp32.cpp"],
Viet-Hoa Dofd472f02023-03-15 14:05:06 +00001466 "fp16": ["src/cpu/kernels/elementwise_unary/generic/neon/fp16.cpp"],
Ramy Elgammal8b7f42a2023-03-31 16:16:15 +01001467 "qasymm8": [
1468 "src/cpu/kernels/elementwise_unary/generic/neon/q8.cpp",
1469 "src/cpu/kernels/elementwise_unary/generic/neon/qasymm8.cpp"
1470 ],
1471 "qasymm8_signed": [
1472 "src/cpu/kernels/elementwise_unary/generic/neon/q8.cpp",
1473 "src/cpu/kernels/elementwise_unary/generic/neon/qasymm8_signed.cpp"
1474 ]
Dana Zlotnikd5c496d2021-11-28 14:46:12 +02001475 },
Michalis Spyrou20fca522021-06-07 14:23:57 +01001476 "sve": {
Dana Zlotnikd5c496d2021-11-28 14:46:12 +02001477 "common": ["src/cpu/kernels/elementwise_unary/generic/sve/impl.cpp" ],
1478 "integer": ["src/cpu/kernels/elementwise_unary/generic/sve/integer.cpp"],
1479 "fp32": ["src/cpu/kernels/elementwise_unary/generic/sve/fp32.cpp"],
SiCong Lic0463a22023-05-17 13:46:13 +01001480 "fp16": ["src/cpu/kernels/elementwise_unary/generic/sve/fp16.cpp"]
1481 },
1482 "sve2": {
1483 "qasymm8": ["src/cpu/kernels/elementwise_unary/generic/sve2/q8.cpp"],
1484 "qasymm8_signed": ["src/cpu/kernels/elementwise_unary/generic/sve2/q8.cpp"]
Michalis Spyrou20fca522021-06-07 14:23:57 +01001485 }
1486 }
1487 },
1488 "FFT1D": {
Freddie Liardet487d3902021-09-21 12:36:43 +01001489 "deps": [ "Reduction" ],
Michalis Spyrou20fca522021-06-07 14:23:57 +01001490 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001491 "common": [
Michalis Spyrou20fca522021-06-07 14:23:57 +01001492 "src/core/NEON/kernels/NEFFTDigitReverseKernel.cpp",
1493 "src/core/NEON/kernels/NEFFTRadixStageKernel.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001494 "src/core/NEON/kernels/NEFFTScaleKernel.cpp",
1495 "src/runtime/NEON/functions/NEFFT1D.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001496 ]
1497 }
1498 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001499 "FFT2D": {
1500 "deps": [ "FFT1D" ],
Michalis Spyrou20fca522021-06-07 14:23:57 +01001501 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001502 "common": [
1503 "src/runtime/NEON/functions/NEFFT2D.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001504 ]
1505 }
1506 },
1507 "Fill": {
1508 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001509 "common": [
1510 "src/cpu/operators/CpuFill.cpp",
1511 "src/cpu/kernels/CpuFillKernel.cpp",
1512 "src/runtime/NEON/functions/NEFill.cpp"
1513 ]
1514 }
1515 },
1516 "Flatten": {
1517 "deps": [ "Reshape" ],
1518 "files": {
1519 "common": [
1520 "src/cpu/operators/CpuFlatten.cpp",
1521 "src/runtime/NEON/functions/NEFlattenLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001522 ]
1523 }
1524 },
1525 "Floor": {
1526 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001527 "common": [
1528 "src/cpu/operators/CpuFloor.cpp",
1529 "src/cpu/kernels/CpuFloorKernel.cpp",
1530 "src/runtime/NEON/functions/NEFloor.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001531 ],
1532 "neon": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001533 "fp32": [ "src/cpu/kernels/floor/neon/fp32.cpp" ],
1534 "fp16": [ "src/cpu/kernels/floor/neon/fp16.cpp" ]
Michalis Spyrou20fca522021-06-07 14:23:57 +01001535 }
1536 }
1537 },
Michele Di Giorgiod9cdf142021-07-02 15:17:08 +01001538 "FullyConnected": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001539 "deps": [ "Flatten", "Gemm", "Transpose"],
Michele Di Giorgiod9cdf142021-07-02 15:17:08 +01001540 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001541 "common": [
1542 "src/cpu/kernels/CpuConvertFullyConnectedWeightsKernel.cpp",
1543 "src/cpu/operators/CpuConvertFullyConnectedWeights.cpp",
1544 "src/cpu/operators/CpuFullyConnected.cpp",
1545 "src/runtime/NEON/functions/NEConvertFullyConnectedWeights.cpp",
1546 "src/runtime/NEON/functions/NEFullyConnectedLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001547 ]
1548 }
1549 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001550 "Gather": {
Michalis Spyrou20fca522021-06-07 14:23:57 +01001551 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001552 "common": [
1553 "src/core/NEON/kernels/NEGatherKernel.cpp",
1554 "src/runtime/NEON/functions/NEGather.cpp"
1555 ]
1556 }
1557 },
1558 "Gemm": {
Freddie Liardet487d3902021-09-21 12:36:43 +01001559 "deps": [ "Quantize", "Add"],
Francesco.Petrogalli@arm.com5fcf22d2022-04-05 10:31:08 +00001560 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001561 "common": [
1562 "src/cpu/kernels/CpuConvertQuantizedSignednessKernel.cpp",
Georgios Pinitas7891a732021-08-20 21:39:25 +01001563 "src/cpu/kernels/CpuGemmMatrixAdditionKernel.cpp",
1564 "src/cpu/kernels/CpuGemmMatrixMultiplyKernel.cpp",
1565 "src/cpu/kernels/CpuGemmTranspose1xWKernel.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001566 "src/cpu/kernels/CpuGemmInterleave4x4Kernel.cpp",
Georgios Pinitas7891a732021-08-20 21:39:25 +01001567 "src/cpu/kernels/CpuGemmLowpQuantizeDownInt32ScaleKernel.cpp",
1568 "src/cpu/kernels/CpuGemmLowpQuantizeDownInt32ToInt16ScaleByFixedPointKernel.cpp",
1569 "src/cpu/kernels/CpuGemmLowpQuantizeDownInt32ToInt8ScaleByFixedPointKernel.cpp",
1570 "src/cpu/kernels/CpuGemmLowpQuantizeDownInt32ToUint8ScaleByFixedPointKernel.cpp",
1571 "src/cpu/kernels/CpuGemmLowpMatrixMultiplyKernel.cpp",
1572 "src/cpu/kernels/CpuGemmLowpMatrixReductionKernel.cpp",
1573 "src/cpu/kernels/CpuGemmLowpOffsetContributionOutputStageKernel.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001574 "src/cpu/kernels/CpuGemmLowpOffsetContributionKernel.cpp",
1575 "src/cpu/operators/CpuGemm.cpp",
1576 "src/cpu/operators/CpuGemmLowpOutputStage.cpp",
1577 "src/cpu/operators/CpuGemmLowpMatrixMultiplyCore.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001578 "src/runtime/NEON/functions/NEGEMM.cpp",
1579 "src/runtime/NEON/functions/NEGEMMLowpMatrixMultiplyCore.cpp",
Motti Gondabi9d9ad332022-01-23 12:42:24 +02001580 "src/runtime/NEON/functions/NEGEMMLowpOutputStage.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001581 ],
1582 "neon": {
Motti Gondabi9d9ad332022-01-23 12:42:24 +02001583 "common": [
1584 "src/core/NEON/kernels/arm_gemm/gemm_bf16.cpp",
1585 "src/core/NEON/kernels/arm_gemm/gemm_fp16.cpp",
1586 "src/core/NEON/kernels/arm_gemm/gemm_fp32.cpp",
1587 "src/core/NEON/kernels/arm_gemm/gemm_int16.cpp",
1588 "src/core/NEON/kernels/arm_gemm/gemm_int8.cpp",
1589 "src/core/NEON/kernels/arm_gemm/gemm_qint8.cpp",
1590 "src/core/NEON/kernels/arm_gemm/gemm_quint8.cpp",
1591 "src/core/NEON/kernels/arm_gemm/gemm_uint16.cpp",
1592 "src/core/NEON/kernels/arm_gemm/gemm_uint8.cpp",
1593 "src/core/NEON/kernels/arm_gemm/interleave_indirect.cpp",
1594 "src/core/NEON/kernels/arm_gemm/mergeresults-fp16.cpp",
1595 "src/core/NEON/kernels/arm_gemm/mergeresults.cpp",
1596 "src/core/NEON/kernels/arm_gemm/misc.cpp",
1597 "src/core/NEON/kernels/arm_gemm/quantized.cpp",
1598 "src/core/NEON/kernels/arm_gemm/rowsum_indirect_s8.cpp",
1599 "src/core/NEON/kernels/arm_gemm/rowsum_indirect_u8.cpp",
1600 "src/core/NEON/kernels/arm_gemm/transform.cpp",
1601 "src/core/NEON/kernels/arm_gemm/kernels/a64_gemm_s16_8x12/generic.cpp",
1602 "src/core/NEON/kernels/arm_gemm/kernels/a64_gemm_s8_4x4/generic.cpp",
1603 "src/core/NEON/kernels/arm_gemm/kernels/a64_gemm_s8_8x12/a55r1.cpp",
1604 "src/core/NEON/kernels/arm_gemm/kernels/a64_gemm_s8_8x12/generic.cpp",
1605 "src/core/NEON/kernels/arm_gemm/kernels/a64_gemm_s8_8x12/x1.cpp",
1606 "src/core/NEON/kernels/arm_gemm/kernels/a64_gemm_u16_8x12/generic.cpp",
1607 "src/core/NEON/kernels/arm_gemm/kernels/a64_gemm_u8_4x4/generic.cpp",
1608 "src/core/NEON/kernels/arm_gemm/kernels/a64_gemm_u8_8x12/a55r1.cpp",
1609 "src/core/NEON/kernels/arm_gemm/kernels/a64_gemm_u8_8x12/generic.cpp",
1610 "src/core/NEON/kernels/arm_gemm/kernels/a64_gemm_u8_8x12/x1.cpp",
1611 "src/core/NEON/kernels/arm_gemm/kernels/a64_hgemm_8x24/a55r1.cpp",
1612 "src/core/NEON/kernels/arm_gemm/kernels/a64_hgemm_8x24/generic.cpp",
1613 "src/core/NEON/kernels/arm_gemm/kernels/a64_hgemm_8x24/x1.cpp",
1614 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_bf16fp32_dot_6x16/generic.cpp",
1615 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_bf16fp32_mmla_6x16/generic.cpp",
1616 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_fp16_mla_6x32/a55.cpp",
1617 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_fp16_mla_6x32/generic.cpp",
1618 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_fp32_mla_4x24/a55.cpp",
1619 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_fp32_mla_4x24/generic.cpp",
1620 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_fp32_mla_6x16/a55.cpp",
1621 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_fp32_mla_6x16/generic.cpp",
1622 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_fp32_mla_8x4/a55.cpp",
1623 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_fp32_mla_8x4/generic.cpp",
1624 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_fp32bf16fp32_mmla_4x24/generic.cpp",
1625 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_fp32bf16fp32_mmla_6x16/generic.cpp",
1626 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_s8qa_dot_4x16/a55.cpp",
1627 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_s8qa_dot_4x16/generic.cpp",
1628 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_s8qa_mmla_4x16/generic.cpp",
1629 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_s8qs_dot_6x16/a55.cpp",
1630 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_s8qs_dot_6x16/generic.cpp",
1631 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_s8qs_mmla_6x16/generic.cpp",
1632 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_s8s32_dot_6x16/a55.cpp",
1633 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_s8s32_dot_6x16/generic.cpp",
1634 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_s8s32_mmla_6x16/generic.cpp",
1635 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_u8qa_dot_4x16/a55.cpp",
1636 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_u8qa_dot_4x16/generic.cpp",
1637 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_u8qa_mmla_4x16/generic.cpp",
1638 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_u8u32_dot_6x16/a55.cpp",
1639 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_u8u32_dot_6x16/generic.cpp",
1640 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_u8u32_mmla_6x16/generic.cpp",
1641 "src/core/NEON/kernels/arm_gemm/kernels/a64_interleaved_bf16fp32_dot_8x12/generic.cpp",
1642 "src/core/NEON/kernels/arm_gemm/kernels/a64_interleaved_bf16fp32_dot_8x12/x1.cpp",
1643 "src/core/NEON/kernels/arm_gemm/kernels/a64_interleaved_bf16fp32_mmla_8x12/generic.cpp",
1644 "src/core/NEON/kernels/arm_gemm/kernels/a64_interleaved_bf16fp32_mmla_8x12/a510.cpp",
1645 "src/core/NEON/kernels/arm_gemm/kernels/a64_interleaved_s8s32_mmla_8x12/generic.cpp",
1646 "src/core/NEON/kernels/arm_gemm/kernels/a64_interleaved_s8s32_mmla_8x12/a510.cpp",
1647 "src/core/NEON/kernels/arm_gemm/kernels/a64_interleaved_u8u32_mmla_8x12/generic.cpp",
1648 "src/core/NEON/kernels/arm_gemm/kernels/a64_interleaved_u8u32_mmla_8x12/a510.cpp",
1649 "src/core/NEON/kernels/arm_gemm/kernels/a64_sgemm_8x12/a53.cpp",
1650 "src/core/NEON/kernels/arm_gemm/kernels/a64_sgemm_8x12/a55.cpp",
1651 "src/core/NEON/kernels/arm_gemm/kernels/a64_sgemm_8x12/a55r1.cpp",
1652 "src/core/NEON/kernels/arm_gemm/kernels/a64_sgemm_8x12/generic.cpp",
1653 "src/core/NEON/kernels/arm_gemm/kernels/a64_sgemm_8x12/x1.cpp",
1654 "src/core/NEON/kernels/arm_gemm/kernels/a64_sgemm_8x6/generic.cpp",
1655 "src/core/NEON/kernels/arm_gemm/kernels/a64_smallK_hybrid_fp32_mla_6x4/generic.cpp",
1656 "src/core/NEON/kernels/arm_gemm/kernels/a64_smallK_hybrid_fp32_mla_8x4/generic.cpp",
1657 "src/core/NEON/kernels/arm_gemm/kernels/a64_smallK_hybrid_s8s32_dot_6x4/a55.cpp",
1658 "src/core/NEON/kernels/arm_gemm/kernels/a64_smallK_hybrid_s8s32_dot_6x4/generic.cpp",
1659 "src/core/NEON/kernels/arm_gemm/kernels/a64_smallK_hybrid_s8s32_dot_8x4/a55.cpp",
1660 "src/core/NEON/kernels/arm_gemm/kernels/a64_smallK_hybrid_s8s32_dot_8x4/generic.cpp",
1661 "src/core/NEON/kernels/arm_gemm/kernels/a64_smallK_hybrid_u8u32_dot_6x4/a55.cpp",
1662 "src/core/NEON/kernels/arm_gemm/kernels/a64_smallK_hybrid_u8u32_dot_6x4/generic.cpp",
1663 "src/core/NEON/kernels/arm_gemm/kernels/a64_smallK_hybrid_u8u32_dot_8x4/a55.cpp",
ramelg01a1f78512022-06-29 16:28:10 +01001664 "src/core/NEON/kernels/arm_gemm/kernels/a64_smallK_hybrid_u8u32_dot_8x4/generic.cpp",
Dana Zlotnik256ac622022-02-02 15:06:11 +02001665 "src/cpu/kernels/gemm_matrix_mul/generic/neon/impl.cpp",
1666 "src/cpu/kernels/gemm_matrix_add/generic/neon/impl.cpp"
Motti Gondabi9d9ad332022-01-23 12:42:24 +02001667 ],
Dana Zlotnik256ac622022-02-02 15:06:11 +02001668 "fp32":["src/cpu/kernels/gemm_matrix_mul/generic/neon/fp32.cpp",
1669 "src/cpu/kernels/gemm_matrix_add/generic/neon/fp32.cpp"],
1670 "fp16":["src/cpu/kernels/gemm_matrix_mul/generic/neon/fp16.cpp",
1671 "src/cpu/kernels/gemm_matrix_add/generic/neon/fp16.cpp"],
Michalis Spyrou20fca522021-06-07 14:23:57 +01001672 "estate32": [
1673 "src/core/NEON/kernels/arm_gemm/kernels/a32_sgemm_8x6/a53.cpp",
1674 "src/core/NEON/kernels/arm_gemm/kernels/a32_sgemm_8x6/a55r1.cpp",
1675 "src/core/NEON/kernels/arm_gemm/kernels/a32_sgemm_8x6/generic.cpp"
1676 ],
1677 "estate64": [
Freddie Liardet487d3902021-09-21 12:36:43 +01001678 "src/core/NEON/kernels/arm_gemm/kernels/a64_sgemv_pretransposed/generic.cpp"
Francesco.Petrogalli@arm.com5fcf22d2022-04-05 10:31:08 +00001679 ],
Nathan John Sircombed7113e42023-04-26 15:02:43 +01001680 "fixed_format_kernels": [
Francesco.Petrogalli@arm.com5fcf22d2022-04-05 10:31:08 +00001681 "src/core/NEON/kernels/arm_gemm/kernels/a64_ffhybrid_bf16fp32_mmla_6x16/generic.cpp",
1682 "src/core/NEON/kernels/arm_gemm/kernels/a64_ffhybrid_fp16_mla_6x32/generic.cpp",
1683 "src/core/NEON/kernels/arm_gemm/kernels/a64_ffhybrid_fp32_mla_6x16/generic.cpp",
1684 "src/core/NEON/kernels/arm_gemm/kernels/a64_ffhybrid_fp32bf16fp32_mmla_4x24/generic.cpp",
1685 "src/core/NEON/kernels/arm_gemm/kernels/a64_ffinterleaved_bf16fp32_dot_8x12/generic.cpp",
1686 "src/core/NEON/kernels/arm_gemm/kernels/a64_ffinterleaved_bf16fp32_mmla_8x12/generic.cpp",
1687 "src/core/NEON/kernels/arm_gemm/kernels/a64_ffinterleaved_fp16_mla_8x24/generic.cpp",
1688 "src/core/NEON/kernels/arm_gemm/kernels/a64_ffinterleaved_fp32_mla_8x12/generic.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001689 ]
1690 },
1691 "sve": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001692 "common": [
Viet-Hoa Do03b29712022-06-01 11:47:14 +01001693 "src/core/NEON/kernels/arm_gemm/interleave_indirect-sve.cpp",
1694 "src/core/NEON/kernels/arm_gemm/kernels/sme2_gemv_bf16fp32_dot_16VL/generic.cpp",
David Mansell0fa92b82023-10-17 13:33:24 +01001695 "src/core/NEON/kernels/arm_gemm/kernels/sme2_gemv_fp16fp32fp16_dot_16VL/generic.cpp",
Viet-Hoa Do03b29712022-06-01 11:47:14 +01001696 "src/core/NEON/kernels/arm_gemm/kernels/sme2_gemv_fp32_mla_16VL/generic.cpp",
1697 "src/core/NEON/kernels/arm_gemm/kernels/sme2_gemv_fp32bf16fp32_dot_16VL/generic.cpp",
1698 "src/core/NEON/kernels/arm_gemm/kernels/sme2_gemv_s8qa_dot_16VL/generic.cpp",
1699 "src/core/NEON/kernels/arm_gemm/kernels/sme2_gemv_u8qa_dot_16VL/generic.cpp",
1700 "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_bf16fp32_mopa_1VLx4VL/generic.cpp",
1701 "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_bf16fp32_mopa_2VLx2VL/generic.cpp",
1702 "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_bf16fp32_mopa_4VLx1VL/generic.cpp",
David Mansellaaa9da12023-03-10 13:48:50 +00001703 "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_fp16fp32fp16_mopa_1VLx4VL/generic.cpp",
1704 "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_fp16fp32fp16_mopa_2VLx2VL/generic.cpp",
1705 "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_fp16fp32fp16_mopa_4VLx1VL/generic.cpp",
Viet-Hoa Do03b29712022-06-01 11:47:14 +01001706 "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_fp32_mopa_1VLx4VL/generic.cpp",
1707 "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_fp32_mopa_2VLx2VL/generic.cpp",
1708 "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_fp32_mopa_4VLx1VL/generic.cpp",
1709 "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_s8q_mopa_1VLx4VL/generic.cpp",
1710 "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_s8q_mopa_2VLx2VL/generic.cpp",
1711 "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_s8q_mopa_4VLx1VL/generic.cpp",
1712 "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_s8s32_mopa_1VLx4VL/generic.cpp",
1713 "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_s8s32_mopa_2VLx2VL/generic.cpp",
1714 "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_s8s32_mopa_4VLx1VL/generic.cpp",
1715 "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_u8q_mopa_1VLx4VL/generic.cpp",
1716 "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_u8q_mopa_2VLx2VL/generic.cpp",
1717 "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_u8q_mopa_4VLx1VL/generic.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +01001718 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_bf16fp32_dot_6x4VL/generic.cpp",
Georgios Pinitas4ee8b152021-07-16 16:16:43 +01001719 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_bf16fp32_mmla_6x4VL/generic.cpp",
1720 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_fp16_mla_6x4VL/a64fx.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +01001721 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_fp16_mla_6x4VL/generic.cpp",
Georgios Pinitas4ee8b152021-07-16 16:16:43 +01001722 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_fp32_mla_6x4VL/a64fx.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +01001723 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_fp32_mla_6x4VL/generic.cpp",
Georgios Pinitas4ee8b152021-07-16 16:16:43 +01001724 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_fp32_mla_8x1VL/a64fx.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +01001725 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_fp32_mla_8x1VL/generic.cpp",
Georgios Pinitas4ee8b152021-07-16 16:16:43 +01001726 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_fp32bf16fp32_mmla_4x6VL/generic.cpp",
1727 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_fp32bf16fp32_mmla_6x4VL/generic.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +01001728 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_s8qa_dot_4x4VL/generic.cpp",
Georgios Pinitas4ee8b152021-07-16 16:16:43 +01001729 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_s8qa_mmla_4x4VL/generic.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +01001730 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_s8qs_dot_6x4VL/generic.cpp",
Georgios Pinitas4ee8b152021-07-16 16:16:43 +01001731 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_s8qs_mmla_6x4VL/generic.cpp",
1732 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_s8s32_dot_6x4VL/a64fx.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +01001733 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_s8s32_dot_6x4VL/generic.cpp",
Georgios Pinitas4ee8b152021-07-16 16:16:43 +01001734 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_s8s32_mmla_6x4VL/generic.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +01001735 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_u8qa_dot_4x4VL/generic.cpp",
Georgios Pinitas4ee8b152021-07-16 16:16:43 +01001736 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_u8qa_mmla_4x4VL/generic.cpp",
1737 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_u8u32_dot_6x4VL/a64fx.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +01001738 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_u8u32_dot_6x4VL/generic.cpp",
Georgios Pinitas4ee8b152021-07-16 16:16:43 +01001739 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_u8u32_mmla_6x4VL/generic.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +01001740 "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_bf16fp32_dot_8x3VL/generic.cpp",
1741 "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_bf16fp32_mmla_8x3VL/generic.cpp",
Georgios Pinitas4ee8b152021-07-16 16:16:43 +01001742 "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_fp16_mla_8x3VL/a64fx.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +01001743 "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_fp16_mla_8x3VL/generic.cpp",
Georgios Pinitas4ee8b152021-07-16 16:16:43 +01001744 "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_fp32_mla_8x3VL/a64fx.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +01001745 "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_fp32_mla_8x3VL/generic.cpp",
1746 "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_fp32_mmla_8x3VL/generic.cpp",
Georgios Pinitas4ee8b152021-07-16 16:16:43 +01001747 "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_s8s32_dot_8x3VL/a64fx.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +01001748 "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_s8s32_dot_8x3VL/generic.cpp",
1749 "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_s8s32_mmla_8x3VL/generic.cpp",
Georgios Pinitas4ee8b152021-07-16 16:16:43 +01001750 "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_u8u32_dot_8x3VL/a64fx.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +01001751 "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_u8u32_dot_8x3VL/generic.cpp",
1752 "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_u8u32_mmla_8x3VL/generic.cpp",
Georgios Pinitas4ee8b152021-07-16 16:16:43 +01001753 "src/core/NEON/kernels/arm_gemm/mergeresults-sve.cpp",
Viet-Hoa Do03b29712022-06-01 11:47:14 +01001754 "src/core/NEON/kernels/arm_gemm/transform-sve.cpp",
1755 "src/core/NEON/kernels/arm_gemm/misc-sve.cpp"
Francesco.Petrogalli@arm.com5fcf22d2022-04-05 10:31:08 +00001756 ],
Nathan John Sircombed7113e42023-04-26 15:02:43 +01001757 "fixed_format_kernels": [
Francesco.Petrogalli@arm.com5fcf22d2022-04-05 10:31:08 +00001758 "src/core/NEON/kernels/arm_gemm/kernels/sve_ffhybrid_bf16fp32_mmla_6x4VL/generic.cpp",
1759 "src/core/NEON/kernels/arm_gemm/kernels/sve_ffhybrid_fp16_mla_6x4VL/a64fx.cpp",
1760 "src/core/NEON/kernels/arm_gemm/kernels/sve_ffhybrid_fp16_mla_6x4VL/generic.cpp",
1761 "src/core/NEON/kernels/arm_gemm/kernels/sve_ffhybrid_fp32_mla_6x4VL/a64fx.cpp",
1762 "src/core/NEON/kernels/arm_gemm/kernels/sve_ffhybrid_fp32_mla_6x4VL/generic.cpp",
1763 "src/core/NEON/kernels/arm_gemm/kernels/sve_ffhybrid_fp32bf16fp32_mmla_4x6VL/generic.cpp",
1764 "src/core/NEON/kernels/arm_gemm/kernels/sve_ffinterleaved_bf16fp32_mmla_8x3VL/generic.cpp",
1765 "src/core/NEON/kernels/arm_gemm/kernels/sve_ffinterleaved_fp16_mla_8x3VL/a64fx.cpp",
1766 "src/core/NEON/kernels/arm_gemm/kernels/sve_ffinterleaved_fp16_mla_8x3VL/generic.cpp",
1767 "src/core/NEON/kernels/arm_gemm/kernels/sve_ffinterleaved_fp32_mla_8x3VL/a64fx.cpp",
1768 "src/core/NEON/kernels/arm_gemm/kernels/sve_ffinterleaved_fp32_mla_8x3VL/generic.cpp"
1769 ]
Michalis Spyrou20fca522021-06-07 14:23:57 +01001770 }
1771 }
1772 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001773 "GenerateProposals": {
1774 "deps": [ "BoundingBoxTransform", "Dequantize", "Pad", "Permute", "Quantize", "Reshape" ],
Michalis Spyrou20fca522021-06-07 14:23:57 +01001775 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001776 "common": [
1777 "src/core/NEON/kernels/NEGenerateProposalsLayerKernel.cpp",
1778 "src/runtime/NEON/functions/NEGenerateProposalsLayer.cpp"
Dana Zlotnik50ce2772021-12-29 13:55:56 +02001779 ],
1780 "neon":{
1781 "common":["src/cpu/kernels/genproposals/generic/neon/impl.cpp"],
1782 "fp16":["src/cpu/kernels/genproposals/generic/neon/fp16.cpp"],
1783 "fp32":["src/cpu/kernels/genproposals/generic/neon/fp32.cpp"],
1784 "qsymm16":["src/cpu/kernels/genproposals/generic/neon/qsymm16.cpp"]
1785 }
Michalis Spyrou20fca522021-06-07 14:23:57 +01001786 }
1787 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001788 "InstanceNormalize": {
1789 "deps": [ "Permute", "Reduction" ],
Michalis Spyrou20fca522021-06-07 14:23:57 +01001790 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001791 "common": [
1792 "src/core/NEON/kernels/NEInstanceNormalizationLayerKernel.cpp",
1793 "src/runtime/NEON/functions/NEInstanceNormalizationLayer.cpp"
ramelg01a1f78512022-06-29 16:28:10 +01001794 ],
Dana Zlotnikd7e2ec52022-01-03 10:59:41 +02001795 "neon":{
1796 "common":["src/cpu/kernels/instancenorm/generic/neon/impl.cpp"],
1797 "fp16":["src/cpu/kernels/instancenorm/generic/neon/fp16.cpp"],
1798 "fp32":["src/cpu/kernels/instancenorm/generic/neon/fp32.cpp"]
1799 }
Michalis Spyrou20fca522021-06-07 14:23:57 +01001800 }
1801 },
1802 "L2Normalize": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001803 "deps": [ "Reduction" ],
Michalis Spyrou20fca522021-06-07 14:23:57 +01001804 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001805 "common": [
1806 "src/core/NEON/kernels/NEL2NormalizeLayerKernel.cpp",
1807 "src/runtime/NEON/functions/NEL2NormalizeLayer.cpp"
Yair Schwarzbaum5e993182022-01-10 15:11:07 +02001808 ],
1809 "neon":{
Yair Schwarzbaum5e993182022-01-10 15:11:07 +02001810 "fp32":["src/cpu/kernels/l2normlayer/generic/neon/fp32.cpp"],
1811 "fp16":["src/cpu/kernels/l2normlayer/generic/neon/fp16.cpp"]
1812 }
Michalis Spyrou20fca522021-06-07 14:23:57 +01001813 }
1814 },
1815 "Logical": {
1816 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001817 "common": [
1818 "src/core/NEON/kernels/NELogicalKernel.cpp",
1819 "src/runtime/NEON/functions/NELogical.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001820 ]
1821 }
1822 },
Viet-Hoa Dofd472f02023-03-15 14:05:06 +00001823 "LUT": {
1824 "files": {
1825 "common": [],
1826 "neon":{
1827 "qasymm8": ["src/cpu/kernels/lut/generic/neon/u8.cpp"],
1828 "qasymm8_signed": ["src/cpu/kernels/lut/generic/neon/u8.cpp"]
1829 },
SiCong Lic0463a22023-05-17 13:46:13 +01001830 "sve2": {
1831 "qasymm8": ["src/cpu/kernels/lut/generic/sve2/u8.cpp"],
1832 "qasymm8_signed": ["src/cpu/kernels/lut/generic/sve2/u8.cpp"]
Viet-Hoa Dofd472f02023-03-15 14:05:06 +00001833 }
1834 }
1835 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001836 "LSTM": {
Michalis Spyrou20fca522021-06-07 14:23:57 +01001837 "deps": [
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001838 "Activation",
1839 "Concatenate",
1840 "Copy",
1841 "Dequantize",
1842 "ElementwiseBinary",
1843 "Fill",
1844 "FullyConnected",
1845 "Gemm",
1846 "MeanStdDevNormalize",
1847 "Mul",
1848 "Quantize",
1849 "Slice",
1850 "Transpose"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001851 ],
1852 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001853 "common": [
1854 "src/core/NEON/kernels/NEQLSTMLayerNormalizationKernel.cpp",
1855 "src/runtime/NEON/functions/NELSTMLayer.cpp",
1856 "src/runtime/NEON/functions/NELSTMLayerQuantized.cpp",
1857 "src/runtime/NEON/functions/NEQLSTMLayer.cpp"
1858 ]
1859 }
1860 },
1861 "MaxUnpool2d": {
1862 "deps": [ "Fill" ],
1863 "files": {
1864 "common": [
Dana Zlotnik149203b2022-01-26 12:38:03 +02001865 "src/cpu/kernels/CpuMaxUnpoolingLayerKernel.cpp",
ramelg01a1f78512022-06-29 16:28:10 +01001866 "src/runtime/NEON/functions/NEMaxUnpoolingLayer.cpp",
Dana Zlotnik149203b2022-01-26 12:38:03 +02001867 "src/cpu/operators/CpuMaxUnpooling.cpp"
Dana Zlotnik143310c2021-12-30 13:24:52 +02001868 ],
1869 "neon":{
Dana Zlotnik143310c2021-12-30 13:24:52 +02001870 "fp32":["src/cpu/kernels/maxunpool/generic/neon/fp32.cpp"],
1871 "fp16":["src/cpu/kernels/maxunpool/generic/neon/fp16.cpp"],
1872 "qasymm8":["src/cpu/kernels/maxunpool/generic/neon/qasymm8.cpp"],
Pablo Marquez Tello6b6ba9e2023-09-22 14:36:03 +01001873 "qasymm8_signed":[ "src/cpu/kernels/maxunpool/generic/neon/qasymm8_signed.cpp"]
Dana Zlotnik143310c2021-12-30 13:24:52 +02001874 }
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001875 }
1876 },
1877 "Mean": {
1878 "deps" : [ "Reduction" ],
1879 "files": {
1880 "common": [ "src/runtime/NEON/functions/NEReduceMean.cpp" ]
1881 }
1882 },
1883 "MeanStdDevNormalize": {
1884 "files": {
1885 "common": [
1886 "src/core/NEON/kernels/NEMeanStdDevNormalizationKernel.cpp",
1887 "src/runtime/NEON/functions/NEMeanStdDevNormalizationLayer.cpp"
Dana Zlotnik027bcef2021-12-27 17:35:00 +02001888 ],
1889 "neon":{
1890 "common":["src/cpu/kernels/meanstddevnorm/generic/neon/impl.cpp"],
1891 "fp32":["src/cpu/kernels/meanstddevnorm/generic/neon/fp32.cpp"],
Murray Kornelsen6e09e142022-07-13 21:40:26 -04001892 "fp16":["src/cpu/kernels/meanstddevnorm/generic/neon/fp16.cpp"],
1893 "qasymm8":["src/cpu/kernels/meanstddevnorm/generic/neon/qasymm8.cpp"]
Dana Zlotnik027bcef2021-12-27 17:35:00 +02001894 }
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001895 }
1896 },
Mohammed Suhail Munshia1b1e412023-03-23 22:21:31 +00001897 "MatMul" : {
Viet-Hoa Do99b6fd22023-04-27 17:06:10 +01001898 "deps": [ "Transpose" ],
Mohammed Suhail Munshia1b1e412023-03-23 22:21:31 +00001899 "files": {
1900 "common": [
1901 "src/cpu/operators/CpuMatMul.cpp",
1902 "src/runtime/NEON/functions/NEMatMul.cpp"
1903 ]
1904 }
1905 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001906 "Mul": {
1907 "files": {
1908 "common": [
1909 "src/cpu/operators/CpuMul.cpp",
1910 "src/cpu/kernels/CpuMulKernel.cpp",
1911 "src/runtime/NEON/functions/NEPixelWiseMultiplication.cpp"
Pablo Marquez Tello568aab62023-11-20 14:20:01 +00001912 ],
1913 "neon":{
1914 "fp16":["src/cpu/kernels/mul/generic/neon/fp16.cpp"],
1915 "fp32":["src/cpu/kernels/mul/generic/neon/fp32.cpp"]
1916 }
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001917 }
1918 },
1919 "Normalize": {
1920 "deps": [ "Mul" ],
1921 "files": {
1922 "common": [
1923 "src/core/NEON/kernels/NENormalizationLayerKernel.cpp",
1924 "src/runtime/NEON/functions/NENormalizationLayer.cpp"
Pablo Marquez Telloba933712023-11-13 15:57:54 +00001925 ],
1926 "neon":{
1927 "fp16":["src/cpu/kernels/norm_layer/generic/neon/fp16.cpp"],
1928 "fp32":["src/cpu/kernels/norm_layer/generic/neon/fp32.cpp"]
1929 }
Michalis Spyrou20fca522021-06-07 14:23:57 +01001930 }
1931 },
1932 "Pad": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001933 "deps": [ "Concatenate", "Copy", "StridedSlice" ],
Michalis Spyrou20fca522021-06-07 14:23:57 +01001934 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001935 "common": [
1936 "src/core/NEON/kernels/NEPadLayerKernel.cpp",
1937 "src/runtime/NEON/functions/NEPadLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001938 ]
1939 }
1940 },
1941 "Permute": {
1942 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001943 "common": [
1944 "src/cpu/operators/CpuPermute.cpp",
1945 "src/cpu/kernels/CpuPermuteKernel.cpp",
1946 "src/runtime/NEON/functions/NEPermute.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001947 ]
1948 }
1949 },
1950 "Pool2d": {
1951 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001952 "common": [
1953 "src/cpu/operators/CpuPool2d.cpp",
Georgios Pinitas7891a732021-08-20 21:39:25 +01001954 "src/cpu/kernels/CpuPool2dKernel.cpp",
1955 "src/cpu/kernels/internal/CpuPool2dAssemblyWrapperKernel.cpp",
Motti Gondabi9d9ad332022-01-23 12:42:24 +02001956 "src/runtime/NEON/functions/NEPoolingLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001957 ],
1958 "neon": {
Motti Gondabi9d9ad332022-01-23 12:42:24 +02001959 "common": [
1960 "src/core/NEON/kernels/arm_conv/pooling/kernels/cpp_nhwc_1x1_stride_any_depthfirst/generic.cpp",
Motti Gondabi9d9ad332022-01-23 12:42:24 +02001961 "src/core/NEON/kernels/arm_conv/pooling/pooling_fp32.cpp",
1962 "src/core/NEON/kernels/arm_conv/pooling/pooling_s8.cpp",
1963 "src/core/NEON/kernels/arm_conv/pooling/pooling_s8q.cpp",
1964 "src/core/NEON/kernels/arm_conv/pooling/pooling_u8.cpp",
1965 "src/core/NEON/kernels/arm_conv/pooling/pooling_u8q.cpp",
Motti Gondabi9d9ad332022-01-23 12:42:24 +02001966 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_fp32_nhwc_avg_3x3_s1_output2x2_depthfirst/generic.cpp",
1967 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_fp32_nhwc_avg_generic_depthfirst/generic.cpp",
1968 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_fp32_nhwc_max_2x2_s1_output2x2_depthfirst/generic.cpp",
1969 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_fp32_nhwc_max_generic_depthfirst/generic.cpp",
1970 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_s8_nhwc_avg_generic_depthfirst/generic.cpp",
1971 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_s8_nhwc_max_2x2_s1_output2x2_depthfirst/generic.cpp",
1972 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_s8_nhwc_max_generic_depthfirst/generic.cpp",
1973 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_s8q_nhwc_avg_generic_depthfirst/generic.cpp",
1974 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_s8q_nhwc_max_generic_depthfirst/generic.cpp",
1975 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_u8_nhwc_avg_generic_depthfirst/generic.cpp",
1976 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_u8_nhwc_max_2x2_s1_output2x2_depthfirst/generic.cpp",
1977 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_u8_nhwc_max_generic_depthfirst/generic.cpp",
1978 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_u8q_nhwc_avg_generic_depthfirst/generic.cpp",
ramelg01a1f78512022-06-29 16:28:10 +01001979 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_u8q_nhwc_max_generic_depthfirst/generic.cpp"
Motti Gondabi9d9ad332022-01-23 12:42:24 +02001980 ],
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001981 "nchw": [ "src/cpu/kernels/pool2d/neon/nchw/all.cpp" ],
Pablo Marquez Tello01b0f9b2023-11-07 15:42:46 +00001982 "fp16": [
1983 "src/cpu/kernels/pool2d/neon/fp16.cpp",
1984 "src/core/NEON/kernels/arm_conv/pooling/pooling_fp16.cpp",
1985 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_fp16_nhwc_avg_3x3_s1_output2x2_depthfirst/generic.cpp",
1986 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_fp16_nhwc_avg_generic_depthfirst/generic.cpp",
1987 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_fp16_nhwc_max_2x2_s1_output2x2_depthfirst/generic.cpp",
1988 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_fp16_nhwc_max_generic_depthfirst/generic.cpp"
1989 ],
ramelg01a1f78512022-06-29 16:28:10 +01001990 "fp32": [ "src/cpu/kernels/pool2d/neon/fp32.cpp" ],
1991 "qasymm8":[ "src/cpu/kernels/pool2d/neon/qasymm8.cpp" ],
Dana Zlotnika538ae52022-02-21 13:12:41 +02001992 "qasymm8_signed":["src/cpu/kernels/pool2d/neon/qasymm8_signed.cpp"]
Michalis Spyrou20fca522021-06-07 14:23:57 +01001993 },
1994 "sve": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001995 "common": [
Michalis Spyrou20fca522021-06-07 14:23:57 +01001996 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_fp16_nhwc_avg_3x3_s1_output2x2_depthfirst/generic.cpp",
1997 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_fp16_nhwc_avg_generic_depthfirst/generic.cpp",
1998 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_fp16_nhwc_max_2x2_s1_output2x2_depthfirst/generic.cpp",
1999 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_fp16_nhwc_max_generic_depthfirst/generic.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002000 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_fp32_nhwc_avg_3x3_s1_output2x2_depthfirst/generic.cpp",
2001 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_fp32_nhwc_avg_generic_depthfirst/generic.cpp",
2002 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_fp32_nhwc_max_2x2_s1_output2x2_depthfirst/generic.cpp",
2003 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_fp32_nhwc_max_generic_depthfirst/generic.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +01002004 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_s8_nhwc_avg_generic_depthfirst/generic.cpp",
2005 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_s8_nhwc_max_2x2_s1_output2x2_depthfirst/generic.cpp",
2006 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_s8_nhwc_max_generic_depthfirst/generic.cpp",
2007 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_s8q_nhwc_avg_generic_depthfirst/generic.cpp",
2008 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_s8q_nhwc_max_generic_depthfirst/generic.cpp",
2009 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_u8_nhwc_avg_generic_depthfirst/generic.cpp",
2010 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_u8_nhwc_max_2x2_s1_output2x2_depthfirst/generic.cpp",
2011 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_u8_nhwc_max_generic_depthfirst/generic.cpp",
2012 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_u8q_nhwc_avg_generic_depthfirst/generic.cpp",
Viet-Hoa Do03b29712022-06-01 11:47:14 +01002013 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_u8q_nhwc_max_generic_depthfirst/generic.cpp",
2014 "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_fp16_nhwc_avg_3x3_s1_output2x2_depthfirst/generic.cpp",
2015 "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_fp16_nhwc_avg_generic_depthfirst/generic.cpp",
2016 "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_fp16_nhwc_max_2x2_s1_output2x2_depthfirst/generic.cpp",
2017 "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_fp16_nhwc_max_generic_depthfirst/generic.cpp",
2018 "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_fp32_nhwc_avg_3x3_s1_output2x2_depthfirst/generic.cpp",
2019 "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_fp32_nhwc_avg_generic_depthfirst/generic.cpp",
2020 "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_fp32_nhwc_max_2x2_s1_output2x2_depthfirst/generic.cpp",
2021 "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_fp32_nhwc_max_generic_depthfirst/generic.cpp",
2022 "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_s8_nhwc_avg_generic_depthfirst/generic.cpp",
2023 "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_s8_nhwc_max_2x2_s1_output2x2_depthfirst/generic.cpp",
2024 "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_s8_nhwc_max_generic_depthfirst/generic.cpp",
2025 "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_s8q_nhwc_avg_generic_depthfirst/generic.cpp",
2026 "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_s8q_nhwc_max_generic_depthfirst/generic.cpp",
2027 "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_u8_nhwc_avg_generic_depthfirst/generic.cpp",
2028 "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_u8_nhwc_max_2x2_s1_output2x2_depthfirst/generic.cpp",
2029 "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_u8_nhwc_max_generic_depthfirst/generic.cpp",
2030 "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_u8q_nhwc_avg_generic_depthfirst/generic.cpp",
2031 "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_u8q_nhwc_max_generic_depthfirst/generic.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01002032 ]
2033 }
2034 }
2035 },
Adnan AlSinan171fc3d2022-03-15 18:46:42 +00002036 "Pool3d": {
2037 "files": {
2038 "common": [
2039 "src/cpu/operators/CpuPool3d.cpp",
2040 "src/cpu/kernels/CpuPool3dKernel.cpp",
2041 "src/runtime/NEON/functions/NEPooling3dLayer.cpp"
2042 ],
2043 "neon": {
Adnan AlSinan9104cd52022-04-06 16:19:31 +01002044 "fp16": [ "src/cpu/kernels/pool3d/neon/fp16.cpp" ],
2045 "fp32": [ "src/cpu/kernels/pool3d/neon/fp32.cpp" ],
2046 "qasymm8": [ "src/cpu/kernels/pool3d/neon/qasymm8.cpp" ],
2047 "qasymm8_signed": [ "src/cpu/kernels/pool3d/neon/qasymm8_signed.cpp" ]
Adnan AlSinan171fc3d2022-03-15 18:46:42 +00002048 }
2049 }
2050 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002051 "PRelu": {
2052 "deps": [ "ElementwiseBinary" ],
Michalis Spyrou20fca522021-06-07 14:23:57 +01002053 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002054 "common": [
2055 "src/runtime/NEON/functions/NEPReluLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01002056 ]
2057 }
2058 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002059 "PriorBox": {
Michalis Spyrou20fca522021-06-07 14:23:57 +01002060 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002061 "common": [
2062 "src/core/NEON/kernels/NEPriorBoxLayerKernel.cpp",
2063 "src/runtime/NEON/functions/NEPriorBoxLayer.cpp"
2064 ]
2065 }
2066 },
2067 "Quantize": {
2068 "files": {
2069 "common": [
2070 "src/cpu/operators/CpuQuantize.cpp",
2071 "src/cpu/kernels/CpuQuantizeKernel.cpp",
2072 "src/runtime/NEON/functions/NEQuantizationLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01002073 ]
2074 }
2075 },
2076 "Range": {
2077 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002078 "common": [
2079 "src/core/NEON/kernels/NERangeKernel.cpp",
2080 "src/runtime/NEON/functions/NERange.cpp"
Yair Schwarzbaum9e8a7702021-11-08 10:58:06 +02002081 ],
2082 "neon": {
Yair Schwarzbaum9e8a7702021-11-08 10:58:06 +02002083 "fp32": [ "src/cpu/kernels/range/generic/neon/fp32.cpp" ],
2084 "fp16": [ "src/cpu/kernels/range/generic/neon/fp16.cpp" ],
2085 "integer": [ "src/cpu/kernels/range/generic/neon/integer.cpp" ]
2086 }
Michalis Spyrou20fca522021-06-07 14:23:57 +01002087 }
2088 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002089 "Reduction":{
2090 "deps": [ "Reshape" ],
Michalis Spyrou20fca522021-06-07 14:23:57 +01002091 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002092 "common": [
2093 "src/core/NEON/kernels/NEReductionOperationKernel.cpp",
2094 "src/runtime/NEON/functions/NEReductionOperation.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01002095 ]
2096 }
2097 },
Michalis Spyrou20fca522021-06-07 14:23:57 +01002098 "Reorg": {
2099 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002100 "common": [
2101 "src/core/NEON/kernels/NEReorgLayerKernel.cpp",
2102 "src/runtime/NEON/functions/NEReorgLayer.cpp"
2103 ]
2104 }
2105 },
2106 "Reshape": {
2107 "files": {
2108 "common": [
2109 "src/cpu/operators/CpuReshape.cpp",
2110 "src/cpu/kernels/CpuReshapeKernel.cpp",
2111 "src/runtime/NEON/functions/NEReshapeLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01002112 ]
2113 }
2114 },
David Svantesson3b162e52023-03-28 14:13:32 +00002115 "Reorder": {
2116 "files": {
2117 "common": [
David Svantessonf0ff76d2023-04-28 16:34:52 +00002118 "src/runtime/NEON/functions/NEReorderLayer.cpp",
David Svantesson3b162e52023-03-28 14:13:32 +00002119 "src/core/NEON/kernels/NEReorderKernel.cpp"
2120 ]
2121 }
2122 },
Michalis Spyrou20fca522021-06-07 14:23:57 +01002123 "Reverse": {
2124 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002125 "common": [
2126 "src/core/NEON/kernels/NEReverseKernel.cpp",
2127 "src/runtime/NEON/functions/NEReverse.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01002128 ]
2129 }
2130 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002131 "RNN": {
2132 "deps": [ "Activation", "Add", "FullyConnected", "Gemm"],
2133 "files": {
2134 "common": [ "src/runtime/NEON/functions/NERNNLayer.cpp" ]
2135 }
2136 },
Michalis Spyrou20fca522021-06-07 14:23:57 +01002137 "ROIAlign": {
2138 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002139 "common": [
2140 "src/core/NEON/kernels/NEROIAlignLayerKernel.cpp",
2141 "src/runtime/NEON/functions/NEROIAlignLayer.cpp"
Dana Zlotnik9ae5a4e2022-01-03 16:22:47 +02002142 ],
2143 "neon":{
Dana Zlotnik9ae5a4e2022-01-03 16:22:47 +02002144 "fp32":["src/cpu/kernels/roialign/generic/neon/fp32.cpp"],
2145 "fp16":["src/cpu/kernels/roialign/generic/neon/fp16.cpp"],
2146 "qasymm8":["src/cpu/kernels/roialign/generic/neon/qasymm8.cpp"],
2147 "qasymm8_signed":["src/cpu/kernels/roialign/generic/neon/qasymm8_signed.cpp"]
2148 }
Michalis Spyrou20fca522021-06-07 14:23:57 +01002149 }
2150 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002151 "ROIPool2d": {
Michalis Spyrou20fca522021-06-07 14:23:57 +01002152 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002153 "common": [
2154 "src/core/NEON/kernels/NEROIPoolingLayerKernel.cpp",
2155 "src/runtime/NEON/functions/NEROIPoolingLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01002156 ]
2157 }
2158 },
2159 "Scale": {
2160 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002161 "common": [
2162 "src/cpu/operators/CpuScale.cpp",
2163 "src/cpu/kernels/CpuScaleKernel.cpp",
2164 "src/runtime/NEON/functions/NEScale.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01002165 ],
2166 "sve": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002167 "fp16": [ "src/cpu/kernels/scale/sve/fp16.cpp" ],
2168 "fp32": [ "src/cpu/kernels/scale/sve/fp32.cpp" ],
2169 "integer": [ "src/cpu/kernels/scale/sve/integer.cpp" ],
2170 "qasymm8": [ "src/cpu/kernels/scale/sve/qasymm8.cpp" ],
2171 "qasymm8_signed": [ "src/cpu/kernels/scale/sve/qasymm8_signed.cpp" ]
Michalis Spyrou20fca522021-06-07 14:23:57 +01002172 },
2173 "neon": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002174 "fp16": [ "src/cpu/kernels/scale/neon/fp16.cpp" ],
2175 "integer": [ "src/cpu/kernels/scale/neon/integer.cpp" ],
Gunes Bayirc4f27432022-09-11 15:59:19 +01002176 "qasymm8": [ "src/cpu/kernels/scale/neon/qasymm8.cpp", "src/cpu/kernels/scale/neon/integer.cpp" ],
2177 "qasymm8_signed": [ "src/cpu/kernels/scale/neon/qasymm8_signed.cpp", "src/cpu/kernels/scale/neon/integer.cpp" ]
Michalis Spyrou20fca522021-06-07 14:23:57 +01002178 }
2179 }
2180 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002181 "Select": {
2182 "files": {
2183 "common": [
2184 "src/core/NEON/kernels/NESelectKernel.cpp",
2185 "src/runtime/NEON/functions/NESelect.cpp"
Anton Vainer8a9a0fb2022-01-09 14:37:12 +02002186 ],
2187 "neon": {
Anton Vainer8a9a0fb2022-01-09 14:37:12 +02002188 "fp32": [ "src/cpu/kernels/select/generic/neon/fp32.cpp" ],
2189 "fp16": [ "src/cpu/kernels/select/generic/neon/fp16.cpp" ],
2190 "integer": [ "src/cpu/kernels/select/generic/neon/integer.cpp" ]
2191 }
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002192 }
2193 },
2194 "Slice": {
2195 "deps": [ "StridedSlice" ],
2196 "files": {
2197 "common": [ "src/runtime/NEON/functions/NESlice.cpp" ]
2198 }
2199 },
Michalis Spyrou20fca522021-06-07 14:23:57 +01002200 "Softmax": {
2201 "deps": [
2202 "Permute"
2203 ],
2204 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002205 "common": [
2206 "src/cpu/operators/CpuSoftmax.cpp",
2207 "src/cpu/kernels/CpuSoftmaxKernel.cpp",
2208 "src/runtime/NEON/functions/NESoftmaxLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01002209 ],
Dana Zlotnikc48a3e52021-12-21 13:34:42 +02002210 "neon":{
Dana Zlotnika538ae52022-02-21 13:12:41 +02002211 "common":["src/cpu/kernels/softmax/generic/neon/impl.cpp"],
Dana Zlotnikc48a3e52021-12-21 13:34:42 +02002212 "fp32": ["src/cpu/kernels/softmax/generic/neon/fp32.cpp"],
ramelg01a1f78512022-06-29 16:28:10 +01002213 "fp16": ["src/cpu/kernels/softmax/generic/neon/fp16.cpp"],
2214 "qasymm8":[ "src/cpu/kernels/softmax/generic/neon/qasymm8.cpp"],
Dana Zlotnik6a2df882022-01-17 09:54:26 +02002215 "qasymm8_signed":["src/cpu/kernels/softmax/generic/neon/qasymm8_signed.cpp"]
Dana Zlotnikc48a3e52021-12-21 13:34:42 +02002216 },
Michalis Spyrou20fca522021-06-07 14:23:57 +01002217 "sve": {
Gunes Bayirfadc9b12023-11-07 05:43:07 +00002218 "common": [ "src/cpu/kernels/softmax/generic/sve/impl.cpp" ]
Dana Zlotnik6a2df882022-01-17 09:54:26 +02002219 },
2220 "sve2":{
Gunes Bayirfadc9b12023-11-07 05:43:07 +00002221 "common" :["src/cpu/kernels/softmax/generic/sve2/impl.cpp"]
Michalis Spyrou20fca522021-06-07 14:23:57 +01002222 }
2223 }
2224 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002225 "SpaceToBatch": {
2226 "files": {
2227 "common": [
2228 "src/core/NEON/kernels/NESpaceToBatchLayerKernel.cpp",
2229 "src/runtime/NEON/functions/NESpaceToBatchLayer.cpp"
2230 ]
2231 }
2232 },
2233 "SpaceToDepth": {
2234 "files": {
2235 "common": [
2236 "src/core/NEON/kernels/NESpaceToDepthLayerKernel.cpp",
2237 "src/runtime/NEON/functions/NESpaceToDepthLayer.cpp"
2238 ]
2239 }
2240 },
2241 "Split": {
2242 "deps": [ "StridedSlice" ],
2243 "files": {
2244 "common": [
2245 "src/runtime/NEON/functions/NESplit.cpp"
2246 ]
2247 }
2248 },
2249 "Stack": {
2250 "files": {
2251 "common": [
2252 "src/core/NEON/kernels/NEStackLayerKernel.cpp",
2253 "src/runtime/NEON/functions/NEStackLayer.cpp"
2254 ]
2255 }
2256 },
2257 "StridedSlice": {
2258 "files": {
2259 "common": [
2260 "src/core/NEON/kernels/NEStridedSliceKernel.cpp",
2261 "src/runtime/NEON/functions/NEStridedSlice.cpp"
2262 ]
2263 }
2264 },
Michalis Spyrou20fca522021-06-07 14:23:57 +01002265 "Sub": {
2266 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002267 "common": [
2268 "src/cpu/operators/CpuSub.cpp",
2269 "src/cpu/kernels/CpuSubKernel.cpp",
Pablo Marquez Tello67773592023-10-06 13:49:44 +01002270 "src/runtime/NEON/functions/NEArithmeticSubtraction.cpp"
2271 ],
2272 "neon": {
2273 "fp16":["src/cpu/kernels/sub/neon/fp16.cpp"],
2274 "qasymm8": ["src/cpu/kernels/sub/neon/qasymm8.cpp"],
2275 "qasymm8_signed": ["src/cpu/kernels/sub/neon/qasymm8_signed.cpp"],
2276 "qsymm16": ["src/cpu/kernels/sub/neon/qsymm16.cpp"]
2277 }
Michalis Spyrou20fca522021-06-07 14:23:57 +01002278 }
2279 },
Pablo Marquez Tello67773592023-10-06 13:49:44 +01002280
Michalis Spyrou20fca522021-06-07 14:23:57 +01002281 "Tile": {
2282 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002283 "common": [
2284 "src/core/NEON/kernels/NETileKernel.cpp",
2285 "src/runtime/NEON/functions/NETile.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01002286 ]
2287 }
2288 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002289 "Transpose": {
Michalis Spyrou20fca522021-06-07 14:23:57 +01002290 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002291 "common": [
2292 "src/cpu/kernels/CpuTransposeKernel.cpp",
2293 "src/cpu/operators/CpuTranspose.cpp",
2294 "src/runtime/NEON/functions/NETranspose.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01002295 ]
2296 }
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002297 },
2298 "Unstack": {
2299 "deps": [ "StridedSlice" ],
2300 "files": {
2301 "common": [ "src/runtime/NEON/functions/NEUnstack.cpp" ]
2302 }
Michalis Spyrou20fca522021-06-07 14:23:57 +01002303 }
2304 }
Giorgio Arena232c4522022-03-03 10:09:01 +00002305 },
2306 "experimental": {
SiCong Li23882a92023-06-28 09:49:45 +01002307 "dynamic_fusion": {
2308 "common": [
2309 "src/dynamic_fusion/runtime/gpu/cl/ClKernelRuntime.cpp",
2310 "src/dynamic_fusion/runtime/gpu/cl/ClWorkloadRuntime.cpp",
2311 "src/dynamic_fusion/sketch/attributes/CastAttributes.cpp",
2312 "src/dynamic_fusion/sketch/attributes/ClampAttributes.cpp",
2313 "src/dynamic_fusion/sketch/attributes/Conv2dAttributes.cpp",
2314 "src/dynamic_fusion/sketch/attributes/DepthwiseConv2dAttributes.cpp",
Adnan AlSinand9c1d442023-10-06 19:07:48 +01002315 "src/dynamic_fusion/sketch/attributes/MatMulAttributes.cpp",
SiCong Li23882a92023-06-28 09:49:45 +01002316 "src/dynamic_fusion/sketch/attributes/Pool2dAttributes.cpp",
2317 "src/dynamic_fusion/sketch/attributes/ResizeAttributes.cpp",
2318 "src/dynamic_fusion/sketch/attributes/SoftmaxAttributes.cpp",
2319 "src/dynamic_fusion/sketch/attributes/ReshapeAttributes.cpp",
2320 "src/dynamic_fusion/sketch/gpu/GpuKernelArgument.cpp",
2321 "src/dynamic_fusion/sketch/gpu/GpuKernelComponentGraph.cpp",
2322 "src/dynamic_fusion/sketch/gpu/GpuKernelComponentGroup.cpp",
2323 "src/dynamic_fusion/sketch/gpu/GpuKernelComponentStream.cpp",
2324 "src/dynamic_fusion/sketch/gpu/GpuLogicalKernel.cpp",
2325 "src/dynamic_fusion/sketch/gpu/GpuOperatorGroup.cpp",
2326 "src/dynamic_fusion/sketch/gpu/GpuWorkloadContext.cpp",
2327 "src/dynamic_fusion/sketch/gpu/GpuWorkloadSketch.cpp",
2328 "src/dynamic_fusion/sketch/gpu/components/cl/ClComponentActivation.cpp",
2329 "src/dynamic_fusion/sketch/gpu/components/cl/ClComponentCast.cpp",
2330 "src/dynamic_fusion/sketch/gpu/components/cl/ClComponentDepthwiseConv2d.cpp",
2331 "src/dynamic_fusion/sketch/gpu/components/cl/ClComponentDirectConv2d.cpp",
Adnan AlSinand9c1d442023-10-06 19:07:48 +01002332 "src/dynamic_fusion/sketch/gpu/components/cl/ClComponentMatMul.cpp",
SiCong Li23882a92023-06-28 09:49:45 +01002333 "src/dynamic_fusion/sketch/gpu/components/cl/ClComponentPool2d.cpp",
2334 "src/dynamic_fusion/sketch/gpu/components/cl/ClComponentElementwiseBinary.cpp",
2335 "src/dynamic_fusion/sketch/gpu/components/cl/ClComponentLogits1DMaxShiftExpSum.cpp",
2336 "src/dynamic_fusion/sketch/gpu/components/cl/ClComponentLogits1DNorm.cpp",
2337 "src/dynamic_fusion/sketch/gpu/components/cl/ClComponentReshape.cpp",
2338 "src/dynamic_fusion/sketch/gpu/components/cl/ClComponentResize.cpp",
2339 "src/dynamic_fusion/sketch/gpu/components/cl/ClComponentStore.cpp",
2340 "src/dynamic_fusion/sketch/gpu/operators/GpuAdd.cpp",
2341 "src/dynamic_fusion/sketch/gpu/operators/GpuCast.cpp",
2342 "src/dynamic_fusion/sketch/gpu/operators/GpuClamp.cpp",
2343 "src/dynamic_fusion/sketch/gpu/operators/GpuConv2d.cpp",
2344 "src/dynamic_fusion/sketch/gpu/operators/GpuDepthwiseConv2d.cpp",
Adnan AlSinand9c1d442023-10-06 19:07:48 +01002345 "src/dynamic_fusion/sketch/gpu/operators/GpuMatMul.cpp",
SiCong Li23882a92023-06-28 09:49:45 +01002346 "src/dynamic_fusion/sketch/gpu/operators/GpuMul.cpp",
2347 "src/dynamic_fusion/sketch/gpu/operators/GpuReshape.cpp",
2348 "src/dynamic_fusion/sketch/gpu/operators/GpuPool2d.cpp",
2349 "src/dynamic_fusion/sketch/gpu/operators/GpuOutput.cpp",
2350 "src/dynamic_fusion/sketch/gpu/operators/GpuResize.cpp",
2351 "src/dynamic_fusion/sketch/gpu/operators/GpuSigmoid.cpp",
2352 "src/dynamic_fusion/sketch/gpu/operators/GpuSoftmax.cpp",
2353 "src/dynamic_fusion/sketch/gpu/operators/GpuSub.cpp",
2354 "src/dynamic_fusion/sketch/gpu/operators/GpuTanh.cpp",
2355 "src/dynamic_fusion/sketch/gpu/operators/internal/GpuElementwiseBinaryCommon.cpp"
2356 ],
2357 "template_writer": [
2358 "src/dynamic_fusion/sketch/gpu/template_writer/cl/ClTemplateActivation.cpp",
2359 "src/dynamic_fusion/sketch/gpu/template_writer/cl/ClTemplateCast.cpp",
2360 "src/dynamic_fusion/sketch/gpu/template_writer/cl/ClTemplateDepthwiseConv2d.cpp",
2361 "src/dynamic_fusion/sketch/gpu/template_writer/cl/ClTemplateDirectConv2d.cpp",
2362 "src/dynamic_fusion/sketch/gpu/template_writer/cl/ClTemplatePool2d.cpp",
2363 "src/dynamic_fusion/sketch/gpu/template_writer/cl/ClTemplateElementwiseBinary.cpp",
2364 "src/dynamic_fusion/sketch/gpu/template_writer/cl/ClTemplateLogits1DMaxShiftExpSum.cpp",
2365 "src/dynamic_fusion/sketch/gpu/template_writer/cl/ClTemplateLogits1DNorm.cpp",
2366 "src/dynamic_fusion/sketch/gpu/template_writer/cl/ClTemplateReshape.cpp",
2367 "src/dynamic_fusion/sketch/gpu/template_writer/cl/ClTemplateResize.cpp",
2368 "src/dynamic_fusion/sketch/gpu/template_writer/cl/ClTemplateStore.cpp",
2369 "src/dynamic_fusion/sketch/gpu/template_writer/cl/ClTemplateWriter.cpp",
2370 "src/dynamic_fusion/sketch/gpu/template_writer/GpuKernelVariableTable.cpp"
2371 ],
2372 "ckw_driver": [
2373 "src/dynamic_fusion/sketch/gpu/ckw_driver/GpuCkwComponentArgument.cpp",
2374 "src/dynamic_fusion/sketch/gpu/ckw_driver/GpuCkwDriver.cpp",
2375 "src/dynamic_fusion/sketch/gpu/ckw_driver/components/GpuCkwActivation.cpp",
2376 "src/dynamic_fusion/sketch/gpu/ckw_driver/components/GpuCkwCast.cpp",
ramy.elgammal@arm.coma04ae3e2023-07-27 18:23:17 +01002377 "src/dynamic_fusion/sketch/gpu/ckw_driver/components/GpuCkwDepthwiseConv2d.cpp",
Jakub Sujake1c96e72023-07-31 13:36:58 +01002378 "src/dynamic_fusion/sketch/gpu/ckw_driver/components/GpuCkwDirectConv2d.cpp",
SiCong Li23882a92023-06-28 09:49:45 +01002379 "src/dynamic_fusion/sketch/gpu/ckw_driver/components/GpuCkwElementwiseBinary.cpp",
Adnan AlSinan2e6d6592023-08-21 13:54:27 +01002380 "src/dynamic_fusion/sketch/gpu/ckw_driver/components/GpuCkwPool2d.cpp",
Adnan AlSinand9c1d442023-10-06 19:07:48 +01002381 "src/dynamic_fusion/sketch/gpu/ckw_driver/components/GpuCkwMatMul.cpp",
Gunes Bayir91cb7332023-07-25 17:00:33 +01002382 "src/dynamic_fusion/sketch/gpu/ckw_driver/components/GpuCkwResize.cpp",
SiCong Li23882a92023-06-28 09:49:45 +01002383 "src/dynamic_fusion/sketch/gpu/ckw_driver/components/GpuCkwStore.cpp",
2384 "src/dynamic_fusion/sketch/gpu/ckw_driver/GpuCkwKernelWriter.cpp",
2385 "src/dynamic_fusion/sketch/gpu/ckw_driver/GpuCkwScopedKernelWriter.cpp",
2386 "src/dynamic_fusion/sketch/gpu/ckw_driver/GpuCkwVariableTable.cpp",
2387 "src/dynamic_fusion/runtime/gpu/cl/ckw_driver/GpuCkwKernelArgumentsHelpers.cpp"
2388 ]
2389 }
Michalis Spyrou20fca522021-06-07 14:23:57 +01002390 }
ramelg018a164882022-04-07 02:42:52 +01002391}