blob: 3bdc00aeef661301def73f21e0cd3683783ea412 [file] [log] [blame]
Georgios Pinitasbdcdc392021-04-22 16:42:03 +01001{
Michalis Spyrou20fca522021-06-07 14:23:57 +01002 "common": [
3 "src/common/cpuinfo/CpuInfo.cpp",
4 "src/common/cpuinfo/CpuModel.cpp",
5 "src/common/cpuinfo/CpuIsaInfo.cpp",
6 "src/common/utils/LegacySupport.cpp",
7 "src/common/AllocatorWrapper.cpp",
8 "src/common/ITensorV2.cpp",
Georgios Pinitas41648142021-08-03 08:24:00 +01009 "src/common/TensorPack.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +010010 "src/common/IOperator.cpp",
11 "src/core/AccessWindowAutoPadding.cpp",
12 "src/core/AccessWindowStatic.cpp",
13 "src/core/AccessWindowTranspose.cpp",
14 "src/core/Error.cpp",
15 "src/core/GPUTarget.cpp",
16 "src/core/Helpers.cpp",
17 "src/core/IAccessWindow.cpp",
18 "src/core/IKernel.cpp",
19 "src/core/ITensor.cpp",
20 "src/core/ITensorPack.cpp",
21 "src/core/Rounding.cpp",
22 "src/core/Size2D.cpp",
23 "src/core/SubTensorInfo.cpp",
24 "src/core/TensorInfo.cpp",
25 "src/core/Utils.cpp",
26 "src/core/Validate.cpp",
27 "src/core/Version.cpp",
28 "src/core/helpers/SoftmaxHelpers.cpp",
29 "src/core/helpers/WindowHelpers.cpp",
30 "src/core/utils/AssemblyUtils.cpp",
31 "src/core/utils/ScaleUtils.cpp",
32 "src/core/utils/helpers/fft.cpp",
33 "src/core/utils/helpers/tensor_transform.cpp",
34 "src/core/utils/io/FileHandler.cpp",
35 "src/core/utils/misc/MMappedFile.cpp",
36 "src/core/utils/quantization/AsymmHelpers.cpp",
37 "src/core/CPP/CPPTypes.cpp",
38 "src/core/CPP/kernels/CPPBoxWithNonMaximaSuppressionLimitKernel.cpp",
39 "src/core/CPP/kernels/CPPNonMaximumSuppressionKernel.cpp",
40 "src/core/CPP/kernels/CPPPermuteKernel.cpp",
41 "src/core/CPP/kernels/CPPTopKVKernel.cpp",
42 "src/core/CPP/kernels/CPPUpsampleKernel.cpp",
43 "src/runtime/Allocator.cpp",
44 "src/runtime/BlobLifetimeManager.cpp",
45 "src/runtime/BlobMemoryPool.cpp",
46 "src/runtime/ISimpleLifetimeManager.cpp",
47 "src/runtime/ITensorAllocator.cpp",
48 "src/runtime/IWeightsManager.cpp",
49 "src/runtime/IScheduler.cpp",
50 "src/runtime/Memory.cpp",
51 "src/runtime/MemoryManagerOnDemand.cpp",
52 "src/runtime/OffsetLifetimeManager.cpp",
53 "src/runtime/OffsetMemoryPool.cpp",
54 "src/runtime/OperatorTensor.cpp",
55 "src/runtime/PoolManager.cpp",
56 "src/runtime/RuntimeContext.cpp",
57 "src/runtime/Scheduler.cpp",
58 "src/runtime/SchedulerFactory.cpp",
59 "src/runtime/SchedulerUtils.cpp",
60 "src/runtime/SubTensor.cpp",
61 "src/runtime/Tensor.cpp",
62 "src/runtime/TensorAllocator.cpp",
63 "src/runtime/Utils.cpp",
64 "src/runtime/CPP/ICPPSimpleFunction.cpp",
65 "src/runtime/CPP/functions/CPPBoxWithNonMaximaSuppressionLimit.cpp",
66 "src/runtime/CPP/functions/CPPDetectionOutputLayer.cpp",
67 "src/runtime/CPP/functions/CPPDetectionPostProcessLayer.cpp",
68 "src/runtime/CPP/functions/CPPNonMaximumSuppression.cpp",
69 "src/runtime/CPP/functions/CPPPermute.cpp",
70 "src/runtime/CPP/functions/CPPTopKV.cpp",
71 "src/runtime/CPP/functions/CPPUpsample.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +010072 ],
Georgios Pinitasb6af4822021-09-14 12:33:34 +010073 "logging": [
74 "src/core/utils/logging/FilePrinter.cpp",
75 "src/core/utils/logging/Helpers.cpp",
76 "src/core/utils/logging/Logger.cpp",
77 "src/core/utils/logging/LoggerRegistry.cpp"
78 ],
79 "scheduler": {
80 "single": [ "src/runtime/CPP/SingleThreadScheduler.cpp" ],
81 "threads": [ "src/runtime/CPP/CPPScheduler.cpp" ],
82 "omp": [ "src/runtime/OMP/OMPScheduler.cpp"]
83 },
Michalis Spyrou20fca522021-06-07 14:23:57 +010084 "c_api": {
Georgios Pinitas13ef1762021-07-14 17:14:43 +010085 "common": [
Michalis Spyrou20fca522021-06-07 14:23:57 +010086 "src/c/AclContext.cpp",
Georgios Pinitas06ac6e42021-07-05 08:08:52 +010087 "src/c/AclOperator.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +010088 "src/c/AclQueue.cpp",
89 "src/c/AclTensor.cpp",
90 "src/c/AclTensorPack.cpp",
91 "src/c/AclVersion.cpp"
Georgios Pinitasbdcdc392021-04-22 16:42:03 +010092 ],
Georgios Pinitas13ef1762021-07-14 17:14:43 +010093 "cpu": [
94 ],
Michalis Spyrou20fca522021-06-07 14:23:57 +010095 "gpu": [
96 "src/c/cl/AclOpenClExt.cpp"
Georgios Pinitas41648142021-08-03 08:24:00 +010097 ],
98 "operators":
99 [
100 "src/c/operators/AclActivation.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +0100101 ]
102 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100103 "high_priority": [
104 "Activation",
105 "DepthwiseConv2d",
106 "Conv2d",
107 "Permute",
108 "Pool2d",
109 "Reshape"
110 ],
Michalis Spyrou20fca522021-06-07 14:23:57 +0100111 "gpu": {
Georgios Pinitas13ef1762021-07-14 17:14:43 +0100112 "common": [
113 "src/core/CL/CLCompileContext.cpp",
Giorgio Arenaba2dd822021-07-28 16:10:03 +0100114 "src/core/CL/DefaultLWSHeuristics.cpp",
Georgios Pinitas13ef1762021-07-14 17:14:43 +0100115 "src/core/CL/CLHelpers.cpp",
116 "src/core/CL/CLKernelLibrary.cpp",
117 "src/core/CL/CLUtils.cpp",
118 "src/core/CL/ICLKernel.cpp",
119 "src/core/CL/ICLSimple2DKernel.cpp",
120 "src/core/CL/ICLSimple3DKernel.cpp",
121 "src/core/CL/ICLSimpleKernel.cpp",
122 "src/core/CL/ICLTensor.cpp",
123 "src/core/CL/OpenCL.cpp",
Georgios Pinitas13ef1762021-07-14 17:14:43 +0100124 "src/gpu/cl/ClContext.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100125 "src/gpu/cl/ClKernelLibrary.cpp",
Georgios Pinitas13ef1762021-07-14 17:14:43 +0100126 "src/gpu/cl/ClQueue.cpp",
127 "src/gpu/cl/ClTensor.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100128 "src/core/CL/kernels/CLFillBorderKernel.cpp",
Georgios Pinitas13ef1762021-07-14 17:14:43 +0100129 "src/runtime/CL/CLBufferAllocator.cpp",
130 "src/runtime/CL/CLGEMMHeuristicsHandle.cpp",
131 "src/runtime/CL/CLHelpers.cpp",
132 "src/runtime/CL/CLMemory.cpp",
133 "src/runtime/CL/CLMemoryRegion.cpp",
134 "src/runtime/CL/CLOperator.cpp",
135 "src/runtime/CL/CLRuntimeContext.cpp",
136 "src/runtime/CL/CLScheduler.cpp",
137 "src/runtime/CL/CLSubTensor.cpp",
138 "src/runtime/CL/CLTensor.cpp",
139 "src/runtime/CL/CLTensorAllocator.cpp",
140 "src/runtime/CL/CLTuner.cpp",
141 "src/runtime/CL/ICLSimpleFunction.cpp",
142 "src/runtime/CL/Utils.cpp",
Georgios Pinitas13ef1762021-07-14 17:14:43 +0100143 "src/runtime/CL/mlgo/HeuristicTree.cpp",
144 "src/runtime/CL/mlgo/MLGOHeuristics.cpp",
145 "src/runtime/CL/mlgo/MLGOParser.cpp",
146 "src/runtime/CL/mlgo/Utils.cpp",
147 "src/runtime/CL/tuners/CLTuningParametersList.cpp"
148 ],
Michalis Spyrou20fca522021-06-07 14:23:57 +0100149 "operators": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100150 "Activation":{
151 "files": {
152 "common": [
153 "src/gpu/cl/kernels/ClActivationKernel.cpp",
154 "src/gpu/cl/operators/ClActivation.cpp",
155 "src/runtime/CL/functions/CLActivationLayer.cpp"
156 ]
157 }
158 },
159 "ArgMinMax": {
160 "deps": [ "Reshape" ],
161 "files": {
162 "common": [
163 "src/core/CL/kernels/CLArgMinMaxLayerKernel.cpp",
164 "src/runtime/CL/functions/CLArgMinMaxLayer.cpp"
165 ]
166 }
167 },
168 "Add": {
169 "files": {
170 "common": [
171 "src/gpu/cl/kernels/ClElementwiseKernel.cpp",
172 "src/gpu/cl/operators/ClAdd.cpp"
173 ]
174 }
175 },
176 "BatchNormalization": {
177 "files": {
178 "common": [
179 "src/core/CL/kernels/CLBatchNormalizationLayerKernel.cpp",
180 "src/core/CL/kernels/CLFuseBatchNormalizationKernel.cpp",
181 "src/runtime/CL/functions/CLBatchNormalizationLayer.cpp",
182 "src/runtime/CL/functions/CLFuseBatchNormalization.cpp"
183 ]
184 }
185 },
186 "BatchToSpace": {
187 "files": {
188 "common": [
189 "src/core/CL/kernels/CLBatchToSpaceLayerKernel.cpp",
190 "src/runtime/CL/functions/CLBatchToSpaceLayer.cpp"
191 ]
192 }
193 },
194 "Bitwise": {
195 "files": {
196 "common": [ "src/core/CL/kernels/CLBitwiseKernel.cpp" ]
197 }
198 },
199 "BitwiseAnd": {
200 "deps": [ "Bitwise" ],
201 "files": {
202 "common": [ "src/runtime/CL/functions/CLBitwiseAnd.cpp" ]
203 }
204 },
205 "BitwiseNot": {
206 "deps": [ "Bitwise" ],
207 "files": {
208 "common": [ "src/runtime/CL/functions/CLBitwiseNot.cpp" ]
209 }
210 },
211 "BitwiseOr": {
212 "deps": [ "Bitwise" ],
213 "files": {
214 "common": [ "src/runtime/CL/functions/CLBitwiseOr.cpp" ]
215 }
216 },
217 "BitwiseXor": {
218 "deps": [ "Bitwise" ],
219 "files": {
220 "common": [ "src/runtime/CL/functions/CLBitwiseXor.cpp" ]
221 }
222 },
223 "BoundingBoxTransform": {
224 "files": {
225 "common": [
226 "src/core/CL/kernels/CLBoundingBoxTransformKernel.cpp",
227 "src/runtime/CL/functions/CLBoundingBoxTransform.cpp"
228 ]
229 }
230 },
231 "Cast": {
232 "files": {
233 "common": [
234 "src/gpu/cl/kernels/ClCastKernel.cpp",
235 "src/gpu/cl/operators/ClCast.cpp",
236 "src/runtime/CL/functions/CLCast.cpp"
237 ]
238 }
239 },
240 "ChannelShuffle": {
241 "files": {
242 "common": [
243 "src/core/CL/kernels/CLChannelShuffleLayerKernel.cpp",
244 "src/runtime/CL/functions/CLChannelShuffleLayer.cpp"
245 ]
246 }
247 },
248 "Comparison": {
249 "files": {
250 "common": [
251 "src/core/CL/kernels/CLComparisonKernel.cpp",
252 "src/runtime/CL/functions/CLComparison.cpp"
253 ]
254 }
255 },
256 "Concatenate": {
257 "files": {
258 "common": [
259 "src/gpu/cl/kernels/ClBatchConcatenateKernel.cpp",
260 "src/gpu/cl/kernels/ClDepthConcatenateKernel.cpp",
261 "src/gpu/cl/kernels/ClHeightConcatenateKernel.cpp",
262 "src/gpu/cl/kernels/ClWidthConcatenate2TensorsKernel.cpp",
263 "src/gpu/cl/kernels/ClWidthConcatenate4TensorsKernel.cpp",
264 "src/gpu/cl/kernels/ClWidthConcatenateKernel.cpp",
265 "src/gpu/cl/operators/ClConcatenate.cpp",
266 "src/runtime/CL/functions/CLConcatenateLayer.cpp"
267 ]
268 }
269 },
270 "Conv2d": {
271 "deps": [
272 "Activation",
273 "ElementwiseBinary",
274 "FFT2D",
275 "Gemm",
276 "Mul",
277 "Pad",
278 "Permute",
279 "Reduction",
280 "Reshape",
281 "Reverse",
282 "Slice"
283 ],
284 "files": {
285 "common": [
286 "src/gpu/cl/kernels/ClDirectConv2dKernel.cpp",
287 "src/gpu/cl/kernels/ClWinogradFilterTransformKernel.cpp",
288 "src/gpu/cl/kernels/ClWinogradInputTransformKernel.cpp",
289 "src/gpu/cl/kernels/ClWinogradOutputTransformKernel.cpp",
290 "src/gpu/cl/kernels/ClIm2ColKernel.cpp",
291 "src/gpu/cl/kernels/ClCol2ImKernel.cpp",
292 "src/gpu/cl/operators/ClConv2d.cpp",
293 "src/gpu/cl/operators/ClDirectConv2d.cpp",
294 "src/gpu/cl/operators/ClGemmConv2d.cpp",
295 "src/gpu/cl/operators/ClWinogradConv2d.cpp",
296 "src/gpu/cl/kernels/ClWeightsReshapeKernel.cpp",
297 "src/runtime/CL/functions/CLConvolutionLayer.cpp",
298 "src/runtime/CL/functions/CLDirectConvolutionLayer.cpp",
299 "src/runtime/CL/functions/CLFFTConvolutionLayer.cpp",
300 "src/runtime/CL/functions/CLGEMMConvolutionLayer.cpp",
301 "src/runtime/CL/functions/CLWinogradConvolutionLayer.cpp"
302 ]
303 }
304 },
Giorgio Arena273c28c2021-10-14 15:59:15 +0100305 "Conv3d": {
306 "files": {
307 "common": [
308 "src/gpu/cl/kernels/ClDirectConv3dKernel.cpp",
309 "src/gpu/cl/operators/ClDirectConv3d.cpp",
310 "src/runtime/CL/functions/CLConv3D.cpp"
311 ]
312 }
313 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100314 "Copy": {
315 "files": {
316 "common": [
317 "src/gpu/cl/kernels/ClCopyKernel.cpp",
318 "src/gpu/cl/operators/ClCopy.cpp",
319 "src/runtime/CL/functions/CLCopy.cpp"
320 ]
321 }
322 },
323 "CropResize": {
324 "deps": [ "Copy", "Fill", "Scale" ],
325 "files": {
326 "common": [
327 "src/gpu/cl/kernels/ClCropKernel.cpp",
328 "src/gpu/cl/operators/ClCrop.cpp",
329 "src/runtime/CL/functions/CLCrop.cpp",
330 "src/runtime/CL/functions/CLCropResize.cpp"
331 ]
332 }
333 },
334 "Deconv2d": {
335 "deps": [ "Conv2d", "Reverse", "Transpose"],
336 "files": {
337 "common": [
338 "src/core/CL/kernels/CLDeconvolutionLayerUpsampleKernel.cpp",
339 "src/core/CL/kernels/CLDeconvolutionReshapeOutputKernel.cpp",
340 "src/runtime/CL/functions/CLDeconvolutionLayer.cpp",
341 "src/runtime/CL/functions/CLDeconvolutionLayerUpsample.cpp",
342 "src/runtime/CL/functions/CLDirectDeconvolutionLayer.cpp",
343 "src/runtime/CL/functions/CLGEMMDeconvolutionLayer.cpp"
344 ]
345 }
346 },
347 "DepthConvert": {
348 "deps": [ "Cast"],
349 "files": {
350 "common": [ "src/runtime/CL/functions/CLDepthConvertLayer.cpp" ]
351 }
352 },
353 "DepthToSpace": {
354 "files": {
355 "common": [
356 "src/core/CL/kernels/CLDepthToSpaceLayerKernel.cpp",
357 "src/runtime/CL/functions/CLDepthToSpaceLayer.cpp"
358 ]
359 }
360 },
361 "DepthwiseConv2d": {
362 "deps": [ "Permute" ],
363 "files": {
364 "common": [
365 "src/core/CL/kernels/CLDepthwiseConvolutionLayerNativeKernel.cpp",
366 "src/runtime/CL/functions/CLDepthwiseConvolutionLayer.cpp"
367 ]
368 }
369 },
370 "Dequantize": {
371 "files": {
372 "common": [
373 "src/gpu/cl/kernels/ClDequantizeKernel.cpp",
374 "src/gpu/cl/operators/ClDequantize.cpp",
375 "src/runtime/CL/functions/CLDequantizationLayer.cpp"
376 ]
377 }
378 },
379 "ElementwiseBinary": {
380 "deps": ["Add", "Sub"],
381 "files": {
382 "common": [
383 "src/gpu/cl/kernels/ClElementwiseKernel.cpp",
384 "src/gpu/cl/operators/ClElementwiseOperations.cpp",
385 "src/runtime/CL/functions/CLElementwiseOperations.cpp"
386 ]
387 }
388 },
389 "ElementwiseUnary":{
390 "files": {
391 "common": [
392 "src/gpu/cl/kernels/ClElementwiseUnaryKernel.cpp",
393 "src/gpu/cl/operators/ClElementwiseUnary.cpp",
394 "src/runtime/CL/functions/CLElementwiseUnaryLayer.cpp"
395 ]
396 }
397 },
398 "FFT1D": {
399 "files": {
400 "common": [
401 "src/core/CL/kernels/CLFFTDigitReverseKernel.cpp",
402 "src/core/CL/kernels/CLFFTRadixStageKernel.cpp",
403 "src/core/CL/kernels/CLFFTScaleKernel.cpp",
404 "src/runtime/CL/functions/CLFFT1D.cpp"
405 ]
406 }
407 },
408 "FFT2D": {
409 "deps": [ "FFT1D" ],
410 "files": {
411 "common": [ "src/runtime/CL/functions/CLFFT2D.cpp" ]
412 }
413 },
414 "Fill": {
415 "files": {
416 "common": [
417 "src/gpu/cl/kernels/ClFillKernel.cpp",
418 "src/gpu/cl/operators/ClFill.cpp",
419 "src/runtime/CL/functions/CLFill.cpp"
420 ]
421 }
422 },
423 "Flatten": {
424 "files": {
425 "common": [
426 "src/gpu/cl/operators/ClFlatten.cpp",
427 "src/runtime/CL/functions/CLFlattenLayer.cpp"
428 ]
429 }
430 },
431 "Floor": {
432 "files": {
433 "common": [
434 "src/gpu/cl/kernels/ClFloorKernel.cpp",
435 "src/gpu/cl/operators/ClFloor.cpp",
436 "src/runtime/CL/functions/CLFloor.cpp"
437 ]
438 }
439 },
440 "FullyConnected": {
441 "deps": [ "Flatten", "Gemm", "Transpose"],
442 "files": {
443 "common": [
444 "src/gpu/cl/kernels/ClConvertFullyConnectedWeightsKernel.cpp",
445 "src/gpu/cl/operators/ClConvertFullyConnectedWeights.cpp",
446 "src/gpu/cl/operators/ClFullyConnected.cpp",
447 "src/runtime/CL/functions/CLConvertFullyConnectedWeights.cpp",
448 "src/runtime/CL/functions/CLFullyConnectedLayer.cpp"
449 ]
450 }
451 },
452 "Gather": {
453 "files": {
454 "common": [
455 "src/core/CL/kernels/CLGatherKernel.cpp",
456 "src/runtime/CL/functions/CLGather.cpp"]
457 }
458 },
459 "Gemm": {
460 "deps": [ "Cast" ],
461 "files": {
462 "common": [
463 "src/gpu/cl/kernels/gemm/ClGemmHelpers.cpp",
464 "src/gpu/cl/kernels/gemm/native/ClGemmDefaultConfigNativeBifrost.cpp",
465 "src/gpu/cl/kernels/gemm/native/ClGemmDefaultConfigNativeMidgard.cpp",
466 "src/gpu/cl/kernels/gemm/native/ClGemmDefaultConfigNativeValhall.cpp",
467 "src/gpu/cl/kernels/gemm/reshaped/ClGemmDefaultConfigReshapedBifrost.cpp",
468 "src/gpu/cl/kernels/gemm/reshaped/ClGemmDefaultConfigReshapedValhall.cpp",
469 "src/gpu/cl/kernels/gemm/reshaped_only_rhs/ClGemmDefaultConfigReshapedRhsOnlyBifrost.cpp",
470 "src/gpu/cl/kernels/gemm/reshaped_only_rhs/ClGemmDefaultConfigReshapedRhsOnlyValhall.cpp",
471 "src/gpu/cl/kernels/ClGemmLowpMatrixMultiplyNativeKernel.cpp",
472 "src/gpu/cl/kernels/ClGemmLowpMatrixMultiplyReshapedKernel.cpp",
473 "src/gpu/cl/kernels/ClGemmLowpMatrixMultiplyReshapedOnlyRhsKernel.cpp",
474 "src/gpu/cl/kernels/ClGemmLowpOffsetContributionKernel.cpp",
475 "src/gpu/cl/kernels/ClGemmLowpOffsetContributionOutputStageKernel.cpp",
476 "src/gpu/cl/kernels/ClGemmLowpQuantizeDownInt32ScaleByFixedPointKernel.cpp",
477 "src/gpu/cl/kernels/ClGemmLowpQuantizeDownInt32ScaleByFloatKernel.cpp",
478 "src/gpu/cl/kernels/ClGemmLowpQuantizeDownInt32ScaleKernel.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100479 "src/gpu/cl/kernels/ClGemmMatrixMultiplyNativeKernel.cpp",
480 "src/gpu/cl/kernels/ClGemmMatrixMultiplyReshapedKernel.cpp",
481 "src/gpu/cl/kernels/ClGemmMatrixMultiplyReshapedOnlyRhsKernel.cpp",
482 "src/gpu/cl/kernels/ClGemmReshapeLhsMatrixKernel.cpp",
483 "src/gpu/cl/kernels/ClGemmReshapeRhsMatrixKernel.cpp",
484 "src/gpu/cl/kernels/ClGemmLowpReductionKernel.cpp",
485 "src/gpu/cl/operators/ClGemm.cpp",
486 "src/gpu/cl/operators/ClGemmLowpMatrixMultiplyCore.cpp",
487 "src/gpu/cl/operators/ClGemmLowpOutputStage.cpp",
488 "src/runtime/CL/gemm/CLGEMMDefaultTypeBifrost.cpp",
489 "src/runtime/CL/gemm/CLGEMMDefaultTypeMidgard.cpp",
490 "src/runtime/CL/gemm/CLGEMMDefaultTypeValhall.cpp",
491 "src/runtime/CL/gemm_auto_heuristics/CLGEMMAutoHeuristics.cpp",
492 "src/runtime/CL/functions/CLGEMM.cpp",
493 "src/runtime/CL/functions/CLGEMMLowpMatrixMultiplyCore.cpp",
494 "src/runtime/CL/functions/CLGEMMLowpOutputStage.cpp"
495 ]
496 }
497 },
498 "GenerateProposals": {
499 "deps": [ "BoundingBoxTransform", "Dequantize", "Pad", "Permute", "Quantize", "Reshape" ],
500 "files": {
501 "common": [
502 "src/core/CL/kernels/CLGenerateProposalsLayerKernel.cpp",
503 "src/runtime/CL/functions/CLGenerateProposalsLayer.cpp"
504 ]
505 }
506 },
507 "InstanceNormalize": {
508 "files": {
509 "common": [
510 "src/core/CL/kernels/CLInstanceNormalizationLayerKernel.cpp",
511 "src/runtime/CL/functions/CLInstanceNormalizationLayer.cpp"
512 ]
513 }
514 },
515 "L2Normalize": {
516 "deps": [ "Reduction" ],
517 "files": {
518 "common": [
519 "src/core/CL/kernels/CLL2NormalizeLayerKernel.cpp",
520 "src/runtime/CL/functions/CLL2NormalizeLayer.cpp"
521 ]
522 }
523 },
524 "Logical": {
525 "files": {
526 "common": [
527 "src/gpu/cl/operators/ClLogicalNot.cpp",
528 "src/runtime/CL/functions/CLLogicalAnd.cpp",
529 "src/runtime/CL/functions/CLLogicalNot.cpp",
530 "src/runtime/CL/functions/CLLogicalOr.cpp"
531 ]
532 }
533 },
534 "LSTM": {
535 "deps": [
536 "Activation",
537 "Concatenate",
538 "Copy",
539 "Dequantize",
540 "ElementwiseBinary",
541 "Fill",
542 "FullyConnected",
543 "Gemm",
544 "MeanStdDevNormalize",
545 "Mul",
546 "Quantize",
547 "Slice",
548 "Transpose"
549 ],
550 "files": {
551 "common": [
552 "src/core/CL/kernels/CLQLSTMLayerNormalizationKernel.cpp",
553 "src/runtime/CL/functions/CLQLSTMLayer.cpp",
554 "src/runtime/CL/functions/CLLSTMLayer.cpp",
555 "src/runtime/CL/functions/CLLSTMLayerQuantized.cpp"
556 ]
557 }
558 },
559 "MaxUnpool2d": {
560 "deps": [ "Fill" ],
561 "files": {
562 "common": [
563 "src/core/CL/kernels/CLMaxUnpoolingLayerKernel.cpp",
564 "src/runtime/CL/functions/CLMaxUnpoolingLayer.cpp"
565 ]
566 }
567 },
568 "MeanStdDevNormalize": {
569 "deps": [ "Reduction" ],
570 "files": {
571 "common": [
572 "src/core/CL/kernels/CLMeanStdDevNormalizationKernel.cpp",
573 "src/runtime/CL/functions/CLMeanStdDevNormalizationLayer.cpp",
574 "src/runtime/CL/functions/CLReduceMean.cpp"
575 ]
576 }
577 },
578 "Mul": {
579 "files": {
580 "common": [
581 "src/gpu/cl/kernels/ClMulKernel.cpp",
582 "src/gpu/cl/operators/ClMul.cpp",
583 "src/runtime/CL/functions/CLPixelWiseMultiplication.cpp"
584 ]
585 }
586 },
587 "Normalize": {
588 "files": {
589 "common": [
590 "src/core/CL/kernels/CLNormalizationLayerKernel.cpp",
591 "src/runtime/CL/functions/CLNormalizationLayer.cpp"
592 ]
593 }
594 },
595 "Pad": {
596 "deps": [ "Copy" ],
597 "files": {
598 "common": [
599 "src/core/CL/kernels/CLPadLayerKernel.cpp",
600 "src/runtime/CL/functions/CLPadLayer.cpp"
601 ]
602 }
603 },
604 "Permute": {
605 "files": {
606 "common": [
607 "src/gpu/cl/kernels/ClPermuteKernel.cpp",
608 "src/gpu/cl/operators/ClPermute.cpp",
609 "src/runtime/CL/functions/CLPermute.cpp"
610 ]
611 }
612 },
613 "Pool2d": {
614 "files": {
615 "common": [
616 "src/gpu/cl/kernels/ClPool2dKernel.cpp",
617 "src/gpu/cl/operators/ClPool2d.cpp",
618 "src/runtime/CL/functions/CLPoolingLayer.cpp"
619 ]
620 }
621 },
622 "PRelu": {
623 "deps": [ "ElementwiseBinary" ],
624 "files": {
625 "common": [
626 "src/gpu/cl/operators/ClPRelu.cpp",
627 "src/runtime/CL/functions/CLPReluLayer.cpp"
628 ]
629 }
630 },
631 "PriorBox": {
632 "files": {
633 "common": [
634 "src/core/CL/kernels/CLPriorBoxLayerKernel.cpp",
635 "src/runtime/CL/functions/CLPriorBoxLayer.cpp"
636 ]
637 }
638 },
639 "Quantize": {
640 "files": {
641 "common": [
642 "src/gpu/cl/kernels/ClQuantizeKernel.cpp",
643 "src/gpu/cl/operators/ClQuantize.cpp",
644 "src/runtime/CL/functions/CLQuantizationLayer.cpp"
645 ]
646 }
647 },
648 "Range": {
649 "files": {
650 "common": [
651 "src/core/CL/kernels/CLRangeKernel.cpp",
652 "src/runtime/CL/functions/CLRange.cpp"
653 ]
654 }
655 },
656 "Reduction": {
657 "deps": [ "Reshape" ],
658 "files": {
659 "common": [
660 "src/core/CL/kernels/CLReductionOperationKernel.cpp",
661 "src/runtime/CL/functions/CLReductionOperation.cpp"
662 ]
663 }
664 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100665 "Reorg": {
666 "files": {
667 "common": [
668 "src/core/CL/kernels/CLReorgLayerKernel.cpp",
669 "src/runtime/CL/functions/CLReorgLayer.cpp"
670 ]
671 }
672 },
673 "Reshape": {
674 "files": {
675 "common": [
676 "src/gpu/cl/kernels/ClReshapeKernel.cpp",
677 "src/gpu/cl/operators/ClReshape.cpp",
678 "src/runtime/CL/functions/CLReshapeLayer.cpp"
679 ]
680 }
681 },
682 "Reverse": {
683 "files": {
684 "common": [
685 "src/core/CL/kernels/CLReverseKernel.cpp",
686 "src/runtime/CL/functions/CLReverse.cpp"
687 ]
688 }
689 },
690 "RNN": {
691 "deps": [ "Activation", "Cast", "ElementwiseBinary", "FullyConnected", "Gemm"],
692 "files": {
693 "common": [ "src/runtime/CL/functions/CLRNNLayer.cpp" ]
694 }
695 },
696 "ROIAlign": {
697 "files": {
698 "common": [
699 "src/core/CL/kernels/CLROIAlignLayerKernel.cpp",
700 "src/runtime/CL/functions/CLROIAlignLayer.cpp"
701 ]
702 }
703 },
704 "ROIPool2d": {
705 "files": {
706 "common": [
707 "src/core/CL/kernels/CLROIPoolingLayerKernel.cpp",
708 "src/runtime/CL/functions/CLROIPoolingLayer.cpp"
709 ]
710 }
711 },
712 "Scale": {
713 "files": {
714 "common": [
715 "src/gpu/cl/kernels/ClScaleKernel.cpp",
716 "src/gpu/cl/operators/ClScale.cpp",
717 "src/runtime/CL/functions/CLScale.cpp"
718 ]
719 }
720 },
721 "Select": {
722 "files": {
723 "common": [
724 "src/core/CL/kernels/CLSelectKernel.cpp",
725 "src/runtime/CL/functions/CLSelect.cpp"
726 ]
727 }
728 },
729 "Slice": {
730 "deps": [ "StridedSlice" ],
731 "files": {
732 "common": [ "src/runtime/CL/functions/CLSlice.cpp" ]
733 }
734 },
735 "Softmax": {
736 "deps": [ "Permute" ],
737 "files": {
738 "common": [
739 "src/gpu/cl/kernels/ClSoftmaxKernel.cpp",
740 "src/gpu/cl/operators/ClSoftmax.cpp",
741 "src/runtime/CL/functions/CLSoftmaxLayer.cpp"
742 ]
743 }
744 },
745 "SpaceToBatch": {
746 "files": {
747 "common": [
748 "src/core/CL/kernels/CLSpaceToBatchLayerKernel.cpp",
749 "src/runtime/CL/functions/CLSpaceToBatchLayer.cpp"
750 ]
751 }
752 },
753 "SpaceToDepth": {
754 "files": {
755 "common": [
756 "src/core/CL/kernels/CLSpaceToDepthLayerKernel.cpp",
757 "src/runtime/CL/functions/CLSpaceToDepthLayer.cpp"
758 ]
759 }
760 },
761 "Split": {
762 "deps": [ "StridedSlice" ],
763 "files": {
764 "common": [ "src/runtime/CL/functions/CLSplit.cpp" ]
765 }
766 },
767 "Stack": {
768 "files": {
769 "common": [
770 "src/core/CL/kernels/CLStackLayerKernel.cpp",
771 "src/runtime/CL/functions/CLStackLayer.cpp"
772 ]
773 }
774 },
775 "StridedSlice": {
776 "files": {
777 "common": [
778 "src/core/CL/kernels/CLStridedSliceKernel.cpp",
779 "src/runtime/CL/functions/CLStridedSlice.cpp"
780 ]
781 }
782 },
783 "Sub": {
784 "files": {
785 "common": [
786 "src/gpu/cl/kernels/ClElementwiseKernel.cpp",
787 "src/gpu/cl/operators/ClSub.cpp"
788 ]
789 }
790 },
791 "Tile": {
792 "files": {
793 "common": [
794 "src/core/CL/kernels/CLTileKernel.cpp",
795 "src/runtime/CL/functions/CLTile.cpp"
796 ]
797 }
798 },
799 "Transpose": {
800 "files": {
801 "common": [
802 "src/gpu/cl/kernels/ClTransposeKernel.cpp",
803 "src/gpu/cl/operators/ClTranspose.cpp",
804 "src/runtime/CL/functions/CLTranspose.cpp"
805 ]
806 }
807 },
808 "Unstack": {
809 "deps": [ "StridedSlice" ],
810 "files": {
811 "common": [ "src/runtime/CL/functions/CLUnstack.cpp" ]
812 }
813 },
814 "YUVNormalize": {
815 "files": {
816 "common": [
817 "src/core/CL/kernels/CLNormalizePlanarYUVLayerKernel.cpp",
818 "src/runtime/CL/functions/CLNormalizePlanarYUVLayer.cpp"
819 ]
Michalis Spyrou20fca522021-06-07 14:23:57 +0100820 }
Georgios Pinitasbdcdc392021-04-22 16:42:03 +0100821 }
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100822 }
823},
Michalis Spyrou20fca522021-06-07 14:23:57 +0100824 "cpu": {
Georgios Pinitas13ef1762021-07-14 17:14:43 +0100825 "common": [
Michalis Spyrou20fca522021-06-07 14:23:57 +0100826 "src/cpu/CpuContext.cpp",
827 "src/cpu/CpuQueue.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100828 "src/cpu/CpuTensor.cpp",
829 "src/core/NEON/kernels/NEFillBorderKernel.cpp",
830 "src/runtime/NEON/INEOperator.cpp",
831 "src/runtime/NEON/INESimpleFunction.cpp",
832 "src/runtime/NEON/INESimpleFunctionNoBorder.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +0100833 ],
834 "operators": {
835 "Activation": {
836 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100837 "common": [
838 "src/cpu/operators/CpuActivation.cpp",
839 "src/cpu/kernels/CpuActivationKernel.cpp",
Dana Zlotnika538ae52022-02-21 13:12:41 +0200840 "src/runtime/NEON/functions/NEActivationLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +0100841 ],
Michalis Spyrou20fca522021-06-07 14:23:57 +0100842 "neon": {
Dana Zlotnik32291712021-11-25 09:58:27 +0200843 "fp16": [ "src/cpu/kernels/activation/generic/neon/fp16.cpp" ],
Dana Zlotnika538ae52022-02-21 13:12:41 +0200844 "fp32": [ "src/cpu/kernels/activation/generic/neon/fp32.cpp" ],
845 "qasymm8": [ "src/cpu/kernels/activation/generic/neon/qasymm8.cpp" ],
846 "qasymm8_signed": [ "src/cpu/kernels/activation/generic/neon/qasymm8_signed.cpp" ],
847 "qsymm16": [ "src/cpu/kernels/activation/generic/neon/qsymm16.cpp" ]
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100848 },
849 "sve": {
Dana Zlotnik32291712021-11-25 09:58:27 +0200850 "fp16": [ "src/cpu/kernels/activation/generic/sve/fp16.cpp" ],
alerah01c9e519d2022-01-31 19:04:10 +0200851 "fp32": [ "src/cpu/kernels/activation/generic/sve/fp32.cpp" ]
852 },
853 "sve2":{
Dana Zlotnik32291712021-11-25 09:58:27 +0200854 "qasymm8": [ "src/cpu/kernels/activation/generic/sve2/qasymm8.cpp" ],
855 "qasymm8_signed": [ "src/cpu/kernels/activation/generic/sve2/qasymm8_signed.cpp" ],
856 "qsymm16": [ "src/cpu/kernels/activation/generic/sve2/qsymm16.cpp" ]
Michalis Spyrou20fca522021-06-07 14:23:57 +0100857 }
858 }
859 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100860 "ArgMinMax": {
861 "deps": [ "Reduction" ],
862 "files": {
863 "common": [ "src/runtime/NEON/functions/NEArgMinMaxLayer.cpp" ]
864 }
865 },
Michalis Spyrou20fca522021-06-07 14:23:57 +0100866 "Add": {
867 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100868 "common": [
869 "src/cpu/operators/CpuAdd.cpp",
870 "src/cpu/kernels/CpuAddKernel.cpp",
Motti Gondabi9d9ad332022-01-23 12:42:24 +0200871 "src/runtime/NEON/functions/NEArithmeticAddition.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +0100872 ],
Dana Zlotnikbd2942d2021-11-15 08:46:04 +0200873 "neon": {
Motti Gondabi9d9ad332022-01-23 12:42:24 +0200874 "common": ["src/cpu/kernels/add/generic/neon/impl.cpp"],
Dana Zlotnikbd2942d2021-11-15 08:46:04 +0200875 "fp32":["src/cpu/kernels/add/generic/neon/fp32.cpp"],
876 "fp16":["src/cpu/kernels/add/generic/neon/fp16.cpp"],
Motti Gondabi9d9ad332022-01-23 12:42:24 +0200877 "integer":["src/cpu/kernels/add/generic/neon/integer.cpp"],
878 "qasymm8": ["src/cpu/kernels/add/generic/neon/qasymm8.cpp"],
879 "qasymm8_signed": ["src/cpu/kernels/add/generic/neon/qasymm8_signed.cpp"],
880 "qsymm16": ["src/cpu/kernels/add/generic/neon/qsymm16.cpp"]
Dana Zlotnikbd2942d2021-11-15 08:46:04 +0200881 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100882 "sve": {
Dana Zlotnikbd2942d2021-11-15 08:46:04 +0200883 "common": [ "src/cpu/kernels/add/generic/sve/impl.cpp" ],
Dana Zlotnikbd2942d2021-11-15 08:46:04 +0200884 "integer":["src/cpu/kernels/add/generic/sve/integer.cpp"],
Motti Gondabi9d9ad332022-01-23 12:42:24 +0200885 "fp32":["src/cpu/kernels/add/generic/sve/fp32.cpp"],
886 "fp16":["src/cpu/kernels/add/generic/sve/fp16.cpp"]
887 },
888 "sve2": {
Dana Zlotnikbd2942d2021-11-15 08:46:04 +0200889 "qasymm8": [ "src/cpu/kernels/add/generic/sve2/qasymm8.cpp" ],
890 "qasymm8_signed": [ "src/cpu/kernels/add/generic/sve2/qasymm8_signed.cpp" ],
891 "qsymm16": [ "src/cpu/kernels/add/generic/sve2/qsymm16.cpp" ]
Michalis Spyrou20fca522021-06-07 14:23:57 +0100892 }
893 }
894 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100895 "BatchNormalize": {
Michalis Spyrou20fca522021-06-07 14:23:57 +0100896 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100897 "common": [
898 "src/core/NEON/kernels/NEBatchNormalizationLayerKernel.cpp",
899 "src/core/NEON/kernels/NEFuseBatchNormalizationKernel.cpp",
900 "src/runtime/NEON/functions/NEBatchNormalizationLayer.cpp",
901 "src/runtime/NEON/functions/NEFuseBatchNormalization.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +0100902 ],
Michalis Spyrou20fca522021-06-07 14:23:57 +0100903 "neon": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100904 "fp16": [ "src/core/NEON/kernels/batchnormalization/impl/NEON/fp16.cpp" ],
905 "fp32": [ "src/core/NEON/kernels/batchnormalization/impl/NEON/fp32.cpp" ]
906 },
907 "sve": {
908 "fp16": [ "src/core/NEON/kernels/batchnormalization/impl/SVE/fp16.cpp" ],
909 "fp32": [ "src/core/NEON/kernels/batchnormalization/impl/SVE/fp32.cpp" ]
Michalis Spyrou20fca522021-06-07 14:23:57 +0100910 }
911 }
912 },
913 "BatchToSpace": {
914 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100915 "common": [
916 "src/core/NEON/kernels/NEBatchToSpaceLayerKernel.cpp",
917 "src/runtime/NEON/functions/NEBatchToSpaceLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +0100918 ]
919 }
920 },
921 "BitwiseAnd": {
922 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100923 "common": [
924 "src/core/NEON/kernels/NEBitwiseAndKernel.cpp",
925 "src/runtime/NEON/functions/NEBitwiseAnd.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +0100926 ]
927 }
928 },
929 "BitwiseNot": {
930 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100931 "common": [
932 "src/core/NEON/kernels/NEBitwiseNotKernel.cpp",
933 "src/runtime/NEON/functions/NEBitwiseNot.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +0100934 ]
935 }
936 },
937 "BitwiseOr": {
938 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100939 "common": [
940 "src/core/NEON/kernels/NEBitwiseOrKernel.cpp",
941 "src/runtime/NEON/functions/NEBitwiseOr.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +0100942 ]
943 }
944 },
945 "BitwiseXor": {
946 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100947 "common": [
948 "src/core/NEON/kernels/NEBitwiseXorKernel.cpp",
949 "src/runtime/NEON/functions/NEBitwiseXor.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +0100950 ]
951 }
952 },
953 "BoundingBoxTransform": {
954 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100955 "common": [
956 "src/core/NEON/kernels/NEBoundingBoxTransformKernel.cpp",
957 "src/runtime/NEON/functions/NEBoundingBoxTransform.cpp"
Dana Zlotnik3475ffe2022-01-03 14:37:10 +0200958 ],
959 "neon":{
960 "common":["src/cpu/kernels/boundingboxtransform/generic/neon/impl.cpp"],
961 "fp32":["src/cpu/kernels/boundingboxtransform/generic/neon/fp32.cpp"],
962 "fp16":["src/cpu/kernels/boundingboxtransform/generic/neon/fp16.cpp"],
963 "qsymm16":["src/cpu/kernels/boundingboxtransform/generic/neon/qsymm16.cpp"]
Dana Zlotnik3475ffe2022-01-03 14:37:10 +0200964 }
Michalis Spyrou20fca522021-06-07 14:23:57 +0100965 }
966 },
967 "Cast": {
968 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100969 "common": [
970 "src/cpu/operators/CpuCast.cpp",
971 "src/cpu/kernels/CpuCastKernel.cpp",
972 "src/runtime/NEON/functions/NECast.cpp"
973 ]
974 }
975 },
976 "ChannelShuffle": {
977 "files": {
978 "common": [
979 "src/core/NEON/kernels/NEChannelShuffleLayerKernel.cpp",
980 "src/runtime/NEON/functions/NEChannelShuffleLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +0100981 ]
982 }
983 },
984 "Concatenate": {
985 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100986 "common": [
987 "src/cpu/operators/CpuConcatenate.cpp",
Georgios Pinitas7891a732021-08-20 21:39:25 +0100988 "src/cpu/kernels/CpuConcatenateWidthKernel.cpp",
989 "src/cpu/kernels/CpuConcatenateBatchKernel.cpp",
990 "src/cpu/kernels/CpuConcatenateDepthKernel.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100991 "src/cpu/kernels/CpuConcatenateHeightKernel.cpp",
992 "src/runtime/NEON/functions/NEConcatenateLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +0100993 ]
994 }
995 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100996 "Conv2d": {
997 "deps": [
998 "Activation",
999 "ElementwiseBinary",
1000 "FFT2D",
1001 "Gemm",
1002 "Mul",
1003 "Pad",
1004 "Permute",
1005 "Reshape",
1006 "Reverse",
1007 "Slice"
1008 ],
Michalis Spyrou20fca522021-06-07 14:23:57 +01001009 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001010 "common": [
1011 "src/cpu/operators/CpuConv2d.cpp",
1012 "src/cpu/operators/CpuDirectConv2d.cpp",
1013 "src/cpu/operators/CpuGemmDirectConv2d.cpp",
1014 "src/cpu/operators/CpuGemmConv2d.cpp",
1015 "src/cpu/operators/CpuWinogradConv2d.cpp",
1016 "src/cpu/operators/internal/CpuGemmAssemblyDispatch.cpp",
1017 "src/cpu/kernels/CpuDirectConv2dKernel.cpp",
1018 "src/cpu/kernels/CpuDirectConv2dOutputStageKernel.cpp",
1019 "src/cpu/kernels/CpuWinogradConv2dKernel.cpp",
1020 "src/cpu/kernels/CpuCol2ImKernel.cpp",
1021 "src/cpu/kernels/CpuIm2ColKernel.cpp",
1022 "src/cpu/kernels/CpuWeightsReshapeKernel.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001023 "src/runtime/NEON/functions/NEConvolutionLayer.cpp",
1024 "src/runtime/NEON/functions/NEDirectConvolutionLayer.cpp",
1025 "src/runtime/NEON/functions/NEFFTConvolutionLayer.cpp",
1026 "src/runtime/NEON/functions/NEGEMMConv2d.cpp",
1027 "src/runtime/NEON/functions/NEGEMMConvolutionLayer.cpp",
1028 "src/runtime/NEON/functions/NEWinogradConvolutionLayer.cpp"
Motti Gondabi9d9ad332022-01-23 12:42:24 +02001029 ],
1030 "neon": {
1031 "common": [
1032 "src/core/NEON/kernels/convolution/common/padding.cpp",
1033 "src/core/NEON/kernels/convolution/common/qasymm8.cpp",
1034 "src/core/NEON/kernels/convolution/common/qsymm8.cpp",
1035 "src/core/NEON/kernels/convolution/common/utils.cpp",
1036 "src/core/NEON/kernels/convolution/winograd/padding.cpp",
1037 "src/core/NEON/kernels/convolution/winograd/winograd.cpp",
1038 "src/core/NEON/kernels/convolution/winograd/winograd_transforms/input_1x8_fp32_fp32_integers.cpp",
1039 "src/core/NEON/kernels/convolution/winograd/winograd_transforms/input_4x4_fp16_fp16_integers.cpp",
1040 "src/core/NEON/kernels/convolution/winograd/winograd_transforms/input_4x4_fp32_fp32_integers.cpp",
1041 "src/core/NEON/kernels/convolution/winograd/winograd_transforms/input_6x6_fp16_fp16_integers.cpp",
1042 "src/core/NEON/kernels/convolution/winograd/winograd_transforms/input_6x6_fp32_fp32_integers.cpp",
1043 "src/core/NEON/kernels/convolution/winograd/winograd_transforms/output_2_7_fp32_fp32_integers.cpp",
1044 "src/core/NEON/kernels/convolution/winograd/winograd_transforms/output_2x2_3x3_fp32_fp32_integers.cpp",
1045 "src/core/NEON/kernels/convolution/winograd/winograd_transforms/output_2x2_5x5_fp32_fp32_integers.cpp",
1046 "src/core/NEON/kernels/convolution/winograd/winograd_transforms/output_4_5_fp32_fp32_integers.cpp",
1047 "src/core/NEON/kernels/convolution/winograd/winograd_transforms/output_4x4_3x3_fp16_fp16_integers.cpp",
1048 "src/core/NEON/kernels/convolution/winograd/winograd_transforms/output_4x4_3x3_fp32_fp32_integers.cpp",
1049 "src/core/NEON/kernels/convolution/winograd/winograd_transforms/output_6_3_fp32_fp32_integers.cpp",
1050 "src/core/NEON/kernels/convolution/winograd/winograd_transforms/weights_2_7_fp32_fp32_integers.cpp",
1051 "src/core/NEON/kernels/convolution/winograd/winograd_transforms/weights_2x2_3x3_fp32_fp32_integers.cpp",
1052 "src/core/NEON/kernels/convolution/winograd/winograd_transforms/weights_2x2_5x5_fp32_fp32_integers.cpp",
1053 "src/core/NEON/kernels/convolution/winograd/winograd_transforms/weights_4_5_fp32_fp32_integers.cpp",
1054 "src/core/NEON/kernels/convolution/winograd/winograd_transforms/weights_4x4_3x3_fp16_fp16_integers.cpp",
1055 "src/core/NEON/kernels/convolution/winograd/winograd_transforms/weights_4x4_3x3_fp32_fp32_integers.cpp",
alerah01c9e519d2022-01-31 19:04:10 +02001056 "src/core/NEON/kernels/convolution/winograd/winograd_transforms/weights_6_3_fp32_fp32_integers.cpp",
1057 "src/cpu/kernels/directconv2d/nhwc/neon/impl.cpp",
1058 "src/cpu/kernels/directconv2d/nchw/all.cpp"
1059 ],
1060 "fp32": [
1061 "src/cpu/kernels/directconv2d/nhwc/neon/fp32.cpp"
Motti Gondabi9d9ad332022-01-23 12:42:24 +02001062 ]
1063 }
Michalis Spyroub55f8e82021-07-22 11:23:11 +01001064 }
1065 },
Michalis Spyrou20fca522021-06-07 14:23:57 +01001066 "Copy": {
1067 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001068 "common": [
1069 "src/cpu/operators/CpuCopy.cpp",
1070 "src/cpu/kernels/CpuCopyKernel.cpp",
1071 "src/runtime/NEON/functions/NECopy.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001072 ]
1073 }
1074 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001075 "CropResize": {
1076 "deps": [ "Scale" ],
Michalis Spyrou20fca522021-06-07 14:23:57 +01001077 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001078 "common": [
1079 "src/core/NEON/kernels/NECropKernel.cpp",
1080 "src/runtime/NEON/functions/NECropResize.cpp"
alerah0127619932021-11-24 17:21:43 +02001081 ],
1082 "neon": {
1083 "common": [ "src/cpu/kernels/crop/generic/neon/impl.cpp" ],
1084 "fp32": [ "src/cpu/kernels/crop/generic/neon/fp32.cpp" ],
1085 "fp16": [ "src/cpu/kernels/crop/generic/neon/fp16.cpp" ],
1086 "integer": [ "src/cpu/kernels/crop/generic/neon/integer.cpp" ]
Motti Gondabi9d9ad332022-01-23 12:42:24 +02001087 }
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001088 }
1089 },
1090 "Deconv2d": {
1091 "deps": [ "Conv2d", "Reverse", "Transpose"],
1092 "files": {
1093 "common": [
1094 "src/runtime/NEON/functions/NEDeconvolutionLayer.cpp"
1095 ]
1096 }
1097 },
1098 "DepthConvert": {
1099 "deps": [ "Cast"],
1100 "files": {
1101 "common": [
1102 "src/runtime/NEON/functions/NEDepthConvertLayer.cpp"
1103 ]
1104 }
1105 },
1106 "DepthToSpace": {
1107 "files": {
1108 "common": [
1109 "src/core/NEON/kernels/NEDepthToSpaceLayerKernel.cpp",
1110 "src/runtime/NEON/functions/NEDepthToSpaceLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001111 ]
1112 }
1113 },
1114 "DepthwiseConv2d": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001115 "deps": [ "Activation", "Permute" ],
Michalis Spyrou20fca522021-06-07 14:23:57 +01001116 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001117 "common": [
Georgios Pinitas7891a732021-08-20 21:39:25 +01001118 "src/cpu/operators/CpuDepthwiseConv2d.cpp",
1119 "src/cpu/operators/CpuDepthwiseConv2dAssemblyDispatch.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001120 "src/cpu/kernels/CpuDepthwiseConv2dNativeKernel.cpp",
1121 "src/cpu/kernels/internal/CpuDepthwiseConv2dAssemblyWrapperKernel.cpp",
Motti Gondabi9d9ad332022-01-23 12:42:24 +02001122 "src/runtime/NEON/functions/NEDepthwiseConvolutionLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001123 ],
Motti Gondabi9d9ad332022-01-23 12:42:24 +02001124 "neon": {
1125 "common": [
1126 "src/core/NEON/kernels/convolution/common/padding.cpp",
1127 "src/core/NEON/kernels/convolution/common/qasymm8.cpp",
1128 "src/core/NEON/kernels/convolution/common/qsymm8.cpp",
1129 "src/core/NEON/kernels/convolution/common/utils.cpp",
1130 "src/core/NEON/kernels/arm_conv/depthwise/depthwise_fp16.cpp",
1131 "src/core/NEON/kernels/arm_conv/depthwise/depthwise_u8q.cpp",
1132 "src/core/NEON/kernels/arm_conv/depthwise/depthwise_u8s8u8q.cpp",
1133 "src/core/NEON/kernels/arm_conv/depthwise/interleaves/8b_mla.cpp",
1134 "src/core/NEON/kernels/arm_conv/depthwise/depthwise_s8q.cpp",
1135 "src/core/NEON/kernels/arm_conv/depthwise/depthwise_fp32.cpp",
1136 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_packed_to_nhwc_generic_with_multiplier_output2x8_mla_depthfirst/generic.cpp",
1137 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_packed_to_nhwc_3x3_s2_with_multiplier_output3x3_mla_depthfirst/generic.cpp",
1138 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_packed_to_nhwc_5x5_s1_with_multiplier_output2x4_mla_depthfirst/generic.cpp",
1139 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_packed_to_nhwc_generic_with_multiplier_output2x8_mla_depthfirst/generic.cpp",
1140 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_s8q_packed_to_nhwc_3x3_s2_with_multiplier_output2x4_dot_depthfirst/generic.cpp",
1141 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_s8q_packed_to_nhwc_5x5_s1_with_multiplier_output4x2_dot_depthfirst/generic.cpp",
1142 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_s8q_packed_to_nhwc_generic_with_multiplier_output2x8_mla_depthfirst/generic.cpp",
1143 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8q_packed_to_nhwc_3x3_s2_with_multiplier_output2x4_dot_depthfirst/generic.cpp",
1144 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8q_packed_to_nhwc_5x5_s1_with_multiplier_output4x2_dot_depthfirst/generic.cpp",
1145 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8q_packed_to_nhwc_generic_with_multiplier_output2x8_mla_depthfirst/generic.cpp",
1146 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8s8u8q_packed_to_nhwc_generic_with_multiplier_output2x8_mla_depthfirst/generic.cpp",
1147 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_nhwc_3x3_s1_output2x2_mla_depthfirst/generic_direct.cpp",
1148 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_nhwc_3x3_s1_output2x2_mla_depthfirst/generic_indirect.cpp",
1149 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_nhwc_3x3_s1_output3x3_mla_depthfirst/generic_direct.cpp",
1150 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_nhwc_3x3_s1_output3x3_mla_depthfirst/generic_indirect.cpp",
1151 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_nhwc_3x3_s1_output4x4_mla_depthfirst/generic_direct.cpp",
1152 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_nhwc_3x3_s1_output4x4_mla_depthfirst/generic_indirect.cpp",
1153 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_nhwc_3x3_s2_output2x2_mla_depthfirst/generic_direct.cpp",
1154 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_nhwc_3x3_s2_output2x2_mla_depthfirst/generic_indirect.cpp",
1155 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_nhwc_5x5_s1_output2x2_mla_depthfirst/generic_direct.cpp",
1156 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_nhwc_5x5_s1_output2x2_mla_depthfirst/generic_indirect.cpp",
1157 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_nhwc_generic_output9_mla_depthfirst/generic.cpp",
1158 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_nhwc_3x3_s1_output2x2_mla_depthfirst/generic_direct.cpp",
1159 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_nhwc_3x3_s1_output2x2_mla_depthfirst/generic_indirect.cpp",
1160 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_nhwc_3x3_s1_output3x3_mla_depthfirst/generic_direct.cpp",
1161 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_nhwc_3x3_s1_output3x3_mla_depthfirst/generic_indirect.cpp",
1162 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_nhwc_3x3_s1_output4x4_mla_depthfirst/generic_direct.cpp",
1163 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_nhwc_3x3_s1_output4x4_mla_depthfirst/generic_indirect.cpp",
1164 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_nhwc_3x3_s2_output2x2_mla_depthfirst/generic_direct.cpp",
1165 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_nhwc_3x3_s2_output2x2_mla_depthfirst/generic_indirect.cpp",
1166 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_nhwc_5x5_s1_output2x2_mla_depthfirst/generic_direct.cpp",
1167 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_nhwc_5x5_s1_output2x2_mla_depthfirst/generic_indirect.cpp",
1168 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_nhwc_generic_output9_mla_depthfirst/generic.cpp",
1169 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_s8q_nhwc_3x3_s1_output2x2_dot_depthfirst/generic.cpp",
1170 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_s8q_nhwc_3x3_s1_output2x2_mla_depthfirst/generic.cpp",
1171 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_s8q_nhwc_3x3_s2_output2x2_mla_depthfirst/generic.cpp",
1172 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_s8q_nhwc_5x5_s1_output2x2_mla_depthfirst/generic.cpp",
1173 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_s8q_nhwc_generic_output9_mla_depthfirst/generic.cpp",
1174 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_s8qs_nhwc_3x3_s1_output2x2_dot_depthfirst/generic.cpp",
1175 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8q_nhwc_3x3_s1_output2x2_dot_depthfirst/generic.cpp",
1176 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8q_nhwc_3x3_s1_output2x2_mla_depthfirst/generic.cpp",
1177 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8q_nhwc_3x3_s2_output2x2_mla_depthfirst/generic.cpp",
1178 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8q_nhwc_5x5_s1_output2x2_mla_depthfirst/generic.cpp",
1179 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8q_nhwc_generic_output9_mla_depthfirst/generic.cpp",
1180 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8s8u8q_nhwc_3x3_s1_output2x2_mla_depthfirst/generic.cpp",
1181 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8s8u8q_nhwc_3x3_s2_output2x2_mla_depthfirst/generic.cpp",
1182 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8s8u8q_nhwc_5x5_s1_output2x2_mla_depthfirst/generic.cpp",
1183 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8s8u8q_nhwc_generic_output9_mla_depthfirst/generic.cpp",
1184 "src/core/NEON/kernels/arm_conv/depthwise/interleaves/a64_s8q_3x3_dot.cpp",
Dana Zlotnikebbae942022-02-03 12:52:15 +02001185 "src/core/NEON/kernels/arm_conv/depthwise/interleaves/a64_u8q_3x3_dot.cpp",
1186 "src/cpu/kernels/depthwiseconv2d/generic/neon/impl.cpp"
1187 ],
1188 "fp16":["src/cpu/kernels/depthwiseconv2d/generic/neon/fp16.cpp"],
1189 "fp32":["src/cpu/kernels/depthwiseconv2d/generic/neon/fp32.cpp"],
1190 "qasymm8":["src/cpu/kernels/depthwiseconv2d/generic/neon/qasymm8.cpp"],
1191 "qasymm8_signed":["src/cpu/kernels/depthwiseconv2d/generic/neon/qasymm8_signed.cpp"]
Motti Gondabi9d9ad332022-01-23 12:42:24 +02001192 },
Michalis Spyrou20fca522021-06-07 14:23:57 +01001193 "sve": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001194 "common": [
Freddie Liardetd216f572021-08-03 15:57:32 +01001195 "src/core/NEON/kernels/arm_conv/depthwise/interleaves/sve_8b_mla.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +01001196 "src/core/NEON/kernels/arm_conv/depthwise/interleaves/sve_s8q_3x3_dot.cpp",
1197 "src/core/NEON/kernels/arm_conv/depthwise/interleaves/sve_u8q_3x3_dot.cpp",
1198 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp16_nhwc_3x3_s1_output2x2_mla_depthfirst/generic_direct.cpp",
1199 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp16_nhwc_3x3_s1_output2x2_mla_depthfirst/generic_indirect.cpp",
1200 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp16_nhwc_3x3_s1_output3x3_mla_depthfirst/generic_direct.cpp",
1201 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp16_nhwc_3x3_s1_output3x3_mla_depthfirst/generic_indirect.cpp",
1202 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp16_nhwc_3x3_s1_output4x4_mla_depthfirst/generic_direct.cpp",
1203 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp16_nhwc_3x3_s1_output4x4_mla_depthfirst/generic_indirect.cpp",
1204 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp16_nhwc_3x3_s2_output2x2_mla_depthfirst/generic_direct.cpp",
1205 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp16_nhwc_3x3_s2_output2x2_mla_depthfirst/generic_indirect.cpp",
1206 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp16_nhwc_5x5_s1_output2x2_mla_depthfirst/generic_direct.cpp",
1207 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp16_nhwc_5x5_s1_output2x2_mla_depthfirst/generic_indirect.cpp",
1208 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_nhwc_3x3_s1_output2x2_mla_depthfirst/generic.cpp",
1209 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_nhwc_3x3_s1_output2x2_mla_depthfirst/generic_direct.cpp",
1210 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_nhwc_3x3_s1_output2x2_mla_depthfirst/generic_indirect.cpp",
1211 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_nhwc_3x3_s1_output2x2_mla_depthfirst_strided/generic.cpp",
1212 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_nhwc_3x3_s1_output3x3_mla_depthfirst/generic_direct.cpp",
1213 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_nhwc_3x3_s1_output3x3_mla_depthfirst/generic_indirect.cpp",
1214 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_nhwc_3x3_s1_output4x4_mla_depthfirst/generic_direct.cpp",
1215 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_nhwc_3x3_s1_output4x4_mla_depthfirst/generic_indirect.cpp",
1216 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_nhwc_3x3_s2_output2x2_mla_depthfirst/generic_direct.cpp",
1217 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_nhwc_3x3_s2_output2x2_mla_depthfirst/generic_indirect.cpp",
1218 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_nhwc_5x5_s1_output2x2_mla_depthfirst/generic_direct.cpp",
1219 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_nhwc_5x5_s1_output2x2_mla_depthfirst/generic_indirect.cpp",
1220 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_nhwc_generic_output9_mla_depthfirst/generic.cpp",
1221 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_packed_to_nhwc_3x3_s2_with_multiplier_output3x3_mla_depthfirst/generic.cpp",
1222 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_packed_to_nhwc_5x5_s1_with_multiplier_output2x4_mla_depthfirst/generic.cpp",
1223 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_packed_to_nhwc_generic_with_multiplier_output2x8_mla_depthfirst/generic.cpp",
1224 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_s8q_nhwc_3x3_s1_output2x2_dot_depthfirst/generic.cpp",
1225 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_s8q_nhwc_3x3_s1_output2x2_mla_depthfirst/generic.cpp",
1226 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_s8q_nhwc_3x3_s2_output2x2_mla_depthfirst/generic.cpp",
1227 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_s8q_nhwc_5x5_s1_output2x2_mla_depthfirst/generic.cpp",
1228 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_s8q_packed_to_nhwc_3x3_s2_with_multiplier_output2x4_dot_depthfirst/generic.cpp",
1229 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_s8q_packed_to_nhwc_5x5_s1_with_multiplier_output4x2_dot_depthfirst/generic.cpp",
1230 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_s8qs_nhwc_3x3_s1_output2x2_dot_depthfirst/generic.cpp",
1231 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_u8q_nhwc_3x3_s1_output2x2_dot_depthfirst/generic.cpp",
1232 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_u8q_nhwc_3x3_s1_output2x2_mla_depthfirst/generic.cpp",
1233 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_u8q_nhwc_3x3_s2_output2x2_mla_depthfirst/generic.cpp",
1234 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_u8q_nhwc_5x5_s1_output2x2_mla_depthfirst/generic.cpp",
1235 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_u8q_packed_to_nhwc_3x3_s2_with_multiplier_output2x4_dot_depthfirst/generic.cpp",
1236 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_u8q_packed_to_nhwc_5x5_s1_with_multiplier_output4x2_dot_depthfirst/generic.cpp",
1237 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_u8s8u8q_nhwc_3x3_s1_output2x2_mla_depthfirst/generic.cpp",
1238 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_u8s8u8q_nhwc_3x3_s2_output2x2_mla_depthfirst/generic.cpp",
Freddie Liardet487d3902021-09-21 12:36:43 +01001239 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_u8s8u8q_nhwc_5x5_s1_output2x2_mla_depthfirst/generic.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001240 ]
1241 }
1242 }
1243 },
Michalis Spyrou20fca522021-06-07 14:23:57 +01001244 "Dequantize": {
1245 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001246 "common": [
1247 "src/cpu/operators/CpuDequantize.cpp",
1248 "src/cpu/kernels/CpuDequantizeKernel.cpp",
1249 "src/runtime/NEON/functions/NEDequantizationLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001250 ]
1251 }
1252 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001253 "DetectionPostProcess": {
1254 "deps": [ "Dequantize" ],
Michalis Spyrou20fca522021-06-07 14:23:57 +01001255 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001256 "common" : [ "src/runtime/NEON/functions/NEDetectionPostProcessLayer.cpp" ]
Michalis Spyrou20fca522021-06-07 14:23:57 +01001257 }
1258 },
Sheri Zhang6d9c9822021-09-24 16:02:57 +01001259 "Conv3d": {
1260 "deps": [
1261 "Activation"
1262 ],
1263 "files": {
1264 "common": [
1265 "src/cpu/operators/CpuDirectConv3d.cpp",
1266 "src/cpu/kernels/CpuDirectConv3dKernel.cpp",
1267 "src/runtime/NEON/functions/NEConv3D.cpp"
1268 ]
1269 }
1270 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001271 "ElementwiseBinary": {
Michalis Spyrou20fca522021-06-07 14:23:57 +01001272 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001273 "common": [
1274 "src/cpu/operators/CpuElementwise.cpp",
1275 "src/cpu/kernels/CpuElementwiseKernel.cpp",
Dana Zlotnik6a2df882022-01-17 09:54:26 +02001276 "src/runtime/NEON/functions/NEElementwiseOperations.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001277 ],
Dana Zlotnikd5c496d2021-11-28 14:46:12 +02001278 "neon":{
1279 "fp32": ["src/cpu/kernels/elementwise_binary/generic/neon/fp32.cpp"],
1280 "fp16": ["src/cpu/kernels/elementwise_binary/generic/neon/fp16.cpp"],
Dana Zlotnik6a2df882022-01-17 09:54:26 +02001281 "integer": ["src/cpu/kernels/elementwise_binary/generic/neon/integer.cpp"],
1282 "qasymm8": ["src/cpu/kernels/elementwise_binary/generic/neon/qasymm8.cpp"],
1283 "qasymm8_signed": ["src/cpu/kernels/elementwise_binary/generic/neon/qasymm8_signed.cpp"]
Dana Zlotnikd5c496d2021-11-28 14:46:12 +02001284 },
Michalis Spyrou20fca522021-06-07 14:23:57 +01001285 "sve": {
Dana Zlotnikd5c496d2021-11-28 14:46:12 +02001286 "common": ["src/cpu/kernels/elementwise_binary/generic/sve/impl.cpp" ],
1287 "integer": ["src/cpu/kernels/elementwise_binary/generic/sve/integer.cpp"],
1288 "fp32": ["src/cpu/kernels/elementwise_binary/generic/sve/fp32.cpp"],
Dana Zlotnik6a2df882022-01-17 09:54:26 +02001289 "fp16": ["src/cpu/kernels/elementwise_binary/generic/sve/fp16.cpp"]
1290
1291 },
1292 "sve2":{
Dana Zlotnikd5c496d2021-11-28 14:46:12 +02001293 "qasymm8": ["src/cpu/kernels/elementwise_binary/generic/sve2/qasymm8.cpp"],
1294 "qasymm8_signed": ["src/cpu/kernels/elementwise_binary/generic/sve2/qasymm8_signed.cpp"]
Michalis Spyrou20fca522021-06-07 14:23:57 +01001295 }
1296 }
1297 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001298 "ElementwiseUnary":{
Michalis Spyrou20fca522021-06-07 14:23:57 +01001299 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001300 "common": [
1301 "src/cpu/operators/CpuElementwiseUnary.cpp",
1302 "src/cpu/kernels/CpuElementwiseUnaryKernel.cpp",
1303 "src/runtime/NEON/functions/NEElementwiseUnaryLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001304 ],
Dana Zlotnikd5c496d2021-11-28 14:46:12 +02001305 "neon": {
Dana Zlotnika538ae52022-02-21 13:12:41 +02001306 "common":["src/cpu/kernels/elementwise_unary/generic/neon/impl.cpp"],
Dana Zlotnikd5c496d2021-11-28 14:46:12 +02001307 "integer": ["src/cpu/kernels/elementwise_unary/generic/neon/integer.cpp"],
1308 "fp32": ["src/cpu/kernels/elementwise_unary/generic/neon/fp32.cpp"],
1309 "fp16": ["src/cpu/kernels/elementwise_unary/generic/neon/fp16.cpp"]
1310 },
Michalis Spyrou20fca522021-06-07 14:23:57 +01001311 "sve": {
Dana Zlotnikd5c496d2021-11-28 14:46:12 +02001312 "common": ["src/cpu/kernels/elementwise_unary/generic/sve/impl.cpp" ],
1313 "integer": ["src/cpu/kernels/elementwise_unary/generic/sve/integer.cpp"],
1314 "fp32": ["src/cpu/kernels/elementwise_unary/generic/sve/fp32.cpp"],
1315 "fp16": ["src/cpu/kernels/elementwise_unary/generic/sve/fp16.cpp"]
Michalis Spyrou20fca522021-06-07 14:23:57 +01001316 }
1317 }
1318 },
1319 "FFT1D": {
Freddie Liardet487d3902021-09-21 12:36:43 +01001320 "deps": [ "Reduction" ],
Michalis Spyrou20fca522021-06-07 14:23:57 +01001321 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001322 "common": [
Michalis Spyrou20fca522021-06-07 14:23:57 +01001323 "src/core/NEON/kernels/NEFFTDigitReverseKernel.cpp",
1324 "src/core/NEON/kernels/NEFFTRadixStageKernel.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001325 "src/core/NEON/kernels/NEFFTScaleKernel.cpp",
1326 "src/runtime/NEON/functions/NEFFT1D.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001327 ]
1328 }
1329 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001330 "FFT2D": {
1331 "deps": [ "FFT1D" ],
Michalis Spyrou20fca522021-06-07 14:23:57 +01001332 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001333 "common": [
1334 "src/runtime/NEON/functions/NEFFT2D.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001335 ]
1336 }
1337 },
1338 "Fill": {
1339 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001340 "common": [
1341 "src/cpu/operators/CpuFill.cpp",
1342 "src/cpu/kernels/CpuFillKernel.cpp",
1343 "src/runtime/NEON/functions/NEFill.cpp"
1344 ]
1345 }
1346 },
1347 "Flatten": {
1348 "deps": [ "Reshape" ],
1349 "files": {
1350 "common": [
1351 "src/cpu/operators/CpuFlatten.cpp",
1352 "src/runtime/NEON/functions/NEFlattenLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001353 ]
1354 }
1355 },
1356 "Floor": {
1357 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001358 "common": [
1359 "src/cpu/operators/CpuFloor.cpp",
1360 "src/cpu/kernels/CpuFloorKernel.cpp",
1361 "src/runtime/NEON/functions/NEFloor.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001362 ],
1363 "neon": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001364 "fp32": [ "src/cpu/kernels/floor/neon/fp32.cpp" ],
1365 "fp16": [ "src/cpu/kernels/floor/neon/fp16.cpp" ]
Michalis Spyrou20fca522021-06-07 14:23:57 +01001366 }
1367 }
1368 },
Michele Di Giorgiod9cdf142021-07-02 15:17:08 +01001369 "FullyConnected": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001370 "deps": [ "Flatten", "Gemm", "Transpose"],
Michele Di Giorgiod9cdf142021-07-02 15:17:08 +01001371 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001372 "common": [
1373 "src/cpu/kernels/CpuConvertFullyConnectedWeightsKernel.cpp",
1374 "src/cpu/operators/CpuConvertFullyConnectedWeights.cpp",
1375 "src/cpu/operators/CpuFullyConnected.cpp",
1376 "src/runtime/NEON/functions/NEConvertFullyConnectedWeights.cpp",
1377 "src/runtime/NEON/functions/NEFullyConnectedLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001378 ]
1379 }
1380 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001381 "Gather": {
Michalis Spyrou20fca522021-06-07 14:23:57 +01001382 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001383 "common": [
1384 "src/core/NEON/kernels/NEGatherKernel.cpp",
1385 "src/runtime/NEON/functions/NEGather.cpp"
1386 ]
1387 }
1388 },
1389 "Gemm": {
Freddie Liardet487d3902021-09-21 12:36:43 +01001390 "deps": [ "Quantize", "Add"],
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001391 "files": {
1392 "common": [
1393 "src/cpu/kernels/CpuConvertQuantizedSignednessKernel.cpp",
Georgios Pinitas7891a732021-08-20 21:39:25 +01001394 "src/cpu/kernels/CpuGemmMatrixAdditionKernel.cpp",
1395 "src/cpu/kernels/CpuGemmMatrixMultiplyKernel.cpp",
1396 "src/cpu/kernels/CpuGemmTranspose1xWKernel.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001397 "src/cpu/kernels/CpuGemmInterleave4x4Kernel.cpp",
Georgios Pinitas7891a732021-08-20 21:39:25 +01001398 "src/cpu/kernels/CpuGemmLowpQuantizeDownInt32ScaleKernel.cpp",
1399 "src/cpu/kernels/CpuGemmLowpQuantizeDownInt32ToInt16ScaleByFixedPointKernel.cpp",
1400 "src/cpu/kernels/CpuGemmLowpQuantizeDownInt32ToInt8ScaleByFixedPointKernel.cpp",
1401 "src/cpu/kernels/CpuGemmLowpQuantizeDownInt32ToUint8ScaleByFixedPointKernel.cpp",
1402 "src/cpu/kernels/CpuGemmLowpMatrixMultiplyKernel.cpp",
1403 "src/cpu/kernels/CpuGemmLowpMatrixReductionKernel.cpp",
1404 "src/cpu/kernels/CpuGemmLowpOffsetContributionOutputStageKernel.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001405 "src/cpu/kernels/CpuGemmLowpOffsetContributionKernel.cpp",
1406 "src/cpu/operators/CpuGemm.cpp",
1407 "src/cpu/operators/CpuGemmLowpOutputStage.cpp",
1408 "src/cpu/operators/CpuGemmLowpMatrixMultiplyCore.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001409 "src/runtime/NEON/functions/NEGEMM.cpp",
1410 "src/runtime/NEON/functions/NEGEMMLowpMatrixMultiplyCore.cpp",
Motti Gondabi9d9ad332022-01-23 12:42:24 +02001411 "src/runtime/NEON/functions/NEGEMMLowpOutputStage.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001412 ],
1413 "neon": {
Motti Gondabi9d9ad332022-01-23 12:42:24 +02001414 "common": [
1415 "src/core/NEON/kernels/arm_gemm/gemm_bf16.cpp",
1416 "src/core/NEON/kernels/arm_gemm/gemm_fp16.cpp",
1417 "src/core/NEON/kernels/arm_gemm/gemm_fp32.cpp",
1418 "src/core/NEON/kernels/arm_gemm/gemm_int16.cpp",
1419 "src/core/NEON/kernels/arm_gemm/gemm_int8.cpp",
1420 "src/core/NEON/kernels/arm_gemm/gemm_qint8.cpp",
1421 "src/core/NEON/kernels/arm_gemm/gemm_quint8.cpp",
1422 "src/core/NEON/kernels/arm_gemm/gemm_uint16.cpp",
1423 "src/core/NEON/kernels/arm_gemm/gemm_uint8.cpp",
1424 "src/core/NEON/kernels/arm_gemm/interleave_indirect.cpp",
1425 "src/core/NEON/kernels/arm_gemm/mergeresults-fp16.cpp",
1426 "src/core/NEON/kernels/arm_gemm/mergeresults.cpp",
1427 "src/core/NEON/kernels/arm_gemm/misc.cpp",
1428 "src/core/NEON/kernels/arm_gemm/quantized.cpp",
1429 "src/core/NEON/kernels/arm_gemm/rowsum_indirect_s8.cpp",
1430 "src/core/NEON/kernels/arm_gemm/rowsum_indirect_u8.cpp",
1431 "src/core/NEON/kernels/arm_gemm/transform.cpp",
1432 "src/core/NEON/kernels/arm_gemm/kernels/a64_gemm_s16_8x12/generic.cpp",
1433 "src/core/NEON/kernels/arm_gemm/kernels/a64_gemm_s8_4x4/generic.cpp",
1434 "src/core/NEON/kernels/arm_gemm/kernels/a64_gemm_s8_8x12/a55r1.cpp",
1435 "src/core/NEON/kernels/arm_gemm/kernels/a64_gemm_s8_8x12/generic.cpp",
1436 "src/core/NEON/kernels/arm_gemm/kernels/a64_gemm_s8_8x12/x1.cpp",
1437 "src/core/NEON/kernels/arm_gemm/kernels/a64_gemm_u16_8x12/generic.cpp",
1438 "src/core/NEON/kernels/arm_gemm/kernels/a64_gemm_u8_4x4/generic.cpp",
1439 "src/core/NEON/kernels/arm_gemm/kernels/a64_gemm_u8_8x12/a55r1.cpp",
1440 "src/core/NEON/kernels/arm_gemm/kernels/a64_gemm_u8_8x12/generic.cpp",
1441 "src/core/NEON/kernels/arm_gemm/kernels/a64_gemm_u8_8x12/x1.cpp",
1442 "src/core/NEON/kernels/arm_gemm/kernels/a64_hgemm_8x24/a55r1.cpp",
1443 "src/core/NEON/kernels/arm_gemm/kernels/a64_hgemm_8x24/generic.cpp",
1444 "src/core/NEON/kernels/arm_gemm/kernels/a64_hgemm_8x24/x1.cpp",
1445 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_bf16fp32_dot_6x16/generic.cpp",
1446 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_bf16fp32_mmla_6x16/generic.cpp",
1447 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_fp16_mla_6x32/a55.cpp",
1448 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_fp16_mla_6x32/generic.cpp",
1449 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_fp32_mla_4x24/a55.cpp",
1450 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_fp32_mla_4x24/generic.cpp",
1451 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_fp32_mla_6x16/a55.cpp",
1452 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_fp32_mla_6x16/generic.cpp",
1453 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_fp32_mla_8x4/a55.cpp",
1454 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_fp32_mla_8x4/generic.cpp",
1455 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_fp32bf16fp32_mmla_4x24/generic.cpp",
1456 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_fp32bf16fp32_mmla_6x16/generic.cpp",
1457 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_s8qa_dot_4x16/a55.cpp",
1458 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_s8qa_dot_4x16/generic.cpp",
1459 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_s8qa_mmla_4x16/generic.cpp",
1460 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_s8qs_dot_6x16/a55.cpp",
1461 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_s8qs_dot_6x16/generic.cpp",
1462 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_s8qs_mmla_6x16/generic.cpp",
1463 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_s8s32_dot_6x16/a55.cpp",
1464 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_s8s32_dot_6x16/generic.cpp",
1465 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_s8s32_mmla_6x16/generic.cpp",
1466 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_u8qa_dot_4x16/a55.cpp",
1467 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_u8qa_dot_4x16/generic.cpp",
1468 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_u8qa_mmla_4x16/generic.cpp",
1469 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_u8u32_dot_6x16/a55.cpp",
1470 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_u8u32_dot_6x16/generic.cpp",
1471 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_u8u32_mmla_6x16/generic.cpp",
1472 "src/core/NEON/kernels/arm_gemm/kernels/a64_interleaved_bf16fp32_dot_8x12/generic.cpp",
1473 "src/core/NEON/kernels/arm_gemm/kernels/a64_interleaved_bf16fp32_dot_8x12/x1.cpp",
1474 "src/core/NEON/kernels/arm_gemm/kernels/a64_interleaved_bf16fp32_mmla_8x12/generic.cpp",
1475 "src/core/NEON/kernels/arm_gemm/kernels/a64_interleaved_bf16fp32_mmla_8x12/a510.cpp",
1476 "src/core/NEON/kernels/arm_gemm/kernels/a64_interleaved_s8s32_mmla_8x12/generic.cpp",
1477 "src/core/NEON/kernels/arm_gemm/kernels/a64_interleaved_s8s32_mmla_8x12/a510.cpp",
1478 "src/core/NEON/kernels/arm_gemm/kernels/a64_interleaved_u8u32_mmla_8x12/generic.cpp",
1479 "src/core/NEON/kernels/arm_gemm/kernels/a64_interleaved_u8u32_mmla_8x12/a510.cpp",
1480 "src/core/NEON/kernels/arm_gemm/kernels/a64_sgemm_8x12/a53.cpp",
1481 "src/core/NEON/kernels/arm_gemm/kernels/a64_sgemm_8x12/a55.cpp",
1482 "src/core/NEON/kernels/arm_gemm/kernels/a64_sgemm_8x12/a55r1.cpp",
1483 "src/core/NEON/kernels/arm_gemm/kernels/a64_sgemm_8x12/generic.cpp",
1484 "src/core/NEON/kernels/arm_gemm/kernels/a64_sgemm_8x12/x1.cpp",
1485 "src/core/NEON/kernels/arm_gemm/kernels/a64_sgemm_8x6/generic.cpp",
1486 "src/core/NEON/kernels/arm_gemm/kernels/a64_smallK_hybrid_fp32_mla_6x4/generic.cpp",
1487 "src/core/NEON/kernels/arm_gemm/kernels/a64_smallK_hybrid_fp32_mla_8x4/generic.cpp",
1488 "src/core/NEON/kernels/arm_gemm/kernels/a64_smallK_hybrid_s8s32_dot_6x4/a55.cpp",
1489 "src/core/NEON/kernels/arm_gemm/kernels/a64_smallK_hybrid_s8s32_dot_6x4/generic.cpp",
1490 "src/core/NEON/kernels/arm_gemm/kernels/a64_smallK_hybrid_s8s32_dot_8x4/a55.cpp",
1491 "src/core/NEON/kernels/arm_gemm/kernels/a64_smallK_hybrid_s8s32_dot_8x4/generic.cpp",
1492 "src/core/NEON/kernels/arm_gemm/kernels/a64_smallK_hybrid_u8u32_dot_6x4/a55.cpp",
1493 "src/core/NEON/kernels/arm_gemm/kernels/a64_smallK_hybrid_u8u32_dot_6x4/generic.cpp",
1494 "src/core/NEON/kernels/arm_gemm/kernels/a64_smallK_hybrid_u8u32_dot_8x4/a55.cpp",
Dana Zlotnik256ac622022-02-02 15:06:11 +02001495 "src/core/NEON/kernels/arm_gemm/kernels/a64_smallK_hybrid_u8u32_dot_8x4/generic.cpp",
1496 "src/cpu/kernels/gemm_matrix_mul/generic/neon/impl.cpp",
1497 "src/cpu/kernels/gemm_matrix_add/generic/neon/impl.cpp"
Motti Gondabi9d9ad332022-01-23 12:42:24 +02001498 ],
Dana Zlotnik256ac622022-02-02 15:06:11 +02001499 "fp32":["src/cpu/kernels/gemm_matrix_mul/generic/neon/fp32.cpp",
1500 "src/cpu/kernels/gemm_matrix_add/generic/neon/fp32.cpp"],
1501 "fp16":["src/cpu/kernels/gemm_matrix_mul/generic/neon/fp16.cpp",
1502 "src/cpu/kernels/gemm_matrix_add/generic/neon/fp16.cpp"],
Michalis Spyrou20fca522021-06-07 14:23:57 +01001503 "estate32": [
1504 "src/core/NEON/kernels/arm_gemm/kernels/a32_sgemm_8x6/a53.cpp",
1505 "src/core/NEON/kernels/arm_gemm/kernels/a32_sgemm_8x6/a55r1.cpp",
1506 "src/core/NEON/kernels/arm_gemm/kernels/a32_sgemm_8x6/generic.cpp"
1507 ],
1508 "estate64": [
Freddie Liardet487d3902021-09-21 12:36:43 +01001509 "src/core/NEON/kernels/arm_gemm/kernels/a64_sgemv_pretransposed/generic.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001510 ]
1511 },
1512 "sve": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001513 "common": [
Michalis Spyrou20fca522021-06-07 14:23:57 +01001514 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_bf16fp32_dot_6x4VL/generic.cpp",
Georgios Pinitas4ee8b152021-07-16 16:16:43 +01001515 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_bf16fp32_mmla_6x4VL/generic.cpp",
1516 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_fp16_mla_6x4VL/a64fx.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +01001517 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_fp16_mla_6x4VL/generic.cpp",
Georgios Pinitas4ee8b152021-07-16 16:16:43 +01001518 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_fp32_mla_6x4VL/a64fx.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +01001519 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_fp32_mla_6x4VL/generic.cpp",
Georgios Pinitas4ee8b152021-07-16 16:16:43 +01001520 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_fp32_mla_8x1VL/a64fx.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +01001521 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_fp32_mla_8x1VL/generic.cpp",
Georgios Pinitas4ee8b152021-07-16 16:16:43 +01001522 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_fp32bf16fp32_mmla_4x6VL/generic.cpp",
1523 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_fp32bf16fp32_mmla_6x4VL/generic.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +01001524 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_s8qa_dot_4x4VL/generic.cpp",
Georgios Pinitas4ee8b152021-07-16 16:16:43 +01001525 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_s8qa_mmla_4x4VL/generic.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +01001526 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_s8qs_dot_6x4VL/generic.cpp",
Georgios Pinitas4ee8b152021-07-16 16:16:43 +01001527 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_s8qs_mmla_6x4VL/generic.cpp",
1528 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_s8s32_dot_6x4VL/a64fx.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +01001529 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_s8s32_dot_6x4VL/generic.cpp",
Georgios Pinitas4ee8b152021-07-16 16:16:43 +01001530 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_s8s32_mmla_6x4VL/generic.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +01001531 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_u8qa_dot_4x4VL/generic.cpp",
Georgios Pinitas4ee8b152021-07-16 16:16:43 +01001532 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_u8qa_mmla_4x4VL/generic.cpp",
1533 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_u8u32_dot_6x4VL/a64fx.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +01001534 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_u8u32_dot_6x4VL/generic.cpp",
Georgios Pinitas4ee8b152021-07-16 16:16:43 +01001535 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_u8u32_mmla_6x4VL/generic.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +01001536 "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_bf16fp32_dot_8x3VL/generic.cpp",
1537 "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_bf16fp32_mmla_8x3VL/generic.cpp",
Georgios Pinitas4ee8b152021-07-16 16:16:43 +01001538 "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_fp16_mla_8x3VL/a64fx.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +01001539 "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_fp16_mla_8x3VL/generic.cpp",
Georgios Pinitas4ee8b152021-07-16 16:16:43 +01001540 "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_fp32_mla_8x3VL/a64fx.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +01001541 "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_fp32_mla_8x3VL/generic.cpp",
1542 "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_fp32_mmla_8x3VL/generic.cpp",
Georgios Pinitas4ee8b152021-07-16 16:16:43 +01001543 "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_s8s32_dot_8x3VL/a64fx.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +01001544 "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_s8s32_dot_8x3VL/generic.cpp",
1545 "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_s8s32_mmla_8x3VL/generic.cpp",
Georgios Pinitas4ee8b152021-07-16 16:16:43 +01001546 "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_u8u32_dot_8x3VL/a64fx.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +01001547 "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_u8u32_dot_8x3VL/generic.cpp",
1548 "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_u8u32_mmla_8x3VL/generic.cpp",
1549 "src/core/NEON/kernels/arm_gemm/kernels/sve_smallK_hybrid_fp32_mla_8x1VL/generic.cpp",
1550 "src/core/NEON/kernels/arm_gemm/kernels/sve_smallK_hybrid_s8s32_dot_8x1VL/generic.cpp",
Georgios Pinitas4ee8b152021-07-16 16:16:43 +01001551 "src/core/NEON/kernels/arm_gemm/kernels/sve_smallK_hybrid_u8u32_dot_8x1VL/generic.cpp",
1552 "src/core/NEON/kernels/arm_gemm/mergeresults-sve.cpp",
Freddie Liardet487d3902021-09-21 12:36:43 +01001553 "src/core/NEON/kernels/arm_gemm/transform-sve.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001554 ]
1555 }
1556 }
1557 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001558 "GenerateProposals": {
1559 "deps": [ "BoundingBoxTransform", "Dequantize", "Pad", "Permute", "Quantize", "Reshape" ],
Michalis Spyrou20fca522021-06-07 14:23:57 +01001560 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001561 "common": [
1562 "src/core/NEON/kernels/NEGenerateProposalsLayerKernel.cpp",
1563 "src/runtime/NEON/functions/NEGenerateProposalsLayer.cpp"
Dana Zlotnik50ce2772021-12-29 13:55:56 +02001564 ],
1565 "neon":{
1566 "common":["src/cpu/kernels/genproposals/generic/neon/impl.cpp"],
1567 "fp16":["src/cpu/kernels/genproposals/generic/neon/fp16.cpp"],
1568 "fp32":["src/cpu/kernels/genproposals/generic/neon/fp32.cpp"],
1569 "qsymm16":["src/cpu/kernels/genproposals/generic/neon/qsymm16.cpp"]
1570 }
Michalis Spyrou20fca522021-06-07 14:23:57 +01001571 }
1572 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001573 "InstanceNormalize": {
1574 "deps": [ "Permute", "Reduction" ],
Michalis Spyrou20fca522021-06-07 14:23:57 +01001575 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001576 "common": [
1577 "src/core/NEON/kernels/NEInstanceNormalizationLayerKernel.cpp",
1578 "src/runtime/NEON/functions/NEInstanceNormalizationLayer.cpp"
Dana Zlotnikd7e2ec52022-01-03 10:59:41 +02001579 ],
1580 "neon":{
1581 "common":["src/cpu/kernels/instancenorm/generic/neon/impl.cpp"],
1582 "fp16":["src/cpu/kernels/instancenorm/generic/neon/fp16.cpp"],
1583 "fp32":["src/cpu/kernels/instancenorm/generic/neon/fp32.cpp"]
1584 }
Michalis Spyrou20fca522021-06-07 14:23:57 +01001585 }
1586 },
1587 "L2Normalize": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001588 "deps": [ "Reduction" ],
Michalis Spyrou20fca522021-06-07 14:23:57 +01001589 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001590 "common": [
1591 "src/core/NEON/kernels/NEL2NormalizeLayerKernel.cpp",
1592 "src/runtime/NEON/functions/NEL2NormalizeLayer.cpp"
Yair Schwarzbaum5e993182022-01-10 15:11:07 +02001593 ],
1594 "neon":{
1595 "common":["src/cpu/kernels/l2normlayer/generic/neon/impl.cpp"],
1596 "fp32":["src/cpu/kernels/l2normlayer/generic/neon/fp32.cpp"],
1597 "fp16":["src/cpu/kernels/l2normlayer/generic/neon/fp16.cpp"]
1598 }
Michalis Spyrou20fca522021-06-07 14:23:57 +01001599 }
1600 },
1601 "Logical": {
1602 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001603 "common": [
1604 "src/core/NEON/kernels/NELogicalKernel.cpp",
1605 "src/runtime/NEON/functions/NELogical.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001606 ]
1607 }
1608 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001609 "LSTM": {
Michalis Spyrou20fca522021-06-07 14:23:57 +01001610 "deps": [
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001611 "Activation",
1612 "Concatenate",
1613 "Copy",
1614 "Dequantize",
1615 "ElementwiseBinary",
1616 "Fill",
1617 "FullyConnected",
1618 "Gemm",
1619 "MeanStdDevNormalize",
1620 "Mul",
1621 "Quantize",
1622 "Slice",
1623 "Transpose"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001624 ],
1625 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001626 "common": [
1627 "src/core/NEON/kernels/NEQLSTMLayerNormalizationKernel.cpp",
1628 "src/runtime/NEON/functions/NELSTMLayer.cpp",
1629 "src/runtime/NEON/functions/NELSTMLayerQuantized.cpp",
1630 "src/runtime/NEON/functions/NEQLSTMLayer.cpp"
1631 ]
1632 }
1633 },
1634 "MaxUnpool2d": {
1635 "deps": [ "Fill" ],
1636 "files": {
1637 "common": [
Dana Zlotnik149203b2022-01-26 12:38:03 +02001638 "src/cpu/kernels/CpuMaxUnpoolingLayerKernel.cpp",
1639 "src/runtime/NEON/functions/NEMaxUnpoolingLayer.cpp",
1640 "src/cpu/operators/CpuMaxUnpooling.cpp"
Dana Zlotnik143310c2021-12-30 13:24:52 +02001641 ],
1642 "neon":{
Dana Zlotnik143310c2021-12-30 13:24:52 +02001643 "fp32":["src/cpu/kernels/maxunpool/generic/neon/fp32.cpp"],
1644 "fp16":["src/cpu/kernels/maxunpool/generic/neon/fp16.cpp"],
1645 "qasymm8":["src/cpu/kernels/maxunpool/generic/neon/qasymm8.cpp"],
Dana Zlotnik149203b2022-01-26 12:38:03 +02001646 "qasymm8_signed":[ "src/cpu/kernels/maxunpool/generic/neon/qasymm8_signed.cpp"],
1647 "common":["src/cpu/kernels/maxunpool/generic/neon/impl.cpp"]
Dana Zlotnik143310c2021-12-30 13:24:52 +02001648 }
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001649 }
1650 },
1651 "Mean": {
1652 "deps" : [ "Reduction" ],
1653 "files": {
1654 "common": [ "src/runtime/NEON/functions/NEReduceMean.cpp" ]
1655 }
1656 },
1657 "MeanStdDevNormalize": {
1658 "files": {
1659 "common": [
1660 "src/core/NEON/kernels/NEMeanStdDevNormalizationKernel.cpp",
1661 "src/runtime/NEON/functions/NEMeanStdDevNormalizationLayer.cpp"
Dana Zlotnik027bcef2021-12-27 17:35:00 +02001662 ],
1663 "neon":{
1664 "common":["src/cpu/kernels/meanstddevnorm/generic/neon/impl.cpp"],
1665 "fp32":["src/cpu/kernels/meanstddevnorm/generic/neon/fp32.cpp"],
1666 "fp16":["src/cpu/kernels/meanstddevnorm/generic/neon/fp16.cpp"]
1667 }
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001668 }
1669 },
1670 "Mul": {
1671 "files": {
1672 "common": [
1673 "src/cpu/operators/CpuMul.cpp",
1674 "src/cpu/kernels/CpuMulKernel.cpp",
1675 "src/runtime/NEON/functions/NEPixelWiseMultiplication.cpp"
1676 ]
1677 }
1678 },
1679 "Normalize": {
1680 "deps": [ "Mul" ],
1681 "files": {
1682 "common": [
1683 "src/core/NEON/kernels/NENormalizationLayerKernel.cpp",
1684 "src/runtime/NEON/functions/NENormalizationLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001685 ]
1686 }
1687 },
1688 "Pad": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001689 "deps": [ "Concatenate", "Copy", "StridedSlice" ],
Michalis Spyrou20fca522021-06-07 14:23:57 +01001690 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001691 "common": [
1692 "src/core/NEON/kernels/NEPadLayerKernel.cpp",
1693 "src/runtime/NEON/functions/NEPadLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001694 ]
1695 }
1696 },
1697 "Permute": {
1698 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001699 "common": [
1700 "src/cpu/operators/CpuPermute.cpp",
1701 "src/cpu/kernels/CpuPermuteKernel.cpp",
1702 "src/runtime/NEON/functions/NEPermute.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001703 ]
1704 }
1705 },
1706 "Pool2d": {
1707 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001708 "common": [
1709 "src/cpu/operators/CpuPool2d.cpp",
Georgios Pinitas7891a732021-08-20 21:39:25 +01001710 "src/cpu/kernels/CpuPool2dKernel.cpp",
1711 "src/cpu/kernels/internal/CpuPool2dAssemblyWrapperKernel.cpp",
Motti Gondabi9d9ad332022-01-23 12:42:24 +02001712 "src/runtime/NEON/functions/NEPoolingLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001713 ],
1714 "neon": {
Motti Gondabi9d9ad332022-01-23 12:42:24 +02001715 "common": [
1716 "src/core/NEON/kernels/arm_conv/pooling/kernels/cpp_nhwc_1x1_stride_any_depthfirst/generic.cpp",
1717 "src/core/NEON/kernels/arm_conv/pooling/pooling_fp16.cpp",
1718 "src/core/NEON/kernels/arm_conv/pooling/pooling_fp32.cpp",
1719 "src/core/NEON/kernels/arm_conv/pooling/pooling_s8.cpp",
1720 "src/core/NEON/kernels/arm_conv/pooling/pooling_s8q.cpp",
1721 "src/core/NEON/kernels/arm_conv/pooling/pooling_u8.cpp",
1722 "src/core/NEON/kernels/arm_conv/pooling/pooling_u8q.cpp",
1723 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_fp16_nhwc_avg_3x3_s1_output2x2_depthfirst/generic.cpp",
1724 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_fp16_nhwc_avg_generic_depthfirst/generic.cpp",
1725 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_fp16_nhwc_max_2x2_s1_output2x2_depthfirst/generic.cpp",
1726 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_fp16_nhwc_max_generic_depthfirst/generic.cpp",
1727 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_fp32_nhwc_avg_3x3_s1_output2x2_depthfirst/generic.cpp",
1728 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_fp32_nhwc_avg_generic_depthfirst/generic.cpp",
1729 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_fp32_nhwc_max_2x2_s1_output2x2_depthfirst/generic.cpp",
1730 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_fp32_nhwc_max_generic_depthfirst/generic.cpp",
1731 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_s8_nhwc_avg_generic_depthfirst/generic.cpp",
1732 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_s8_nhwc_max_2x2_s1_output2x2_depthfirst/generic.cpp",
1733 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_s8_nhwc_max_generic_depthfirst/generic.cpp",
1734 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_s8q_nhwc_avg_generic_depthfirst/generic.cpp",
1735 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_s8q_nhwc_max_generic_depthfirst/generic.cpp",
1736 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_u8_nhwc_avg_generic_depthfirst/generic.cpp",
1737 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_u8_nhwc_max_2x2_s1_output2x2_depthfirst/generic.cpp",
1738 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_u8_nhwc_max_generic_depthfirst/generic.cpp",
1739 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_u8q_nhwc_avg_generic_depthfirst/generic.cpp",
1740 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_u8q_nhwc_max_generic_depthfirst/generic.cpp"
1741 ],
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001742 "nchw": [ "src/cpu/kernels/pool2d/neon/nchw/all.cpp" ],
1743 "fp16": [ "src/cpu/kernels/pool2d/neon/fp16.cpp" ],
Dana Zlotnika538ae52022-02-21 13:12:41 +02001744 "fp32": [ "src/cpu/kernels/pool2d/neon/fp32.cpp" ],
1745 "qasymm8":[ "src/cpu/kernels/pool2d/neon/qasymm8.cpp" ],
1746 "qasymm8_signed":["src/cpu/kernels/pool2d/neon/qasymm8_signed.cpp"]
Michalis Spyrou20fca522021-06-07 14:23:57 +01001747 },
1748 "sve": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001749 "common": [
Michalis Spyrou20fca522021-06-07 14:23:57 +01001750 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_fp16_nhwc_avg_3x3_s1_output2x2_depthfirst/generic.cpp",
1751 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_fp16_nhwc_avg_generic_depthfirst/generic.cpp",
1752 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_fp16_nhwc_max_2x2_s1_output2x2_depthfirst/generic.cpp",
1753 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_fp16_nhwc_max_generic_depthfirst/generic.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001754 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_fp32_nhwc_avg_3x3_s1_output2x2_depthfirst/generic.cpp",
1755 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_fp32_nhwc_avg_generic_depthfirst/generic.cpp",
1756 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_fp32_nhwc_max_2x2_s1_output2x2_depthfirst/generic.cpp",
1757 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_fp32_nhwc_max_generic_depthfirst/generic.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +01001758 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_s8_nhwc_avg_generic_depthfirst/generic.cpp",
1759 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_s8_nhwc_max_2x2_s1_output2x2_depthfirst/generic.cpp",
1760 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_s8_nhwc_max_generic_depthfirst/generic.cpp",
1761 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_s8q_nhwc_avg_generic_depthfirst/generic.cpp",
1762 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_s8q_nhwc_max_generic_depthfirst/generic.cpp",
1763 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_u8_nhwc_avg_generic_depthfirst/generic.cpp",
1764 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_u8_nhwc_max_2x2_s1_output2x2_depthfirst/generic.cpp",
1765 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_u8_nhwc_max_generic_depthfirst/generic.cpp",
1766 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_u8q_nhwc_avg_generic_depthfirst/generic.cpp",
Freddie Liardet487d3902021-09-21 12:36:43 +01001767 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_u8q_nhwc_max_generic_depthfirst/generic.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001768 ]
1769 }
1770 }
1771 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001772 "PRelu": {
1773 "deps": [ "ElementwiseBinary" ],
Michalis Spyrou20fca522021-06-07 14:23:57 +01001774 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001775 "common": [
1776 "src/runtime/NEON/functions/NEPReluLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001777 ]
1778 }
1779 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001780 "PriorBox": {
Michalis Spyrou20fca522021-06-07 14:23:57 +01001781 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001782 "common": [
1783 "src/core/NEON/kernels/NEPriorBoxLayerKernel.cpp",
1784 "src/runtime/NEON/functions/NEPriorBoxLayer.cpp"
1785 ]
1786 }
1787 },
1788 "Quantize": {
1789 "files": {
1790 "common": [
1791 "src/cpu/operators/CpuQuantize.cpp",
1792 "src/cpu/kernels/CpuQuantizeKernel.cpp",
1793 "src/runtime/NEON/functions/NEQuantizationLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001794 ]
1795 }
1796 },
1797 "Range": {
1798 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001799 "common": [
1800 "src/core/NEON/kernels/NERangeKernel.cpp",
1801 "src/runtime/NEON/functions/NERange.cpp"
Yair Schwarzbaum9e8a7702021-11-08 10:58:06 +02001802 ],
1803 "neon": {
1804 "common": [ "src/cpu/kernels/range/generic/neon/impl.cpp" ],
1805 "fp32": [ "src/cpu/kernels/range/generic/neon/fp32.cpp" ],
1806 "fp16": [ "src/cpu/kernels/range/generic/neon/fp16.cpp" ],
1807 "integer": [ "src/cpu/kernels/range/generic/neon/integer.cpp" ]
1808 }
Michalis Spyrou20fca522021-06-07 14:23:57 +01001809 }
1810 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001811 "Reduction":{
1812 "deps": [ "Reshape" ],
Michalis Spyrou20fca522021-06-07 14:23:57 +01001813 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001814 "common": [
1815 "src/core/NEON/kernels/NEReductionOperationKernel.cpp",
1816 "src/runtime/NEON/functions/NEReductionOperation.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001817 ]
1818 }
1819 },
Michalis Spyrou20fca522021-06-07 14:23:57 +01001820 "Reorg": {
1821 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001822 "common": [
1823 "src/core/NEON/kernels/NEReorgLayerKernel.cpp",
1824 "src/runtime/NEON/functions/NEReorgLayer.cpp"
1825 ]
1826 }
1827 },
1828 "Reshape": {
1829 "files": {
1830 "common": [
1831 "src/cpu/operators/CpuReshape.cpp",
1832 "src/cpu/kernels/CpuReshapeKernel.cpp",
1833 "src/runtime/NEON/functions/NEReshapeLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001834 ]
1835 }
1836 },
1837 "Reverse": {
1838 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001839 "common": [
1840 "src/core/NEON/kernels/NEReverseKernel.cpp",
1841 "src/runtime/NEON/functions/NEReverse.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001842 ]
1843 }
1844 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001845 "RNN": {
1846 "deps": [ "Activation", "Add", "FullyConnected", "Gemm"],
1847 "files": {
1848 "common": [ "src/runtime/NEON/functions/NERNNLayer.cpp" ]
1849 }
1850 },
Michalis Spyrou20fca522021-06-07 14:23:57 +01001851 "ROIAlign": {
1852 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001853 "common": [
1854 "src/core/NEON/kernels/NEROIAlignLayerKernel.cpp",
1855 "src/runtime/NEON/functions/NEROIAlignLayer.cpp"
Dana Zlotnik9ae5a4e2022-01-03 16:22:47 +02001856 ],
1857 "neon":{
1858 "common":["src/cpu/kernels/roialign/generic/neon/impl.cpp"],
1859 "fp32":["src/cpu/kernels/roialign/generic/neon/fp32.cpp"],
1860 "fp16":["src/cpu/kernels/roialign/generic/neon/fp16.cpp"],
1861 "qasymm8":["src/cpu/kernels/roialign/generic/neon/qasymm8.cpp"],
1862 "qasymm8_signed":["src/cpu/kernels/roialign/generic/neon/qasymm8_signed.cpp"]
1863 }
Michalis Spyrou20fca522021-06-07 14:23:57 +01001864 }
1865 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001866 "ROIPool2d": {
Michalis Spyrou20fca522021-06-07 14:23:57 +01001867 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001868 "common": [
1869 "src/core/NEON/kernels/NEROIPoolingLayerKernel.cpp",
1870 "src/runtime/NEON/functions/NEROIPoolingLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001871 ]
1872 }
1873 },
1874 "Scale": {
1875 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001876 "common": [
1877 "src/cpu/operators/CpuScale.cpp",
1878 "src/cpu/kernels/CpuScaleKernel.cpp",
1879 "src/runtime/NEON/functions/NEScale.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001880 ],
1881 "sve": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001882 "fp16": [ "src/cpu/kernels/scale/sve/fp16.cpp" ],
1883 "fp32": [ "src/cpu/kernels/scale/sve/fp32.cpp" ],
1884 "integer": [ "src/cpu/kernels/scale/sve/integer.cpp" ],
1885 "qasymm8": [ "src/cpu/kernels/scale/sve/qasymm8.cpp" ],
1886 "qasymm8_signed": [ "src/cpu/kernels/scale/sve/qasymm8_signed.cpp" ]
Michalis Spyrou20fca522021-06-07 14:23:57 +01001887 },
1888 "neon": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001889 "fp16": [ "src/cpu/kernels/scale/neon/fp16.cpp" ],
1890 "integer": [ "src/cpu/kernels/scale/neon/integer.cpp" ],
1891 "qasymm8": [ "src/cpu/kernels/scale/neon/qasymm8.cpp" ],
1892 "qasymm8_signed": [ "src/cpu/kernels/scale/neon/qasymm8_signed.cpp" ]
Michalis Spyrou20fca522021-06-07 14:23:57 +01001893 }
1894 }
1895 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001896 "Select": {
1897 "files": {
1898 "common": [
1899 "src/core/NEON/kernels/NESelectKernel.cpp",
1900 "src/runtime/NEON/functions/NESelect.cpp"
Anton Vainer8a9a0fb2022-01-09 14:37:12 +02001901 ],
1902 "neon": {
1903 "common": [ "src/cpu/kernels/select/generic/neon/impl.cpp" ],
1904 "fp32": [ "src/cpu/kernels/select/generic/neon/fp32.cpp" ],
1905 "fp16": [ "src/cpu/kernels/select/generic/neon/fp16.cpp" ],
1906 "integer": [ "src/cpu/kernels/select/generic/neon/integer.cpp" ]
1907 }
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001908 }
1909 },
1910 "Slice": {
1911 "deps": [ "StridedSlice" ],
1912 "files": {
1913 "common": [ "src/runtime/NEON/functions/NESlice.cpp" ]
1914 }
1915 },
Michalis Spyrou20fca522021-06-07 14:23:57 +01001916 "Softmax": {
1917 "deps": [
1918 "Permute"
1919 ],
1920 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001921 "common": [
1922 "src/cpu/operators/CpuSoftmax.cpp",
1923 "src/cpu/kernels/CpuSoftmaxKernel.cpp",
1924 "src/runtime/NEON/functions/NESoftmaxLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001925 ],
Dana Zlotnikc48a3e52021-12-21 13:34:42 +02001926 "neon":{
Dana Zlotnika538ae52022-02-21 13:12:41 +02001927 "common":["src/cpu/kernels/softmax/generic/neon/impl.cpp"],
Dana Zlotnikc48a3e52021-12-21 13:34:42 +02001928 "fp32": ["src/cpu/kernels/softmax/generic/neon/fp32.cpp"],
Dana Zlotnik6a2df882022-01-17 09:54:26 +02001929 "fp16": ["src/cpu/kernels/softmax/generic/neon/fp16.cpp"],
1930 "qasymm8":[ "src/cpu/kernels/softmax/generic/neon/qasymm8.cpp"],
1931 "qasymm8_signed":["src/cpu/kernels/softmax/generic/neon/qasymm8_signed.cpp"]
Dana Zlotnikc48a3e52021-12-21 13:34:42 +02001932 },
Michalis Spyrou20fca522021-06-07 14:23:57 +01001933 "sve": {
Dana Zlotnikc48a3e52021-12-21 13:34:42 +02001934 "common": [ "src/cpu/kernels/softmax/generic/sve/impl.cpp" ],
1935 "fp32": ["src/cpu/kernels/softmax/generic/sve/fp32.cpp"],
1936 "fp16": ["src/cpu/kernels/softmax/generic/sve/fp16.cpp"],
Dana Zlotnik6a2df882022-01-17 09:54:26 +02001937 "qasymm8": ["src/cpu/kernels/softmax/generic/sve/qasymm8.cpp" ],
1938 "qasymm8_signed": ["src/cpu/kernels/softmax/generic/sve/qasymm8_signed.cpp"]
1939 },
1940 "sve2":{
Dana Zlotnika538ae52022-02-21 13:12:41 +02001941 "common" :["src/cpu/kernels/softmax/generic/sve2/impl.cpp"],
Dana Zlotnik6a2df882022-01-17 09:54:26 +02001942 "qasymm8":[ "src/cpu/kernels/softmax/generic/sve2/qasymm8.cpp"],
1943 "qasymm8_signed":["src/cpu/kernels/softmax/generic/sve2/qasymm8_signed.cpp"]
Michalis Spyrou20fca522021-06-07 14:23:57 +01001944 }
1945 }
1946 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001947 "SpaceToBatch": {
1948 "files": {
1949 "common": [
1950 "src/core/NEON/kernels/NESpaceToBatchLayerKernel.cpp",
1951 "src/runtime/NEON/functions/NESpaceToBatchLayer.cpp"
1952 ]
1953 }
1954 },
1955 "SpaceToDepth": {
1956 "files": {
1957 "common": [
1958 "src/core/NEON/kernels/NESpaceToDepthLayerKernel.cpp",
1959 "src/runtime/NEON/functions/NESpaceToDepthLayer.cpp"
1960 ]
1961 }
1962 },
1963 "Split": {
1964 "deps": [ "StridedSlice" ],
1965 "files": {
1966 "common": [
1967 "src/runtime/NEON/functions/NESplit.cpp"
1968 ]
1969 }
1970 },
1971 "Stack": {
1972 "files": {
1973 "common": [
1974 "src/core/NEON/kernels/NEStackLayerKernel.cpp",
1975 "src/runtime/NEON/functions/NEStackLayer.cpp"
1976 ]
1977 }
1978 },
1979 "StridedSlice": {
1980 "files": {
1981 "common": [
1982 "src/core/NEON/kernels/NEStridedSliceKernel.cpp",
1983 "src/runtime/NEON/functions/NEStridedSlice.cpp"
1984 ]
1985 }
1986 },
Michalis Spyrou20fca522021-06-07 14:23:57 +01001987 "Sub": {
1988 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001989 "common": [
1990 "src/cpu/operators/CpuSub.cpp",
1991 "src/cpu/kernels/CpuSubKernel.cpp",
Freddie Liardet487d3902021-09-21 12:36:43 +01001992 "src/runtime/NEON/functions/NEArithmeticSubtraction.cpp",
1993 "src/cpu/kernels/sub/neon/qasymm8.cpp",
1994 "src/cpu/kernels/sub/neon/qasymm8_signed.cpp",
1995 "src/cpu/kernels/sub/neon/qsymm16.cpp"
1996 ]
Michalis Spyrou20fca522021-06-07 14:23:57 +01001997 }
1998 },
Michalis Spyrou20fca522021-06-07 14:23:57 +01001999 "Tile": {
2000 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002001 "common": [
2002 "src/core/NEON/kernels/NETileKernel.cpp",
2003 "src/runtime/NEON/functions/NETile.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01002004 ]
2005 }
2006 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002007 "Transpose": {
Michalis Spyrou20fca522021-06-07 14:23:57 +01002008 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002009 "common": [
2010 "src/cpu/kernels/CpuTransposeKernel.cpp",
2011 "src/cpu/operators/CpuTranspose.cpp",
2012 "src/runtime/NEON/functions/NETranspose.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01002013 ]
2014 }
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002015 },
2016 "Unstack": {
2017 "deps": [ "StridedSlice" ],
2018 "files": {
2019 "common": [ "src/runtime/NEON/functions/NEUnstack.cpp" ]
2020 }
Michalis Spyrou20fca522021-06-07 14:23:57 +01002021 }
2022 }
2023 }
Georgios Pinitasbdcdc392021-04-22 16:42:03 +01002024}