blob: 2a88aec37b91d4312de9f7b122cca33b411e5ad6 [file] [log] [blame]
Georgios Pinitasbdcdc392021-04-22 16:42:03 +01001{
Michalis Spyrou20fca522021-06-07 14:23:57 +01002 "common": [
3 "src/common/cpuinfo/CpuInfo.cpp",
4 "src/common/cpuinfo/CpuModel.cpp",
5 "src/common/cpuinfo/CpuIsaInfo.cpp",
6 "src/common/utils/LegacySupport.cpp",
7 "src/common/AllocatorWrapper.cpp",
8 "src/common/ITensorV2.cpp",
Georgios Pinitas41648142021-08-03 08:24:00 +01009 "src/common/TensorPack.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +010010 "src/common/IOperator.cpp",
11 "src/core/AccessWindowAutoPadding.cpp",
12 "src/core/AccessWindowStatic.cpp",
13 "src/core/AccessWindowTranspose.cpp",
14 "src/core/Error.cpp",
15 "src/core/GPUTarget.cpp",
16 "src/core/Helpers.cpp",
17 "src/core/IAccessWindow.cpp",
18 "src/core/IKernel.cpp",
19 "src/core/ITensor.cpp",
20 "src/core/ITensorPack.cpp",
21 "src/core/Rounding.cpp",
22 "src/core/Size2D.cpp",
23 "src/core/SubTensorInfo.cpp",
24 "src/core/TensorInfo.cpp",
25 "src/core/Utils.cpp",
26 "src/core/Validate.cpp",
27 "src/core/Version.cpp",
28 "src/core/helpers/SoftmaxHelpers.cpp",
Anitha Rajb566b6e2023-08-23 11:40:06 +010029 "src/core/helpers/Utils.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +010030 "src/core/helpers/WindowHelpers.cpp",
Matthew Bentham314d3e22023-06-23 10:53:52 +000031 "src/core/utils/ActivationFunctionUtils.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +010032 "src/core/utils/AssemblyUtils.cpp",
Matthew Bentham314d3e22023-06-23 10:53:52 +000033 "src/core/utils/DataTypeUtils.cpp",
34 "src/core/utils/DataLayoutUtils.cpp",
35 "src/core/utils/InterpolationPolicyUtils.cpp",
36 "src/core/utils/FormatUtils.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +010037 "src/core/utils/ScaleUtils.cpp",
Matthew Bentham314d3e22023-06-23 10:53:52 +000038 "src/core/utils/StringUtils.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +010039 "src/core/utils/helpers/fft.cpp",
40 "src/core/utils/helpers/tensor_transform.cpp",
41 "src/core/utils/io/FileHandler.cpp",
42 "src/core/utils/misc/MMappedFile.cpp",
43 "src/core/utils/quantization/AsymmHelpers.cpp",
44 "src/core/CPP/CPPTypes.cpp",
45 "src/core/CPP/kernels/CPPBoxWithNonMaximaSuppressionLimitKernel.cpp",
46 "src/core/CPP/kernels/CPPNonMaximumSuppressionKernel.cpp",
47 "src/core/CPP/kernels/CPPPermuteKernel.cpp",
48 "src/core/CPP/kernels/CPPTopKVKernel.cpp",
49 "src/core/CPP/kernels/CPPUpsampleKernel.cpp",
50 "src/runtime/Allocator.cpp",
51 "src/runtime/BlobLifetimeManager.cpp",
52 "src/runtime/BlobMemoryPool.cpp",
53 "src/runtime/ISimpleLifetimeManager.cpp",
54 "src/runtime/ITensorAllocator.cpp",
55 "src/runtime/IWeightsManager.cpp",
56 "src/runtime/IScheduler.cpp",
57 "src/runtime/Memory.cpp",
58 "src/runtime/MemoryManagerOnDemand.cpp",
59 "src/runtime/OffsetLifetimeManager.cpp",
60 "src/runtime/OffsetMemoryPool.cpp",
61 "src/runtime/OperatorTensor.cpp",
62 "src/runtime/PoolManager.cpp",
63 "src/runtime/RuntimeContext.cpp",
64 "src/runtime/Scheduler.cpp",
65 "src/runtime/SchedulerFactory.cpp",
66 "src/runtime/SchedulerUtils.cpp",
67 "src/runtime/SubTensor.cpp",
68 "src/runtime/Tensor.cpp",
69 "src/runtime/TensorAllocator.cpp",
70 "src/runtime/Utils.cpp",
71 "src/runtime/CPP/ICPPSimpleFunction.cpp",
72 "src/runtime/CPP/functions/CPPBoxWithNonMaximaSuppressionLimit.cpp",
73 "src/runtime/CPP/functions/CPPDetectionOutputLayer.cpp",
74 "src/runtime/CPP/functions/CPPDetectionPostProcessLayer.cpp",
75 "src/runtime/CPP/functions/CPPNonMaximumSuppression.cpp",
76 "src/runtime/CPP/functions/CPPPermute.cpp",
77 "src/runtime/CPP/functions/CPPTopKV.cpp",
78 "src/runtime/CPP/functions/CPPUpsample.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +010079 ],
Georgios Pinitasb6af4822021-09-14 12:33:34 +010080 "logging": [
81 "src/core/utils/logging/FilePrinter.cpp",
82 "src/core/utils/logging/Helpers.cpp",
83 "src/core/utils/logging/Logger.cpp",
84 "src/core/utils/logging/LoggerRegistry.cpp"
85 ],
86 "scheduler": {
87 "single": [ "src/runtime/CPP/SingleThreadScheduler.cpp" ],
88 "threads": [ "src/runtime/CPP/CPPScheduler.cpp" ],
89 "omp": [ "src/runtime/OMP/OMPScheduler.cpp"]
90 },
Michalis Spyrou20fca522021-06-07 14:23:57 +010091 "c_api": {
Georgios Pinitas13ef1762021-07-14 17:14:43 +010092 "common": [
Michalis Spyrou20fca522021-06-07 14:23:57 +010093 "src/c/AclContext.cpp",
Georgios Pinitas06ac6e42021-07-05 08:08:52 +010094 "src/c/AclOperator.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +010095 "src/c/AclQueue.cpp",
96 "src/c/AclTensor.cpp",
97 "src/c/AclTensorPack.cpp",
98 "src/c/AclVersion.cpp"
Georgios Pinitasbdcdc392021-04-22 16:42:03 +010099 ],
Georgios Pinitas13ef1762021-07-14 17:14:43 +0100100 "cpu": [
101 ],
Michalis Spyrou20fca522021-06-07 14:23:57 +0100102 "gpu": [
103 "src/c/cl/AclOpenClExt.cpp"
Georgios Pinitas41648142021-08-03 08:24:00 +0100104 ],
105 "operators":
106 [
107 "src/c/operators/AclActivation.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +0100108 ]
109 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100110 "high_priority": [
111 "Activation",
112 "DepthwiseConv2d",
113 "Conv2d",
114 "Permute",
115 "Pool2d",
SiCong Li83d06742023-05-11 11:54:22 +0100116 "Reshape",
117 "MatMul"
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100118 ],
Michalis Spyrou20fca522021-06-07 14:23:57 +0100119 "gpu": {
Georgios Pinitas13ef1762021-07-14 17:14:43 +0100120 "common": [
121 "src/core/CL/CLCompileContext.cpp",
Giorgio Arenaba2dd822021-07-28 16:10:03 +0100122 "src/core/CL/DefaultLWSHeuristics.cpp",
Georgios Pinitas13ef1762021-07-14 17:14:43 +0100123 "src/core/CL/CLHelpers.cpp",
124 "src/core/CL/CLKernelLibrary.cpp",
125 "src/core/CL/CLUtils.cpp",
126 "src/core/CL/ICLKernel.cpp",
127 "src/core/CL/ICLSimple2DKernel.cpp",
128 "src/core/CL/ICLSimple3DKernel.cpp",
129 "src/core/CL/ICLSimpleKernel.cpp",
130 "src/core/CL/ICLTensor.cpp",
131 "src/core/CL/OpenCL.cpp",
Georgios Pinitas13ef1762021-07-14 17:14:43 +0100132 "src/gpu/cl/ClContext.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100133 "src/gpu/cl/ClKernelLibrary.cpp",
Georgios Pinitas13ef1762021-07-14 17:14:43 +0100134 "src/gpu/cl/ClQueue.cpp",
135 "src/gpu/cl/ClTensor.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100136 "src/core/CL/kernels/CLFillBorderKernel.cpp",
Georgios Pinitas13ef1762021-07-14 17:14:43 +0100137 "src/runtime/CL/CLBufferAllocator.cpp",
138 "src/runtime/CL/CLGEMMHeuristicsHandle.cpp",
139 "src/runtime/CL/CLHelpers.cpp",
140 "src/runtime/CL/CLMemory.cpp",
141 "src/runtime/CL/CLMemoryRegion.cpp",
142 "src/runtime/CL/CLOperator.cpp",
143 "src/runtime/CL/CLRuntimeContext.cpp",
144 "src/runtime/CL/CLScheduler.cpp",
145 "src/runtime/CL/CLSubTensor.cpp",
146 "src/runtime/CL/CLTensor.cpp",
147 "src/runtime/CL/CLTensorAllocator.cpp",
148 "src/runtime/CL/CLTuner.cpp",
149 "src/runtime/CL/ICLSimpleFunction.cpp",
150 "src/runtime/CL/Utils.cpp",
Georgios Pinitas13ef1762021-07-14 17:14:43 +0100151 "src/runtime/CL/mlgo/HeuristicTree.cpp",
152 "src/runtime/CL/mlgo/MLGOHeuristics.cpp",
153 "src/runtime/CL/mlgo/MLGOParser.cpp",
154 "src/runtime/CL/mlgo/Utils.cpp",
155 "src/runtime/CL/tuners/CLTuningParametersList.cpp"
156 ],
Michalis Spyrou20fca522021-06-07 14:23:57 +0100157 "operators": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100158 "Activation":{
159 "files": {
160 "common": [
161 "src/gpu/cl/kernels/ClActivationKernel.cpp",
162 "src/gpu/cl/operators/ClActivation.cpp",
163 "src/runtime/CL/functions/CLActivationLayer.cpp"
164 ]
165 }
166 },
167 "ArgMinMax": {
168 "deps": [ "Reshape" ],
169 "files": {
170 "common": [
171 "src/core/CL/kernels/CLArgMinMaxLayerKernel.cpp",
172 "src/runtime/CL/functions/CLArgMinMaxLayer.cpp"
173 ]
174 }
175 },
176 "Add": {
177 "files": {
178 "common": [
179 "src/gpu/cl/kernels/ClElementwiseKernel.cpp",
180 "src/gpu/cl/operators/ClAdd.cpp"
181 ]
182 }
183 },
184 "BatchNormalization": {
185 "files": {
186 "common": [
187 "src/core/CL/kernels/CLBatchNormalizationLayerKernel.cpp",
188 "src/core/CL/kernels/CLFuseBatchNormalizationKernel.cpp",
189 "src/runtime/CL/functions/CLBatchNormalizationLayer.cpp",
190 "src/runtime/CL/functions/CLFuseBatchNormalization.cpp"
191 ]
192 }
193 },
194 "BatchToSpace": {
195 "files": {
196 "common": [
197 "src/core/CL/kernels/CLBatchToSpaceLayerKernel.cpp",
198 "src/runtime/CL/functions/CLBatchToSpaceLayer.cpp"
199 ]
200 }
201 },
202 "Bitwise": {
203 "files": {
204 "common": [ "src/core/CL/kernels/CLBitwiseKernel.cpp" ]
205 }
206 },
207 "BitwiseAnd": {
208 "deps": [ "Bitwise" ],
209 "files": {
210 "common": [ "src/runtime/CL/functions/CLBitwiseAnd.cpp" ]
211 }
212 },
213 "BitwiseNot": {
214 "deps": [ "Bitwise" ],
215 "files": {
216 "common": [ "src/runtime/CL/functions/CLBitwiseNot.cpp" ]
217 }
218 },
219 "BitwiseOr": {
220 "deps": [ "Bitwise" ],
221 "files": {
222 "common": [ "src/runtime/CL/functions/CLBitwiseOr.cpp" ]
223 }
224 },
225 "BitwiseXor": {
226 "deps": [ "Bitwise" ],
227 "files": {
228 "common": [ "src/runtime/CL/functions/CLBitwiseXor.cpp" ]
229 }
230 },
231 "BoundingBoxTransform": {
232 "files": {
233 "common": [
234 "src/core/CL/kernels/CLBoundingBoxTransformKernel.cpp",
235 "src/runtime/CL/functions/CLBoundingBoxTransform.cpp"
236 ]
237 }
238 },
239 "Cast": {
240 "files": {
241 "common": [
242 "src/gpu/cl/kernels/ClCastKernel.cpp",
243 "src/gpu/cl/operators/ClCast.cpp",
244 "src/runtime/CL/functions/CLCast.cpp"
245 ]
246 }
247 },
248 "ChannelShuffle": {
249 "files": {
250 "common": [
251 "src/core/CL/kernels/CLChannelShuffleLayerKernel.cpp",
252 "src/runtime/CL/functions/CLChannelShuffleLayer.cpp"
253 ]
254 }
255 },
256 "Comparison": {
257 "files": {
258 "common": [
259 "src/core/CL/kernels/CLComparisonKernel.cpp",
260 "src/runtime/CL/functions/CLComparison.cpp"
261 ]
262 }
263 },
264 "Concatenate": {
265 "files": {
266 "common": [
267 "src/gpu/cl/kernels/ClBatchConcatenateKernel.cpp",
268 "src/gpu/cl/kernels/ClDepthConcatenateKernel.cpp",
269 "src/gpu/cl/kernels/ClHeightConcatenateKernel.cpp",
270 "src/gpu/cl/kernels/ClWidthConcatenate2TensorsKernel.cpp",
271 "src/gpu/cl/kernels/ClWidthConcatenate4TensorsKernel.cpp",
272 "src/gpu/cl/kernels/ClWidthConcatenateKernel.cpp",
273 "src/gpu/cl/operators/ClConcatenate.cpp",
274 "src/runtime/CL/functions/CLConcatenateLayer.cpp"
275 ]
276 }
277 },
278 "Conv2d": {
279 "deps": [
280 "Activation",
281 "ElementwiseBinary",
282 "FFT2D",
283 "Gemm",
284 "Mul",
285 "Pad",
286 "Permute",
287 "Reduction",
288 "Reshape",
289 "Reverse",
290 "Slice"
291 ],
292 "files": {
293 "common": [
294 "src/gpu/cl/kernels/ClDirectConv2dKernel.cpp",
295 "src/gpu/cl/kernels/ClWinogradFilterTransformKernel.cpp",
296 "src/gpu/cl/kernels/ClWinogradInputTransformKernel.cpp",
297 "src/gpu/cl/kernels/ClWinogradOutputTransformKernel.cpp",
298 "src/gpu/cl/kernels/ClIm2ColKernel.cpp",
Gian Marco Iodice76335eb2022-11-17 11:03:39 +0000299 "src/gpu/cl/kernels/ClIndirectConv2dKernel.cpp",
Gian Marco Iodice5d016812022-11-17 11:03:39 +0000300 "src/gpu/cl/kernels/ClIndirectConv2dAddressPrecalculationKernel.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100301 "src/gpu/cl/kernels/ClCol2ImKernel.cpp",
302 "src/gpu/cl/operators/ClConv2d.cpp",
303 "src/gpu/cl/operators/ClDirectConv2d.cpp",
304 "src/gpu/cl/operators/ClGemmConv2d.cpp",
Gian Marco Iodice76335eb2022-11-17 11:03:39 +0000305 "src/gpu/cl/operators/ClIndirectConv2d.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100306 "src/gpu/cl/operators/ClWinogradConv2d.cpp",
307 "src/gpu/cl/kernels/ClWeightsReshapeKernel.cpp",
308 "src/runtime/CL/functions/CLConvolutionLayer.cpp",
309 "src/runtime/CL/functions/CLDirectConvolutionLayer.cpp",
310 "src/runtime/CL/functions/CLFFTConvolutionLayer.cpp",
311 "src/runtime/CL/functions/CLGEMMConvolutionLayer.cpp",
Gian Marco Iodice76335eb2022-11-17 11:03:39 +0000312 "src/runtime/CL/functions/CLIndirectConvolutionLayer.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100313 "src/runtime/CL/functions/CLWinogradConvolutionLayer.cpp"
314 ]
315 }
316 },
Giorgio Arena273c28c2021-10-14 15:59:15 +0100317 "Conv3d": {
318 "files": {
319 "common": [
320 "src/gpu/cl/kernels/ClDirectConv3dKernel.cpp",
321 "src/gpu/cl/operators/ClDirectConv3d.cpp",
322 "src/runtime/CL/functions/CLConv3D.cpp"
323 ]
324 }
325 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100326 "Copy": {
327 "files": {
328 "common": [
329 "src/gpu/cl/kernels/ClCopyKernel.cpp",
330 "src/gpu/cl/operators/ClCopy.cpp",
331 "src/runtime/CL/functions/CLCopy.cpp"
332 ]
333 }
334 },
335 "CropResize": {
336 "deps": [ "Copy", "Fill", "Scale" ],
337 "files": {
338 "common": [
339 "src/gpu/cl/kernels/ClCropKernel.cpp",
340 "src/gpu/cl/operators/ClCrop.cpp",
341 "src/runtime/CL/functions/CLCrop.cpp",
342 "src/runtime/CL/functions/CLCropResize.cpp"
343 ]
344 }
345 },
346 "Deconv2d": {
347 "deps": [ "Conv2d", "Reverse", "Transpose"],
348 "files": {
349 "common": [
350 "src/core/CL/kernels/CLDeconvolutionLayerUpsampleKernel.cpp",
351 "src/core/CL/kernels/CLDeconvolutionReshapeOutputKernel.cpp",
Gunes Bayirec0113d2022-11-09 09:26:27 +0000352 "src/gpu/cl/kernels/ClTransposedConvolutionKernel.cpp",
353 "src/gpu/cl/operators/ClTransposedConvolution.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100354 "src/runtime/CL/functions/CLDeconvolutionLayer.cpp",
355 "src/runtime/CL/functions/CLDeconvolutionLayerUpsample.cpp",
356 "src/runtime/CL/functions/CLDirectDeconvolutionLayer.cpp",
357 "src/runtime/CL/functions/CLGEMMDeconvolutionLayer.cpp"
358 ]
359 }
360 },
361 "DepthConvert": {
362 "deps": [ "Cast"],
363 "files": {
364 "common": [ "src/runtime/CL/functions/CLDepthConvertLayer.cpp" ]
365 }
366 },
367 "DepthToSpace": {
368 "files": {
369 "common": [
370 "src/core/CL/kernels/CLDepthToSpaceLayerKernel.cpp",
371 "src/runtime/CL/functions/CLDepthToSpaceLayer.cpp"
372 ]
373 }
374 },
375 "DepthwiseConv2d": {
376 "deps": [ "Permute" ],
377 "files": {
378 "common": [
379 "src/core/CL/kernels/CLDepthwiseConvolutionLayerNativeKernel.cpp",
380 "src/runtime/CL/functions/CLDepthwiseConvolutionLayer.cpp"
381 ]
382 }
383 },
384 "Dequantize": {
385 "files": {
386 "common": [
387 "src/gpu/cl/kernels/ClDequantizeKernel.cpp",
388 "src/gpu/cl/operators/ClDequantize.cpp",
389 "src/runtime/CL/functions/CLDequantizationLayer.cpp"
390 ]
391 }
392 },
393 "ElementwiseBinary": {
394 "deps": ["Add", "Sub"],
395 "files": {
396 "common": [
397 "src/gpu/cl/kernels/ClElementwiseKernel.cpp",
398 "src/gpu/cl/operators/ClElementwiseOperations.cpp",
399 "src/runtime/CL/functions/CLElementwiseOperations.cpp"
400 ]
401 }
402 },
403 "ElementwiseUnary":{
404 "files": {
405 "common": [
406 "src/gpu/cl/kernels/ClElementwiseUnaryKernel.cpp",
407 "src/gpu/cl/operators/ClElementwiseUnary.cpp",
408 "src/runtime/CL/functions/CLElementwiseUnaryLayer.cpp"
409 ]
410 }
411 },
412 "FFT1D": {
413 "files": {
414 "common": [
415 "src/core/CL/kernels/CLFFTDigitReverseKernel.cpp",
416 "src/core/CL/kernels/CLFFTRadixStageKernel.cpp",
417 "src/core/CL/kernels/CLFFTScaleKernel.cpp",
418 "src/runtime/CL/functions/CLFFT1D.cpp"
419 ]
420 }
421 },
422 "FFT2D": {
423 "deps": [ "FFT1D" ],
424 "files": {
425 "common": [ "src/runtime/CL/functions/CLFFT2D.cpp" ]
426 }
427 },
428 "Fill": {
429 "files": {
430 "common": [
431 "src/gpu/cl/kernels/ClFillKernel.cpp",
432 "src/gpu/cl/operators/ClFill.cpp",
433 "src/runtime/CL/functions/CLFill.cpp"
434 ]
435 }
436 },
437 "Flatten": {
438 "files": {
439 "common": [
440 "src/gpu/cl/operators/ClFlatten.cpp",
441 "src/runtime/CL/functions/CLFlattenLayer.cpp"
442 ]
443 }
444 },
445 "Floor": {
446 "files": {
447 "common": [
448 "src/gpu/cl/kernels/ClFloorKernel.cpp",
449 "src/gpu/cl/operators/ClFloor.cpp",
450 "src/runtime/CL/functions/CLFloor.cpp"
451 ]
452 }
453 },
454 "FullyConnected": {
455 "deps": [ "Flatten", "Gemm", "Transpose"],
456 "files": {
457 "common": [
458 "src/gpu/cl/kernels/ClConvertFullyConnectedWeightsKernel.cpp",
459 "src/gpu/cl/operators/ClConvertFullyConnectedWeights.cpp",
460 "src/gpu/cl/operators/ClFullyConnected.cpp",
461 "src/runtime/CL/functions/CLConvertFullyConnectedWeights.cpp",
462 "src/runtime/CL/functions/CLFullyConnectedLayer.cpp"
463 ]
464 }
465 },
466 "Gather": {
467 "files": {
468 "common": [
469 "src/core/CL/kernels/CLGatherKernel.cpp",
470 "src/runtime/CL/functions/CLGather.cpp"]
471 }
472 },
473 "Gemm": {
474 "deps": [ "Cast" ],
475 "files": {
476 "common": [
477 "src/gpu/cl/kernels/gemm/ClGemmHelpers.cpp",
478 "src/gpu/cl/kernels/gemm/native/ClGemmDefaultConfigNativeBifrost.cpp",
479 "src/gpu/cl/kernels/gemm/native/ClGemmDefaultConfigNativeMidgard.cpp",
480 "src/gpu/cl/kernels/gemm/native/ClGemmDefaultConfigNativeValhall.cpp",
481 "src/gpu/cl/kernels/gemm/reshaped/ClGemmDefaultConfigReshapedBifrost.cpp",
482 "src/gpu/cl/kernels/gemm/reshaped/ClGemmDefaultConfigReshapedValhall.cpp",
483 "src/gpu/cl/kernels/gemm/reshaped_only_rhs/ClGemmDefaultConfigReshapedRhsOnlyBifrost.cpp",
484 "src/gpu/cl/kernels/gemm/reshaped_only_rhs/ClGemmDefaultConfigReshapedRhsOnlyValhall.cpp",
485 "src/gpu/cl/kernels/ClGemmLowpMatrixMultiplyNativeKernel.cpp",
486 "src/gpu/cl/kernels/ClGemmLowpMatrixMultiplyReshapedKernel.cpp",
487 "src/gpu/cl/kernels/ClGemmLowpMatrixMultiplyReshapedOnlyRhsKernel.cpp",
Freddie Liardete572dff2022-05-16 14:09:10 +0100488 "src/gpu/cl/kernels/ClGemmLowpMatrixMultiplyReshapedOnlyRhsMMULKernel.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100489 "src/gpu/cl/kernels/ClGemmLowpOffsetContributionKernel.cpp",
490 "src/gpu/cl/kernels/ClGemmLowpOffsetContributionOutputStageKernel.cpp",
491 "src/gpu/cl/kernels/ClGemmLowpQuantizeDownInt32ScaleByFixedPointKernel.cpp",
492 "src/gpu/cl/kernels/ClGemmLowpQuantizeDownInt32ScaleByFloatKernel.cpp",
493 "src/gpu/cl/kernels/ClGemmLowpQuantizeDownInt32ScaleKernel.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100494 "src/gpu/cl/kernels/ClGemmMatrixMultiplyNativeKernel.cpp",
Gunes Bayir4bfc70e2021-12-10 16:17:56 +0000495 "src/gpu/cl/kernels/ClGemmMatrixMultiplyReshapedOnlyRhsMMULKernel.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100496 "src/gpu/cl/kernels/ClGemmMatrixMultiplyReshapedKernel.cpp",
497 "src/gpu/cl/kernels/ClGemmMatrixMultiplyReshapedOnlyRhsKernel.cpp",
498 "src/gpu/cl/kernels/ClGemmReshapeLhsMatrixKernel.cpp",
499 "src/gpu/cl/kernels/ClGemmReshapeRhsMatrixKernel.cpp",
500 "src/gpu/cl/kernels/ClGemmLowpReductionKernel.cpp",
501 "src/gpu/cl/operators/ClGemm.cpp",
502 "src/gpu/cl/operators/ClGemmLowpMatrixMultiplyCore.cpp",
503 "src/gpu/cl/operators/ClGemmLowpOutputStage.cpp",
504 "src/runtime/CL/gemm/CLGEMMDefaultTypeBifrost.cpp",
505 "src/runtime/CL/gemm/CLGEMMDefaultTypeMidgard.cpp",
506 "src/runtime/CL/gemm/CLGEMMDefaultTypeValhall.cpp",
507 "src/runtime/CL/gemm_auto_heuristics/CLGEMMAutoHeuristics.cpp",
508 "src/runtime/CL/functions/CLGEMM.cpp",
509 "src/runtime/CL/functions/CLGEMMLowpMatrixMultiplyCore.cpp",
Ramy Elgammaldf6a3b02022-11-30 16:23:10 +0000510 "src/runtime/CL/functions/CLGEMMLowpOutputStage.cpp",
511 "src/runtime/heuristics/direct_conv/ClDirectConvDefaultConfigBifrost.cpp",
Gian Marco Iodicea5cb79f2022-12-28 13:53:51 +0000512 "src/runtime/heuristics/direct_conv/ClDirectConvDefaultConfigValhall.cpp",
Gian Marco Iodice9d3bd412022-12-30 09:45:00 +0000513 "src/runtime/heuristics/dwc_native/ClDWCNativeDefaultConfigBifrost.cpp",
514 "src/runtime/heuristics/dwc_native/ClDWCNativeDefaultConfigValhall.cpp",
515 "src/runtime/heuristics/dwc_native/ClDWCNativeHeuristicsHelpers.cpp",
Ramy Elgammal34a95d12023-05-11 18:23:44 +0100516 "src/runtime/heuristics/indirect_conv/ClIndirectConvDefaultConfigValhall.cpp"
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100517 ]
518 }
519 },
Ramy Elgammal2b6ebfe2023-03-09 21:15:37 +0000520 "MatMul": {
521 "files": {
522 "common": [
Gunes Bayir9d0c4de2023-04-13 18:22:58 +0100523 "src/gpu/cl/kernels/ClMatMulLowpNativeKernel.cpp",
Gunes Bayire87fa662023-09-07 12:20:33 +0100524 "src/gpu/cl/kernels/ClMatMulLowpNativeMMULKernel.cpp",
Jakub Sujak1ed6a142023-04-13 21:14:42 +0100525 "src/gpu/cl/kernels/ClMatMulNativeKernel.cpp",
SiCong Lia8d80582023-05-19 14:23:37 +0100526 "src/gpu/cl/kernels/ClMatMulNativeMMULKernel.cpp",
Gunes Bayire87fa662023-09-07 12:20:33 +0100527 "src/gpu/cl/kernels/helpers/MatMulKernelHelpers.cpp",
Ramy Elgammalf26ea2f2023-03-24 11:42:03 +0000528 "src/gpu/cl/operators/ClMatMul.cpp",
Ramy Elgammal34a95d12023-05-11 18:23:44 +0100529 "src/runtime/CL/functions/CLMatMul.cpp",
530 "src/runtime/heuristics/matmul_native/ClMatMulNativeDefaultConfigValhall.cpp",
531 "src/runtime/heuristics/matmul_native/ClMatMulNativeHelpers.cpp"
Ramy Elgammal2b6ebfe2023-03-09 21:15:37 +0000532 ]
533 }
534 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100535 "GenerateProposals": {
536 "deps": [ "BoundingBoxTransform", "Dequantize", "Pad", "Permute", "Quantize", "Reshape" ],
537 "files": {
538 "common": [
539 "src/core/CL/kernels/CLGenerateProposalsLayerKernel.cpp",
540 "src/runtime/CL/functions/CLGenerateProposalsLayer.cpp"
541 ]
542 }
543 },
544 "InstanceNormalize": {
545 "files": {
546 "common": [
547 "src/core/CL/kernels/CLInstanceNormalizationLayerKernel.cpp",
548 "src/runtime/CL/functions/CLInstanceNormalizationLayer.cpp"
549 ]
550 }
551 },
552 "L2Normalize": {
553 "deps": [ "Reduction" ],
554 "files": {
555 "common": [
556 "src/core/CL/kernels/CLL2NormalizeLayerKernel.cpp",
557 "src/runtime/CL/functions/CLL2NormalizeLayer.cpp"
558 ]
559 }
560 },
561 "Logical": {
562 "files": {
563 "common": [
564 "src/gpu/cl/operators/ClLogicalNot.cpp",
565 "src/runtime/CL/functions/CLLogicalAnd.cpp",
566 "src/runtime/CL/functions/CLLogicalNot.cpp",
567 "src/runtime/CL/functions/CLLogicalOr.cpp"
568 ]
569 }
570 },
571 "LSTM": {
572 "deps": [
573 "Activation",
574 "Concatenate",
575 "Copy",
576 "Dequantize",
577 "ElementwiseBinary",
578 "Fill",
579 "FullyConnected",
580 "Gemm",
581 "MeanStdDevNormalize",
582 "Mul",
583 "Quantize",
584 "Slice",
585 "Transpose"
586 ],
587 "files": {
588 "common": [
589 "src/core/CL/kernels/CLQLSTMLayerNormalizationKernel.cpp",
590 "src/runtime/CL/functions/CLQLSTMLayer.cpp",
591 "src/runtime/CL/functions/CLLSTMLayer.cpp",
592 "src/runtime/CL/functions/CLLSTMLayerQuantized.cpp"
593 ]
594 }
595 },
596 "MaxUnpool2d": {
597 "deps": [ "Fill" ],
598 "files": {
599 "common": [
600 "src/core/CL/kernels/CLMaxUnpoolingLayerKernel.cpp",
601 "src/runtime/CL/functions/CLMaxUnpoolingLayer.cpp"
602 ]
603 }
604 },
605 "MeanStdDevNormalize": {
606 "deps": [ "Reduction" ],
607 "files": {
608 "common": [
609 "src/core/CL/kernels/CLMeanStdDevNormalizationKernel.cpp",
610 "src/runtime/CL/functions/CLMeanStdDevNormalizationLayer.cpp",
611 "src/runtime/CL/functions/CLReduceMean.cpp"
612 ]
613 }
614 },
615 "Mul": {
616 "files": {
617 "common": [
618 "src/gpu/cl/kernels/ClMulKernel.cpp",
619 "src/gpu/cl/operators/ClMul.cpp",
620 "src/runtime/CL/functions/CLPixelWiseMultiplication.cpp"
621 ]
622 }
623 },
624 "Normalize": {
625 "files": {
626 "common": [
627 "src/core/CL/kernels/CLNormalizationLayerKernel.cpp",
628 "src/runtime/CL/functions/CLNormalizationLayer.cpp"
629 ]
630 }
631 },
632 "Pad": {
633 "deps": [ "Copy" ],
634 "files": {
635 "common": [
636 "src/core/CL/kernels/CLPadLayerKernel.cpp",
637 "src/runtime/CL/functions/CLPadLayer.cpp"
638 ]
639 }
640 },
641 "Permute": {
642 "files": {
643 "common": [
644 "src/gpu/cl/kernels/ClPermuteKernel.cpp",
645 "src/gpu/cl/operators/ClPermute.cpp",
646 "src/runtime/CL/functions/CLPermute.cpp"
647 ]
648 }
649 },
650 "Pool2d": {
651 "files": {
652 "common": [
653 "src/gpu/cl/kernels/ClPool2dKernel.cpp",
654 "src/gpu/cl/operators/ClPool2d.cpp",
655 "src/runtime/CL/functions/CLPoolingLayer.cpp"
656 ]
657 }
658 },
ramelg0137515692022-02-26 22:06:20 +0000659 "Pool3d": {
660 "files": {
661 "common": [
662 "src/gpu/cl/kernels/ClPool3dKernel.cpp",
663 "src/gpu/cl/operators/ClPool3d.cpp",
664 "src/runtime/CL/functions/CLPooling3dLayer.cpp"
665 ]
666 }
667 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100668 "PRelu": {
669 "deps": [ "ElementwiseBinary" ],
670 "files": {
671 "common": [
672 "src/gpu/cl/operators/ClPRelu.cpp",
673 "src/runtime/CL/functions/CLPReluLayer.cpp"
674 ]
675 }
676 },
677 "PriorBox": {
678 "files": {
679 "common": [
680 "src/core/CL/kernels/CLPriorBoxLayerKernel.cpp",
681 "src/runtime/CL/functions/CLPriorBoxLayer.cpp"
682 ]
683 }
684 },
685 "Quantize": {
686 "files": {
687 "common": [
688 "src/gpu/cl/kernels/ClQuantizeKernel.cpp",
689 "src/gpu/cl/operators/ClQuantize.cpp",
690 "src/runtime/CL/functions/CLQuantizationLayer.cpp"
691 ]
692 }
693 },
694 "Range": {
695 "files": {
696 "common": [
697 "src/core/CL/kernels/CLRangeKernel.cpp",
698 "src/runtime/CL/functions/CLRange.cpp"
699 ]
700 }
701 },
702 "Reduction": {
703 "deps": [ "Reshape" ],
704 "files": {
ramelg01a1f78512022-06-29 16:28:10 +0100705 "common": [
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100706 "src/core/CL/kernels/CLReductionOperationKernel.cpp",
707 "src/runtime/CL/functions/CLReductionOperation.cpp"
708 ]
709 }
710 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100711 "Reorg": {
712 "files": {
713 "common": [
714 "src/core/CL/kernels/CLReorgLayerKernel.cpp",
715 "src/runtime/CL/functions/CLReorgLayer.cpp"
716 ]
717 }
718 },
719 "Reshape": {
720 "files": {
721 "common": [
722 "src/gpu/cl/kernels/ClReshapeKernel.cpp",
723 "src/gpu/cl/operators/ClReshape.cpp",
724 "src/runtime/CL/functions/CLReshapeLayer.cpp"
725 ]
726 }
727 },
728 "Reverse": {
729 "files": {
730 "common": [
731 "src/core/CL/kernels/CLReverseKernel.cpp",
732 "src/runtime/CL/functions/CLReverse.cpp"
733 ]
734 }
735 },
736 "RNN": {
737 "deps": [ "Activation", "Cast", "ElementwiseBinary", "FullyConnected", "Gemm"],
738 "files": {
739 "common": [ "src/runtime/CL/functions/CLRNNLayer.cpp" ]
740 }
741 },
742 "ROIAlign": {
743 "files": {
744 "common": [
745 "src/core/CL/kernels/CLROIAlignLayerKernel.cpp",
746 "src/runtime/CL/functions/CLROIAlignLayer.cpp"
747 ]
748 }
749 },
750 "ROIPool2d": {
751 "files": {
752 "common": [
753 "src/core/CL/kernels/CLROIPoolingLayerKernel.cpp",
754 "src/runtime/CL/functions/CLROIPoolingLayer.cpp"
755 ]
756 }
757 },
758 "Scale": {
759 "files": {
760 "common": [
761 "src/gpu/cl/kernels/ClScaleKernel.cpp",
762 "src/gpu/cl/operators/ClScale.cpp",
763 "src/runtime/CL/functions/CLScale.cpp"
764 ]
765 }
766 },
767 "Select": {
768 "files": {
769 "common": [
770 "src/core/CL/kernels/CLSelectKernel.cpp",
771 "src/runtime/CL/functions/CLSelect.cpp"
772 ]
773 }
774 },
775 "Slice": {
776 "deps": [ "StridedSlice" ],
777 "files": {
778 "common": [ "src/runtime/CL/functions/CLSlice.cpp" ]
779 }
780 },
781 "Softmax": {
782 "deps": [ "Permute" ],
783 "files": {
784 "common": [
785 "src/gpu/cl/kernels/ClSoftmaxKernel.cpp",
786 "src/gpu/cl/operators/ClSoftmax.cpp",
787 "src/runtime/CL/functions/CLSoftmaxLayer.cpp"
788 ]
789 }
790 },
791 "SpaceToBatch": {
792 "files": {
793 "common": [
794 "src/core/CL/kernels/CLSpaceToBatchLayerKernel.cpp",
795 "src/runtime/CL/functions/CLSpaceToBatchLayer.cpp"
796 ]
797 }
798 },
799 "SpaceToDepth": {
800 "files": {
801 "common": [
802 "src/core/CL/kernels/CLSpaceToDepthLayerKernel.cpp",
803 "src/runtime/CL/functions/CLSpaceToDepthLayer.cpp"
804 ]
805 }
806 },
807 "Split": {
808 "deps": [ "StridedSlice" ],
809 "files": {
810 "common": [ "src/runtime/CL/functions/CLSplit.cpp" ]
811 }
812 },
813 "Stack": {
814 "files": {
815 "common": [
816 "src/core/CL/kernels/CLStackLayerKernel.cpp",
817 "src/runtime/CL/functions/CLStackLayer.cpp"
818 ]
819 }
820 },
821 "StridedSlice": {
822 "files": {
823 "common": [
824 "src/core/CL/kernels/CLStridedSliceKernel.cpp",
825 "src/runtime/CL/functions/CLStridedSlice.cpp"
826 ]
827 }
828 },
829 "Sub": {
830 "files": {
831 "common": [
832 "src/gpu/cl/kernels/ClElementwiseKernel.cpp",
833 "src/gpu/cl/operators/ClSub.cpp"
834 ]
835 }
836 },
837 "Tile": {
838 "files": {
839 "common": [
840 "src/core/CL/kernels/CLTileKernel.cpp",
841 "src/runtime/CL/functions/CLTile.cpp"
842 ]
843 }
844 },
845 "Transpose": {
846 "files": {
847 "common": [
848 "src/gpu/cl/kernels/ClTransposeKernel.cpp",
849 "src/gpu/cl/operators/ClTranspose.cpp",
850 "src/runtime/CL/functions/CLTranspose.cpp"
851 ]
852 }
853 },
854 "Unstack": {
855 "deps": [ "StridedSlice" ],
856 "files": {
857 "common": [ "src/runtime/CL/functions/CLUnstack.cpp" ]
858 }
859 },
860 "YUVNormalize": {
861 "files": {
862 "common": [
863 "src/core/CL/kernels/CLNormalizePlanarYUVLayerKernel.cpp",
864 "src/runtime/CL/functions/CLNormalizePlanarYUVLayer.cpp"
865 ]
Michalis Spyrou20fca522021-06-07 14:23:57 +0100866 }
Georgios Pinitasbdcdc392021-04-22 16:42:03 +0100867 }
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100868 }
869},
Michalis Spyrou20fca522021-06-07 14:23:57 +0100870 "cpu": {
Georgios Pinitas13ef1762021-07-14 17:14:43 +0100871 "common": [
Michalis Spyrou20fca522021-06-07 14:23:57 +0100872 "src/cpu/CpuContext.cpp",
873 "src/cpu/CpuQueue.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100874 "src/cpu/CpuTensor.cpp",
875 "src/core/NEON/kernels/NEFillBorderKernel.cpp",
876 "src/runtime/NEON/INEOperator.cpp",
877 "src/runtime/NEON/INESimpleFunction.cpp",
878 "src/runtime/NEON/INESimpleFunctionNoBorder.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +0100879 ],
880 "operators": {
881 "Activation": {
Viet-Hoa Dofd472f02023-03-15 14:05:06 +0000882 "deps": [ "LUT" ],
Michalis Spyrou20fca522021-06-07 14:23:57 +0100883 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100884 "common": [
885 "src/cpu/operators/CpuActivation.cpp",
886 "src/cpu/kernels/CpuActivationKernel.cpp",
Dana Zlotnika538ae52022-02-21 13:12:41 +0200887 "src/runtime/NEON/functions/NEActivationLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +0100888 ],
Michalis Spyrou20fca522021-06-07 14:23:57 +0100889 "neon": {
Dana Zlotnik32291712021-11-25 09:58:27 +0200890 "fp16": [ "src/cpu/kernels/activation/generic/neon/fp16.cpp" ],
ramelg01c827e992022-04-08 03:52:28 +0100891 "fp32": [ "src/cpu/kernels/activation/generic/neon/fp32.cpp" ],
Viet-Hoa Do29db3d22022-08-10 11:56:49 +0100892 "qasymm8": [
893 "src/cpu/kernels/activation/generic/neon/qasymm8.cpp",
894 "src/cpu/kernels/activation/generic/neon/lut.cpp"
895 ],
896 "qasymm8_signed": [
897 "src/cpu/kernels/activation/generic/neon/qasymm8_signed.cpp",
898 "src/cpu/kernels/activation/generic/neon/lut.cpp"
899 ],
Dana Zlotnika538ae52022-02-21 13:12:41 +0200900 "qsymm16": [ "src/cpu/kernels/activation/generic/neon/qsymm16.cpp" ]
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100901 },
902 "sve": {
Dana Zlotnik32291712021-11-25 09:58:27 +0200903 "fp16": [ "src/cpu/kernels/activation/generic/sve/fp16.cpp" ],
SiCong Lic0463a22023-05-17 13:46:13 +0100904 "fp32": [ "src/cpu/kernels/activation/generic/sve/fp32.cpp" ]
ramelg01c827e992022-04-08 03:52:28 +0100905 },
alerah01c9e519d2022-01-31 19:04:10 +0200906 "sve2":{
SiCong Lic0463a22023-05-17 13:46:13 +0100907 "qasymm8": [
908 "src/cpu/kernels/activation/generic/sve2/qasymm8.cpp",
909 "src/cpu/kernels/activation/generic/sve2/lut.cpp"
910 ],
Dana Zlotnik32291712021-11-25 09:58:27 +0200911 "qasymm8_signed": [ "src/cpu/kernels/activation/generic/sve2/qasymm8_signed.cpp" ],
912 "qsymm16": [ "src/cpu/kernels/activation/generic/sve2/qsymm16.cpp" ]
Michalis Spyrou20fca522021-06-07 14:23:57 +0100913 }
914 }
915 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100916 "ArgMinMax": {
917 "deps": [ "Reduction" ],
918 "files": {
919 "common": [ "src/runtime/NEON/functions/NEArgMinMaxLayer.cpp" ]
920 }
921 },
Michalis Spyrou20fca522021-06-07 14:23:57 +0100922 "Add": {
923 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100924 "common": [
925 "src/cpu/operators/CpuAdd.cpp",
926 "src/cpu/kernels/CpuAddKernel.cpp",
Motti Gondabi9d9ad332022-01-23 12:42:24 +0200927 "src/runtime/NEON/functions/NEArithmeticAddition.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +0100928 ],
Dana Zlotnikbd2942d2021-11-15 08:46:04 +0200929 "neon": {
Motti Gondabi9d9ad332022-01-23 12:42:24 +0200930 "common": ["src/cpu/kernels/add/generic/neon/impl.cpp"],
Dana Zlotnikbd2942d2021-11-15 08:46:04 +0200931 "fp32":["src/cpu/kernels/add/generic/neon/fp32.cpp"],
932 "fp16":["src/cpu/kernels/add/generic/neon/fp16.cpp"],
Motti Gondabi9d9ad332022-01-23 12:42:24 +0200933 "integer":["src/cpu/kernels/add/generic/neon/integer.cpp"],
934 "qasymm8": ["src/cpu/kernels/add/generic/neon/qasymm8.cpp"],
935 "qasymm8_signed": ["src/cpu/kernels/add/generic/neon/qasymm8_signed.cpp"],
936 "qsymm16": ["src/cpu/kernels/add/generic/neon/qsymm16.cpp"]
Dana Zlotnikbd2942d2021-11-15 08:46:04 +0200937 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100938 "sve": {
Dana Zlotnikbd2942d2021-11-15 08:46:04 +0200939 "common": [ "src/cpu/kernels/add/generic/sve/impl.cpp" ],
Dana Zlotnikbd2942d2021-11-15 08:46:04 +0200940 "integer":["src/cpu/kernels/add/generic/sve/integer.cpp"],
Motti Gondabi9d9ad332022-01-23 12:42:24 +0200941 "fp32":["src/cpu/kernels/add/generic/sve/fp32.cpp"],
942 "fp16":["src/cpu/kernels/add/generic/sve/fp16.cpp"]
943 },
944 "sve2": {
Dana Zlotnikbd2942d2021-11-15 08:46:04 +0200945 "qasymm8": [ "src/cpu/kernels/add/generic/sve2/qasymm8.cpp" ],
946 "qasymm8_signed": [ "src/cpu/kernels/add/generic/sve2/qasymm8_signed.cpp" ],
947 "qsymm16": [ "src/cpu/kernels/add/generic/sve2/qsymm16.cpp" ]
Michalis Spyrou20fca522021-06-07 14:23:57 +0100948 }
949 }
950 },
Gunes Bayirae72a462023-01-29 13:24:24 +0000951 "AddMulAdd": {
952 "files": {
953 "common": [
954 "src/cpu/operators/CpuAddMulAdd.cpp",
955 "src/cpu/kernels/CpuAddMulAddKernel.cpp",
956 "src/runtime/NEON/functions/NEAddMulAdd.cpp"
957 ],
958 "neon": {
959 "fp32":["src/cpu/kernels/addmuladd/generic/neon/fp32.cpp"],
960 "fp16":["src/cpu/kernels/addmuladd/generic/neon/fp16.cpp"],
961 "qasymm8": ["src/cpu/kernels/addmuladd/generic/neon/qasymm8.cpp"],
962 "qasymm8_signed": ["src/cpu/kernels/addmuladd/generic/neon/qasymm8_signed.cpp"]
963 }
964 }
965 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100966 "BatchNormalize": {
Michalis Spyrou20fca522021-06-07 14:23:57 +0100967 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100968 "common": [
969 "src/core/NEON/kernels/NEBatchNormalizationLayerKernel.cpp",
970 "src/core/NEON/kernels/NEFuseBatchNormalizationKernel.cpp",
971 "src/runtime/NEON/functions/NEBatchNormalizationLayer.cpp",
972 "src/runtime/NEON/functions/NEFuseBatchNormalization.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +0100973 ],
Michalis Spyrou20fca522021-06-07 14:23:57 +0100974 "neon": {
Yair Schwarzbaum41a729e2021-11-15 20:42:47 +0200975 "common": [
Pablo Marquez Tello7e589802023-09-14 09:41:37 +0100976 "src/cpu/kernels/fuse_batch_normalization/nchw/all.cpp"
Yair Schwarzbaum41a729e2021-11-15 20:42:47 +0200977 ],
978 "fp16": [
979 "src/cpu/kernels/fuse_batch_normalization/generic/fp16.cpp",
980 "src/core/NEON/kernels/batchnormalization/impl/NEON/fp16.cpp",
981 "src/cpu/kernels/fuse_batch_normalization/nhwc/neon/fp16.cpp"
982 ],
983 "fp32": [
984 "src/cpu/kernels/fuse_batch_normalization/generic/fp32.cpp",
985 "src/core/NEON/kernels/batchnormalization/impl/NEON/fp32.cpp",
986 "src/cpu/kernels/fuse_batch_normalization/nhwc/neon/fp32.cpp"
987 ]
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100988 },
989 "sve": {
990 "fp16": [ "src/core/NEON/kernels/batchnormalization/impl/SVE/fp16.cpp" ],
991 "fp32": [ "src/core/NEON/kernels/batchnormalization/impl/SVE/fp32.cpp" ]
Michalis Spyrou20fca522021-06-07 14:23:57 +0100992 }
993 }
994 },
995 "BatchToSpace": {
996 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100997 "common": [
998 "src/core/NEON/kernels/NEBatchToSpaceLayerKernel.cpp",
999 "src/runtime/NEON/functions/NEBatchToSpaceLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001000 ]
1001 }
1002 },
1003 "BitwiseAnd": {
1004 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001005 "common": [
1006 "src/core/NEON/kernels/NEBitwiseAndKernel.cpp",
1007 "src/runtime/NEON/functions/NEBitwiseAnd.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001008 ]
1009 }
1010 },
1011 "BitwiseNot": {
1012 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001013 "common": [
1014 "src/core/NEON/kernels/NEBitwiseNotKernel.cpp",
1015 "src/runtime/NEON/functions/NEBitwiseNot.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001016 ]
1017 }
1018 },
1019 "BitwiseOr": {
1020 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001021 "common": [
1022 "src/core/NEON/kernels/NEBitwiseOrKernel.cpp",
1023 "src/runtime/NEON/functions/NEBitwiseOr.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001024 ]
1025 }
1026 },
1027 "BitwiseXor": {
1028 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001029 "common": [
1030 "src/core/NEON/kernels/NEBitwiseXorKernel.cpp",
1031 "src/runtime/NEON/functions/NEBitwiseXor.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001032 ]
1033 }
1034 },
1035 "BoundingBoxTransform": {
1036 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001037 "common": [
1038 "src/core/NEON/kernels/NEBoundingBoxTransformKernel.cpp",
1039 "src/runtime/NEON/functions/NEBoundingBoxTransform.cpp"
Dana Zlotnik3475ffe2022-01-03 14:37:10 +02001040 ],
1041 "neon":{
1042 "common":["src/cpu/kernels/boundingboxtransform/generic/neon/impl.cpp"],
1043 "fp32":["src/cpu/kernels/boundingboxtransform/generic/neon/fp32.cpp"],
1044 "fp16":["src/cpu/kernels/boundingboxtransform/generic/neon/fp16.cpp"],
1045 "qsymm16":["src/cpu/kernels/boundingboxtransform/generic/neon/qsymm16.cpp"]
Dana Zlotnik3475ffe2022-01-03 14:37:10 +02001046 }
Michalis Spyrou20fca522021-06-07 14:23:57 +01001047 }
1048 },
1049 "Cast": {
1050 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001051 "common": [
1052 "src/cpu/operators/CpuCast.cpp",
1053 "src/cpu/kernels/CpuCastKernel.cpp",
Yair Schwarzbaum298b2c02022-02-01 08:55:56 +02001054 "src/runtime/NEON/functions/NECast.cpp",
1055 "src/cpu/kernels/cast/generic/neon/bfloat16.cpp"
1056 ],
1057 "neon":{
1058 "fp16":["src/cpu/kernels/cast/generic/neon/fp16.cpp"]
1059 }
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001060 }
1061 },
1062 "ChannelShuffle": {
1063 "files": {
1064 "common": [
1065 "src/core/NEON/kernels/NEChannelShuffleLayerKernel.cpp",
1066 "src/runtime/NEON/functions/NEChannelShuffleLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001067 ]
1068 }
1069 },
1070 "Concatenate": {
1071 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001072 "common": [
1073 "src/cpu/operators/CpuConcatenate.cpp",
Georgios Pinitas7891a732021-08-20 21:39:25 +01001074 "src/cpu/kernels/CpuConcatenateWidthKernel.cpp",
1075 "src/cpu/kernels/CpuConcatenateBatchKernel.cpp",
1076 "src/cpu/kernels/CpuConcatenateDepthKernel.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001077 "src/cpu/kernels/CpuConcatenateHeightKernel.cpp",
1078 "src/runtime/NEON/functions/NEConcatenateLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001079 ]
1080 }
1081 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001082 "Conv2d": {
1083 "deps": [
1084 "Activation",
1085 "ElementwiseBinary",
1086 "FFT2D",
1087 "Gemm",
1088 "Mul",
1089 "Pad",
1090 "Permute",
1091 "Reshape",
1092 "Reverse",
1093 "Slice"
1094 ],
Michalis Spyrou20fca522021-06-07 14:23:57 +01001095 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001096 "common": [
1097 "src/cpu/operators/CpuConv2d.cpp",
1098 "src/cpu/operators/CpuDirectConv2d.cpp",
1099 "src/cpu/operators/CpuGemmDirectConv2d.cpp",
1100 "src/cpu/operators/CpuGemmConv2d.cpp",
1101 "src/cpu/operators/CpuWinogradConv2d.cpp",
1102 "src/cpu/operators/internal/CpuGemmAssemblyDispatch.cpp",
1103 "src/cpu/kernels/CpuDirectConv2dKernel.cpp",
1104 "src/cpu/kernels/CpuDirectConv2dOutputStageKernel.cpp",
1105 "src/cpu/kernels/CpuWinogradConv2dKernel.cpp",
1106 "src/cpu/kernels/CpuCol2ImKernel.cpp",
1107 "src/cpu/kernels/CpuIm2ColKernel.cpp",
1108 "src/cpu/kernels/CpuWeightsReshapeKernel.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001109 "src/runtime/NEON/functions/NEConvolutionLayer.cpp",
1110 "src/runtime/NEON/functions/NEDirectConvolutionLayer.cpp",
1111 "src/runtime/NEON/functions/NEFFTConvolutionLayer.cpp",
1112 "src/runtime/NEON/functions/NEGEMMConv2d.cpp",
1113 "src/runtime/NEON/functions/NEGEMMConvolutionLayer.cpp",
1114 "src/runtime/NEON/functions/NEWinogradConvolutionLayer.cpp"
Motti Gondabi9d9ad332022-01-23 12:42:24 +02001115 ],
1116 "neon": {
1117 "common": [
1118 "src/core/NEON/kernels/convolution/common/padding.cpp",
1119 "src/core/NEON/kernels/convolution/common/qasymm8.cpp",
1120 "src/core/NEON/kernels/convolution/common/qsymm8.cpp",
1121 "src/core/NEON/kernels/convolution/common/utils.cpp",
ramelg01a1f78512022-06-29 16:28:10 +01001122 "src/core/NEON/kernels/convolution/winograd/input_transforms_fp16.cpp",
1123 "src/core/NEON/kernels/convolution/winograd/input_transforms_fp32.cpp",
1124 "src/core/NEON/kernels/convolution/winograd/output_transforms_fp16.cpp",
1125 "src/core/NEON/kernels/convolution/winograd/output_transforms_fp32.cpp",
1126 "src/core/NEON/kernels/convolution/winograd/weight_transforms_fp16.cpp",
1127 "src/core/NEON/kernels/convolution/winograd/weight_transforms_fp32.cpp",
1128 "src/core/NEON/kernels/convolution/winograd/winograd_fp16.cpp",
1129 "src/core/NEON/kernels/convolution/winograd/winograd_fp32.cpp",
1130 "src/core/NEON/kernels/convolution/winograd/input_transforms/a64_fp16_6x6.cpp",
1131 "src/core/NEON/kernels/convolution/winograd/input_transforms/a64_fp32_6x6.cpp",
1132 "src/core/NEON/kernels/convolution/winograd/input_transforms/arm_fp32_1x8.cpp",
1133 "src/core/NEON/kernels/convolution/winograd/input_transforms/arm_fp32_4x4.cpp",
1134 "src/core/NEON/kernels/convolution/winograd/input_transforms/arm_fp32_6x6.cpp",
ramelg01a1f78512022-06-29 16:28:10 +01001135 "src/core/NEON/kernels/convolution/winograd/output_transforms/a64_fp16_4x4_3x3.cpp",
1136 "src/core/NEON/kernels/convolution/winograd/output_transforms/arm_fp32_1x2_1x7.cpp",
1137 "src/core/NEON/kernels/convolution/winograd/output_transforms/arm_fp32_1x4_1x5.cpp",
1138 "src/core/NEON/kernels/convolution/winograd/output_transforms/arm_fp32_1x6_1x3.cpp",
1139 "src/core/NEON/kernels/convolution/winograd/output_transforms/arm_fp32_2x2_3x3.cpp",
1140 "src/core/NEON/kernels/convolution/winograd/output_transforms/arm_fp32_2x2_5x5.cpp",
1141 "src/core/NEON/kernels/convolution/winograd/output_transforms/arm_fp32_4x4_3x3.cpp",
1142 "src/core/NEON/kernels/convolution/winograd/weight_transforms/a64_fp16_4x4_3x3.cpp",
1143 "src/core/NEON/kernels/convolution/winograd/weight_transforms/arm_fp32_2x2_3x3.cpp",
1144 "src/core/NEON/kernels/convolution/winograd/weight_transforms/arm_fp32_2x2_5x5.cpp",
1145 "src/core/NEON/kernels/convolution/winograd/weight_transforms/arm_fp32_4x4_3x3.cpp",
1146 "src/core/NEON/kernels/convolution/winograd/weight_transforms/cpp_fp32_1x2_1x7.cpp",
1147 "src/core/NEON/kernels/convolution/winograd/weight_transforms/cpp_fp32_1x4_1x5.cpp",
1148 "src/core/NEON/kernels/convolution/winograd/weight_transforms/cpp_fp32_1x6_1x3.cpp",
alerah01c9e519d2022-01-31 19:04:10 +02001149 "src/cpu/kernels/directconv2d/nhwc/neon/impl.cpp",
1150 "src/cpu/kernels/directconv2d/nchw/all.cpp"
1151 ],
1152 "fp32": [
1153 "src/cpu/kernels/directconv2d/nhwc/neon/fp32.cpp"
Motti Gondabi9d9ad332022-01-23 12:42:24 +02001154 ]
ramelg0199c46472022-07-15 13:08:39 +01001155 },
1156 "sve": {
Viet-Hoa Do03b29712022-06-01 11:47:14 +01001157 "common": [
1158 "src/core/NEON/kernels/convolution/winograd/input_transforms/sve_fp32_6x6.cpp",
1159 "src/core/NEON/kernels/convolution/winograd/input_transforms/sme_fp32_mla_6x6.cpp",
1160 "src/core/NEON/kernels/convolution/winograd/output_transforms/sme_fp32_mopa_4x4_3x3.cpp"
1161 ]
Motti Gondabi9d9ad332022-01-23 12:42:24 +02001162 }
Michalis Spyroub55f8e82021-07-22 11:23:11 +01001163 }
1164 },
Michalis Spyrou20fca522021-06-07 14:23:57 +01001165 "Copy": {
1166 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001167 "common": [
1168 "src/cpu/operators/CpuCopy.cpp",
1169 "src/cpu/kernels/CpuCopyKernel.cpp",
1170 "src/runtime/NEON/functions/NECopy.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001171 ]
1172 }
1173 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001174 "CropResize": {
1175 "deps": [ "Scale" ],
Michalis Spyrou20fca522021-06-07 14:23:57 +01001176 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001177 "common": [
1178 "src/core/NEON/kernels/NECropKernel.cpp",
1179 "src/runtime/NEON/functions/NECropResize.cpp"
alerah0127619932021-11-24 17:21:43 +02001180 ],
1181 "neon": {
alerah0127619932021-11-24 17:21:43 +02001182 "fp32": [ "src/cpu/kernels/crop/generic/neon/fp32.cpp" ],
1183 "fp16": [ "src/cpu/kernels/crop/generic/neon/fp16.cpp" ],
1184 "integer": [ "src/cpu/kernels/crop/generic/neon/integer.cpp" ]
Motti Gondabi9d9ad332022-01-23 12:42:24 +02001185 }
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001186 }
1187 },
1188 "Deconv2d": {
1189 "deps": [ "Conv2d", "Reverse", "Transpose"],
1190 "files": {
1191 "common": [
1192 "src/runtime/NEON/functions/NEDeconvolutionLayer.cpp"
1193 ]
1194 }
1195 },
1196 "DepthConvert": {
1197 "deps": [ "Cast"],
1198 "files": {
1199 "common": [
1200 "src/runtime/NEON/functions/NEDepthConvertLayer.cpp"
1201 ]
1202 }
1203 },
1204 "DepthToSpace": {
1205 "files": {
1206 "common": [
1207 "src/core/NEON/kernels/NEDepthToSpaceLayerKernel.cpp",
1208 "src/runtime/NEON/functions/NEDepthToSpaceLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001209 ]
1210 }
1211 },
1212 "DepthwiseConv2d": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001213 "deps": [ "Activation", "Permute" ],
Michalis Spyrou20fca522021-06-07 14:23:57 +01001214 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001215 "common": [
Georgios Pinitas7891a732021-08-20 21:39:25 +01001216 "src/cpu/operators/CpuDepthwiseConv2d.cpp",
1217 "src/cpu/operators/CpuDepthwiseConv2dAssemblyDispatch.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001218 "src/cpu/kernels/CpuDepthwiseConv2dNativeKernel.cpp",
1219 "src/cpu/kernels/internal/CpuDepthwiseConv2dAssemblyWrapperKernel.cpp",
Motti Gondabi9d9ad332022-01-23 12:42:24 +02001220 "src/runtime/NEON/functions/NEDepthwiseConvolutionLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001221 ],
Motti Gondabi9d9ad332022-01-23 12:42:24 +02001222 "neon": {
1223 "common": [
1224 "src/core/NEON/kernels/convolution/common/padding.cpp",
1225 "src/core/NEON/kernels/convolution/common/qasymm8.cpp",
1226 "src/core/NEON/kernels/convolution/common/qsymm8.cpp",
1227 "src/core/NEON/kernels/convolution/common/utils.cpp",
ramelg01c827e992022-04-08 03:52:28 +01001228 "src/core/NEON/kernels/arm_conv/addressing.cpp",
Pablo Marquez Tello4e2bbbb2023-01-09 17:21:01 +00001229 "src/core/NEON/kernels/arm_conv/depthwise/depthwise_common.cpp",
ramelg018a164882022-04-07 02:42:52 +01001230 "src/core/NEON/kernels/arm_conv/depthwise/depthwise_strategies_common.cpp",
Motti Gondabi9d9ad332022-01-23 12:42:24 +02001231 "src/core/NEON/kernels/arm_conv/depthwise/depthwise_u8q.cpp",
1232 "src/core/NEON/kernels/arm_conv/depthwise/depthwise_u8s8u8q.cpp",
Motti Gondabi9d9ad332022-01-23 12:42:24 +02001233 "src/core/NEON/kernels/arm_conv/depthwise/depthwise_s8q.cpp",
1234 "src/core/NEON/kernels/arm_conv/depthwise/depthwise_fp32.cpp",
1235 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_packed_to_nhwc_generic_with_multiplier_output2x8_mla_depthfirst/generic.cpp",
1236 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_packed_to_nhwc_3x3_s2_with_multiplier_output3x3_mla_depthfirst/generic.cpp",
1237 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_packed_to_nhwc_5x5_s1_with_multiplier_output2x4_mla_depthfirst/generic.cpp",
1238 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_packed_to_nhwc_generic_with_multiplier_output2x8_mla_depthfirst/generic.cpp",
1239 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_s8q_packed_to_nhwc_3x3_s2_with_multiplier_output2x4_dot_depthfirst/generic.cpp",
1240 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_s8q_packed_to_nhwc_5x5_s1_with_multiplier_output4x2_dot_depthfirst/generic.cpp",
1241 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_s8q_packed_to_nhwc_generic_with_multiplier_output2x8_mla_depthfirst/generic.cpp",
1242 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8q_packed_to_nhwc_3x3_s2_with_multiplier_output2x4_dot_depthfirst/generic.cpp",
1243 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8q_packed_to_nhwc_5x5_s1_with_multiplier_output4x2_dot_depthfirst/generic.cpp",
1244 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8q_packed_to_nhwc_generic_with_multiplier_output2x8_mla_depthfirst/generic.cpp",
1245 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8s8u8q_packed_to_nhwc_generic_with_multiplier_output2x8_mla_depthfirst/generic.cpp",
ramelg018a164882022-04-07 02:42:52 +01001246 "src/core/NEON/kernels/arm_conv/depthwise/depthwise_fp16.cpp",
Motti Gondabi9d9ad332022-01-23 12:42:24 +02001247 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_nhwc_3x3_s1_output2x2_mla_depthfirst/generic_direct.cpp",
1248 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_nhwc_3x3_s1_output2x2_mla_depthfirst/generic_indirect.cpp",
1249 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_nhwc_3x3_s1_output3x3_mla_depthfirst/generic_direct.cpp",
1250 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_nhwc_3x3_s1_output3x3_mla_depthfirst/generic_indirect.cpp",
1251 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_nhwc_3x3_s1_output4x4_mla_depthfirst/generic_direct.cpp",
1252 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_nhwc_3x3_s1_output4x4_mla_depthfirst/generic_indirect.cpp",
1253 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_nhwc_3x3_s2_output2x2_mla_depthfirst/generic_direct.cpp",
1254 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_nhwc_3x3_s2_output2x2_mla_depthfirst/generic_indirect.cpp",
1255 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_nhwc_5x5_s1_output2x2_mla_depthfirst/generic_direct.cpp",
1256 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_nhwc_5x5_s1_output2x2_mla_depthfirst/generic_indirect.cpp",
1257 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_nhwc_generic_output9_mla_depthfirst/generic.cpp",
1258 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_nhwc_3x3_s1_output2x2_mla_depthfirst/generic_direct.cpp",
1259 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_nhwc_3x3_s1_output2x2_mla_depthfirst/generic_indirect.cpp",
1260 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_nhwc_3x3_s1_output3x3_mla_depthfirst/generic_direct.cpp",
1261 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_nhwc_3x3_s1_output3x3_mla_depthfirst/generic_indirect.cpp",
1262 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_nhwc_3x3_s1_output4x4_mla_depthfirst/generic_direct.cpp",
1263 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_nhwc_3x3_s1_output4x4_mla_depthfirst/generic_indirect.cpp",
1264 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_nhwc_3x3_s2_output2x2_mla_depthfirst/generic_direct.cpp",
1265 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_nhwc_3x3_s2_output2x2_mla_depthfirst/generic_indirect.cpp",
1266 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_nhwc_5x5_s1_output2x2_mla_depthfirst/generic_direct.cpp",
1267 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_nhwc_5x5_s1_output2x2_mla_depthfirst/generic_indirect.cpp",
1268 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_nhwc_generic_output9_mla_depthfirst/generic.cpp",
1269 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_s8q_nhwc_3x3_s1_output2x2_dot_depthfirst/generic.cpp",
1270 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_s8q_nhwc_3x3_s1_output2x2_mla_depthfirst/generic.cpp",
1271 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_s8q_nhwc_3x3_s2_output2x2_mla_depthfirst/generic.cpp",
1272 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_s8q_nhwc_5x5_s1_output2x2_mla_depthfirst/generic.cpp",
1273 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_s8q_nhwc_generic_output9_mla_depthfirst/generic.cpp",
1274 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_s8qs_nhwc_3x3_s1_output2x2_dot_depthfirst/generic.cpp",
1275 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8q_nhwc_3x3_s1_output2x2_dot_depthfirst/generic.cpp",
1276 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8q_nhwc_3x3_s1_output2x2_mla_depthfirst/generic.cpp",
1277 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8q_nhwc_3x3_s2_output2x2_mla_depthfirst/generic.cpp",
1278 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8q_nhwc_5x5_s1_output2x2_mla_depthfirst/generic.cpp",
1279 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8q_nhwc_generic_output9_mla_depthfirst/generic.cpp",
1280 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8s8u8q_nhwc_3x3_s1_output2x2_mla_depthfirst/generic.cpp",
1281 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8s8u8q_nhwc_3x3_s2_output2x2_mla_depthfirst/generic.cpp",
1282 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8s8u8q_nhwc_5x5_s1_output2x2_mla_depthfirst/generic.cpp",
1283 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8s8u8q_nhwc_generic_output9_mla_depthfirst/generic.cpp",
ramelg018a164882022-04-07 02:42:52 +01001284 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8qa_nhwc_3x3_s1_output2x2_mla_depthfirst/generic.cpp",
1285 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8qa_nhwc_3x3_s2_output2x2_mla_depthfirst/generic.cpp",
1286 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8qa_nhwc_5x5_s1_output2x2_mla_depthfirst/generic.cpp",
Motti Gondabi9d9ad332022-01-23 12:42:24 +02001287 "src/core/NEON/kernels/arm_conv/depthwise/interleaves/a64_s8q_3x3_dot.cpp",
ramelg01c827e992022-04-08 03:52:28 +01001288 "src/core/NEON/kernels/arm_conv/depthwise/interleaves/a64_u8q_3x3_dot.cpp",
ramelg018a164882022-04-07 02:42:52 +01001289 "src/core/NEON/kernels/arm_conv/depthwise/interleaves/generic.cpp",
1290 "src/core/NEON/kernels/arm_conv/depthwise/interleaves/generic_quantized_dot_product.cpp",
Michael Tyler8deee9b2023-06-30 11:26:05 +01001291 "src/core/NEON/kernels/arm_conv/depthwise/premultiply.cpp",
Dana Zlotnikebbae942022-02-03 12:52:15 +02001292 "src/cpu/kernels/depthwiseconv2d/generic/neon/impl.cpp"
ramelg01a1f78512022-06-29 16:28:10 +01001293 ],
Dana Zlotnikebbae942022-02-03 12:52:15 +02001294 "fp16":["src/cpu/kernels/depthwiseconv2d/generic/neon/fp16.cpp"],
ramelg01a1f78512022-06-29 16:28:10 +01001295 "fp32":["src/cpu/kernels/depthwiseconv2d/generic/neon/fp32.cpp"],
1296 "qasymm8":["src/cpu/kernels/depthwiseconv2d/generic/neon/qasymm8.cpp"],
Dana Zlotnikebbae942022-02-03 12:52:15 +02001297 "qasymm8_signed":["src/cpu/kernels/depthwiseconv2d/generic/neon/qasymm8_signed.cpp"]
Motti Gondabi9d9ad332022-01-23 12:42:24 +02001298 },
Michalis Spyrou20fca522021-06-07 14:23:57 +01001299 "sve": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001300 "common": [
Michalis Spyrou20fca522021-06-07 14:23:57 +01001301 "src/core/NEON/kernels/arm_conv/depthwise/interleaves/sve_s8q_3x3_dot.cpp",
1302 "src/core/NEON/kernels/arm_conv/depthwise/interleaves/sve_u8q_3x3_dot.cpp",
1303 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp16_nhwc_3x3_s1_output2x2_mla_depthfirst/generic_direct.cpp",
1304 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp16_nhwc_3x3_s1_output2x2_mla_depthfirst/generic_indirect.cpp",
1305 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp16_nhwc_3x3_s1_output3x3_mla_depthfirst/generic_direct.cpp",
1306 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp16_nhwc_3x3_s1_output3x3_mla_depthfirst/generic_indirect.cpp",
1307 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp16_nhwc_3x3_s1_output4x4_mla_depthfirst/generic_direct.cpp",
1308 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp16_nhwc_3x3_s1_output4x4_mla_depthfirst/generic_indirect.cpp",
1309 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp16_nhwc_3x3_s2_output2x2_mla_depthfirst/generic_direct.cpp",
1310 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp16_nhwc_3x3_s2_output2x2_mla_depthfirst/generic_indirect.cpp",
1311 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp16_nhwc_5x5_s1_output2x2_mla_depthfirst/generic_direct.cpp",
1312 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp16_nhwc_5x5_s1_output2x2_mla_depthfirst/generic_indirect.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +01001313 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_nhwc_3x3_s1_output2x2_mla_depthfirst/generic_direct.cpp",
1314 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_nhwc_3x3_s1_output2x2_mla_depthfirst/generic_indirect.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +01001315 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_nhwc_3x3_s1_output3x3_mla_depthfirst/generic_direct.cpp",
1316 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_nhwc_3x3_s1_output3x3_mla_depthfirst/generic_indirect.cpp",
1317 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_nhwc_3x3_s1_output4x4_mla_depthfirst/generic_direct.cpp",
1318 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_nhwc_3x3_s1_output4x4_mla_depthfirst/generic_indirect.cpp",
1319 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_nhwc_3x3_s2_output2x2_mla_depthfirst/generic_direct.cpp",
1320 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_nhwc_3x3_s2_output2x2_mla_depthfirst/generic_indirect.cpp",
1321 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_nhwc_5x5_s1_output2x2_mla_depthfirst/generic_direct.cpp",
1322 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_nhwc_5x5_s1_output2x2_mla_depthfirst/generic_indirect.cpp",
1323 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_nhwc_generic_output9_mla_depthfirst/generic.cpp",
1324 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_packed_to_nhwc_3x3_s2_with_multiplier_output3x3_mla_depthfirst/generic.cpp",
1325 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_packed_to_nhwc_5x5_s1_with_multiplier_output2x4_mla_depthfirst/generic.cpp",
1326 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_packed_to_nhwc_generic_with_multiplier_output2x8_mla_depthfirst/generic.cpp",
1327 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_s8q_nhwc_3x3_s1_output2x2_dot_depthfirst/generic.cpp",
1328 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_s8q_nhwc_3x3_s1_output2x2_mla_depthfirst/generic.cpp",
1329 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_s8q_nhwc_3x3_s2_output2x2_mla_depthfirst/generic.cpp",
1330 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_s8q_nhwc_5x5_s1_output2x2_mla_depthfirst/generic.cpp",
1331 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_s8q_packed_to_nhwc_3x3_s2_with_multiplier_output2x4_dot_depthfirst/generic.cpp",
1332 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_s8q_packed_to_nhwc_5x5_s1_with_multiplier_output4x2_dot_depthfirst/generic.cpp",
1333 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_s8qs_nhwc_3x3_s1_output2x2_dot_depthfirst/generic.cpp",
1334 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_u8q_nhwc_3x3_s1_output2x2_dot_depthfirst/generic.cpp",
1335 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_u8q_nhwc_3x3_s1_output2x2_mla_depthfirst/generic.cpp",
1336 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_u8q_nhwc_3x3_s2_output2x2_mla_depthfirst/generic.cpp",
1337 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_u8q_nhwc_5x5_s1_output2x2_mla_depthfirst/generic.cpp",
1338 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_u8q_packed_to_nhwc_3x3_s2_with_multiplier_output2x4_dot_depthfirst/generic.cpp",
1339 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_u8q_packed_to_nhwc_5x5_s1_with_multiplier_output4x2_dot_depthfirst/generic.cpp",
1340 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_u8s8u8q_nhwc_3x3_s1_output2x2_mla_depthfirst/generic.cpp",
1341 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_u8s8u8q_nhwc_3x3_s2_output2x2_mla_depthfirst/generic.cpp",
Viet-Hoa Do03b29712022-06-01 11:47:14 +01001342 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_u8s8u8q_nhwc_5x5_s1_output2x2_mla_depthfirst/generic.cpp",
David Mansellb2758f32023-03-30 19:10:52 +01001343 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp16_nhwc_3x3_s1_output2x2_mla_depthfirst/generic_direct.cpp",
1344 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp16_nhwc_3x3_s1_output2x2_mla_depthfirst/generic_indirect.cpp",
1345 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp16_nhwc_3x3_s1_output3x3_mla_depthfirst/generic_direct.cpp",
1346 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp16_nhwc_3x3_s1_output3x3_mla_depthfirst/generic_indirect.cpp",
1347 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp16_nhwc_3x3_s1_output4x4_mla_depthfirst/generic_direct.cpp",
1348 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp16_nhwc_3x3_s1_output4x4_mla_depthfirst/generic_indirect.cpp",
1349 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp16_nhwc_3x3_s2_output2x2_mla_depthfirst/generic_direct.cpp",
1350 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp16_nhwc_3x3_s2_output2x2_mla_depthfirst/generic_indirect.cpp",
1351 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp16_nhwc_5x5_s1_output2x2_mla_depthfirst/generic_direct.cpp",
1352 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp16_nhwc_5x5_s1_output2x2_mla_depthfirst/generic_indirect.cpp",
Viet-Hoa Do03b29712022-06-01 11:47:14 +01001353 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32_nhwc_3x3_s1_output2x2_mla_depthfirst/generic_direct.cpp",
1354 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32_nhwc_3x3_s1_output2x2_mla_depthfirst/generic_indirect.cpp",
1355 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32_nhwc_3x3_s1_output3x3_mla_depthfirst/generic_direct.cpp",
1356 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32_nhwc_3x3_s1_output3x3_mla_depthfirst/generic_indirect.cpp",
1357 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32_nhwc_3x3_s1_output4x4_mla_depthfirst/generic_direct.cpp",
1358 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32_nhwc_3x3_s1_output4x4_mla_depthfirst/generic_indirect.cpp",
1359 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32_nhwc_3x3_s2_output2x2_mla_depthfirst/generic_direct.cpp",
1360 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32_nhwc_3x3_s2_output2x2_mla_depthfirst/generic_indirect.cpp",
1361 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32_planar_3x3_s1_4rows_mla_za/generic.cpp",
1362 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32_planar_3x3_s2_4rows_mla_za/generic.cpp",
1363 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32_planar_5x5_s1_4rows_mla_za/generic.cpp",
1364 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32_planar_5x5_s2_4rows_mla_za/generic.cpp",
1365 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32bf16fp32_planar_3x3_s1_4rows_dot_za/generic.cpp",
1366 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32bf16fp32_planar_3x3_s2_4rows_dot_za/generic.cpp",
1367 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32bf16fp32_planar_5x5_s1_4rows_dot_za/generic.cpp",
1368 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32bf16fp32_planar_5x5_s2_4rows_dot_za/generic.cpp",
1369 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_s8q_planar_3x3_s1_4rows_dot_za/generic.cpp",
Viet-Hoa Do03b29712022-06-01 11:47:14 +01001370 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_s8q_planar_3x3_s2_4rows_dot_za/generic.cpp",
1371 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_s8q_planar_5x5_s1_4rows_dot_za/generic.cpp",
1372 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_s8q_planar_5x5_s2_4rows_dot_za/generic.cpp",
1373 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_u8q_planar_3x3_s1_4rows_dot_za/generic.cpp",
Viet-Hoa Do03b29712022-06-01 11:47:14 +01001374 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_u8q_planar_3x3_s2_4rows_dot_za/generic.cpp",
1375 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_u8q_planar_5x5_s1_4rows_dot_za/generic.cpp",
1376 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_u8q_planar_5x5_s2_4rows_dot_za/generic.cpp",
1377 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_u8s8u8q_planar_3x3_s1_4rows_dot_za/generic.cpp",
Viet-Hoa Do03b29712022-06-01 11:47:14 +01001378 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_u8s8u8q_planar_3x3_s2_4rows_dot_za/generic.cpp",
1379 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_u8s8u8q_planar_5x5_s1_4rows_dot_za/generic.cpp",
1380 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_u8s8u8q_planar_5x5_s2_4rows_dot_za/generic.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001381 ]
1382 }
1383 }
1384 },
Michalis Spyrou20fca522021-06-07 14:23:57 +01001385 "Dequantize": {
1386 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001387 "common": [
1388 "src/cpu/operators/CpuDequantize.cpp",
1389 "src/cpu/kernels/CpuDequantizeKernel.cpp",
1390 "src/runtime/NEON/functions/NEDequantizationLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001391 ]
1392 }
1393 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001394 "DetectionPostProcess": {
1395 "deps": [ "Dequantize" ],
Michalis Spyrou20fca522021-06-07 14:23:57 +01001396 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001397 "common" : [ "src/runtime/NEON/functions/NEDetectionPostProcessLayer.cpp" ]
Michalis Spyrou20fca522021-06-07 14:23:57 +01001398 }
1399 },
Sheri Zhang6d9c9822021-09-24 16:02:57 +01001400 "Conv3d": {
1401 "deps": [
1402 "Activation"
1403 ],
1404 "files": {
1405 "common": [
1406 "src/cpu/operators/CpuDirectConv3d.cpp",
1407 "src/cpu/kernels/CpuDirectConv3dKernel.cpp",
1408 "src/runtime/NEON/functions/NEConv3D.cpp"
1409 ]
1410 }
1411 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001412 "ElementwiseBinary": {
Michalis Spyrou20fca522021-06-07 14:23:57 +01001413 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001414 "common": [
1415 "src/cpu/operators/CpuElementwise.cpp",
1416 "src/cpu/kernels/CpuElementwiseKernel.cpp",
Dana Zlotnik6a2df882022-01-17 09:54:26 +02001417 "src/runtime/NEON/functions/NEElementwiseOperations.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001418 ],
Dana Zlotnikd5c496d2021-11-28 14:46:12 +02001419 "neon":{
1420 "fp32": ["src/cpu/kernels/elementwise_binary/generic/neon/fp32.cpp"],
1421 "fp16": ["src/cpu/kernels/elementwise_binary/generic/neon/fp16.cpp"],
Dana Zlotnik6a2df882022-01-17 09:54:26 +02001422 "integer": ["src/cpu/kernels/elementwise_binary/generic/neon/integer.cpp"],
1423 "qasymm8": ["src/cpu/kernels/elementwise_binary/generic/neon/qasymm8.cpp"],
1424 "qasymm8_signed": ["src/cpu/kernels/elementwise_binary/generic/neon/qasymm8_signed.cpp"]
Dana Zlotnikd5c496d2021-11-28 14:46:12 +02001425 },
Michalis Spyrou20fca522021-06-07 14:23:57 +01001426 "sve": {
Dana Zlotnikd5c496d2021-11-28 14:46:12 +02001427 "common": ["src/cpu/kernels/elementwise_binary/generic/sve/impl.cpp" ],
1428 "integer": ["src/cpu/kernels/elementwise_binary/generic/sve/integer.cpp"],
1429 "fp32": ["src/cpu/kernels/elementwise_binary/generic/sve/fp32.cpp"],
Dana Zlotnik6a2df882022-01-17 09:54:26 +02001430 "fp16": ["src/cpu/kernels/elementwise_binary/generic/sve/fp16.cpp"]
1431
ramelg01a1f78512022-06-29 16:28:10 +01001432 },
Dana Zlotnik6a2df882022-01-17 09:54:26 +02001433 "sve2":{
Dana Zlotnikd5c496d2021-11-28 14:46:12 +02001434 "qasymm8": ["src/cpu/kernels/elementwise_binary/generic/sve2/qasymm8.cpp"],
1435 "qasymm8_signed": ["src/cpu/kernels/elementwise_binary/generic/sve2/qasymm8_signed.cpp"]
Michalis Spyrou20fca522021-06-07 14:23:57 +01001436 }
1437 }
1438 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001439 "ElementwiseUnary":{
Viet-Hoa Dofd472f02023-03-15 14:05:06 +00001440 "deps": [ "LUT" ],
Michalis Spyrou20fca522021-06-07 14:23:57 +01001441 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001442 "common": [
1443 "src/cpu/operators/CpuElementwiseUnary.cpp",
1444 "src/cpu/kernels/CpuElementwiseUnaryKernel.cpp",
1445 "src/runtime/NEON/functions/NEElementwiseUnaryLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001446 ],
Dana Zlotnikd5c496d2021-11-28 14:46:12 +02001447 "neon": {
1448 "integer": ["src/cpu/kernels/elementwise_unary/generic/neon/integer.cpp"],
1449 "fp32": ["src/cpu/kernels/elementwise_unary/generic/neon/fp32.cpp"],
Viet-Hoa Dofd472f02023-03-15 14:05:06 +00001450 "fp16": ["src/cpu/kernels/elementwise_unary/generic/neon/fp16.cpp"],
Ramy Elgammal8b7f42a2023-03-31 16:16:15 +01001451 "qasymm8": [
1452 "src/cpu/kernels/elementwise_unary/generic/neon/q8.cpp",
1453 "src/cpu/kernels/elementwise_unary/generic/neon/qasymm8.cpp"
1454 ],
1455 "qasymm8_signed": [
1456 "src/cpu/kernels/elementwise_unary/generic/neon/q8.cpp",
1457 "src/cpu/kernels/elementwise_unary/generic/neon/qasymm8_signed.cpp"
1458 ]
Dana Zlotnikd5c496d2021-11-28 14:46:12 +02001459 },
Michalis Spyrou20fca522021-06-07 14:23:57 +01001460 "sve": {
Dana Zlotnikd5c496d2021-11-28 14:46:12 +02001461 "common": ["src/cpu/kernels/elementwise_unary/generic/sve/impl.cpp" ],
1462 "integer": ["src/cpu/kernels/elementwise_unary/generic/sve/integer.cpp"],
1463 "fp32": ["src/cpu/kernels/elementwise_unary/generic/sve/fp32.cpp"],
SiCong Lic0463a22023-05-17 13:46:13 +01001464 "fp16": ["src/cpu/kernels/elementwise_unary/generic/sve/fp16.cpp"]
1465 },
1466 "sve2": {
1467 "qasymm8": ["src/cpu/kernels/elementwise_unary/generic/sve2/q8.cpp"],
1468 "qasymm8_signed": ["src/cpu/kernels/elementwise_unary/generic/sve2/q8.cpp"]
Michalis Spyrou20fca522021-06-07 14:23:57 +01001469 }
1470 }
1471 },
1472 "FFT1D": {
Freddie Liardet487d3902021-09-21 12:36:43 +01001473 "deps": [ "Reduction" ],
Michalis Spyrou20fca522021-06-07 14:23:57 +01001474 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001475 "common": [
Michalis Spyrou20fca522021-06-07 14:23:57 +01001476 "src/core/NEON/kernels/NEFFTDigitReverseKernel.cpp",
1477 "src/core/NEON/kernels/NEFFTRadixStageKernel.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001478 "src/core/NEON/kernels/NEFFTScaleKernel.cpp",
1479 "src/runtime/NEON/functions/NEFFT1D.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001480 ]
1481 }
1482 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001483 "FFT2D": {
1484 "deps": [ "FFT1D" ],
Michalis Spyrou20fca522021-06-07 14:23:57 +01001485 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001486 "common": [
1487 "src/runtime/NEON/functions/NEFFT2D.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001488 ]
1489 }
1490 },
1491 "Fill": {
1492 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001493 "common": [
1494 "src/cpu/operators/CpuFill.cpp",
1495 "src/cpu/kernels/CpuFillKernel.cpp",
1496 "src/runtime/NEON/functions/NEFill.cpp"
1497 ]
1498 }
1499 },
1500 "Flatten": {
1501 "deps": [ "Reshape" ],
1502 "files": {
1503 "common": [
1504 "src/cpu/operators/CpuFlatten.cpp",
1505 "src/runtime/NEON/functions/NEFlattenLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001506 ]
1507 }
1508 },
1509 "Floor": {
1510 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001511 "common": [
1512 "src/cpu/operators/CpuFloor.cpp",
1513 "src/cpu/kernels/CpuFloorKernel.cpp",
1514 "src/runtime/NEON/functions/NEFloor.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001515 ],
1516 "neon": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001517 "fp32": [ "src/cpu/kernels/floor/neon/fp32.cpp" ],
1518 "fp16": [ "src/cpu/kernels/floor/neon/fp16.cpp" ]
Michalis Spyrou20fca522021-06-07 14:23:57 +01001519 }
1520 }
1521 },
Michele Di Giorgiod9cdf142021-07-02 15:17:08 +01001522 "FullyConnected": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001523 "deps": [ "Flatten", "Gemm", "Transpose"],
Michele Di Giorgiod9cdf142021-07-02 15:17:08 +01001524 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001525 "common": [
1526 "src/cpu/kernels/CpuConvertFullyConnectedWeightsKernel.cpp",
1527 "src/cpu/operators/CpuConvertFullyConnectedWeights.cpp",
1528 "src/cpu/operators/CpuFullyConnected.cpp",
1529 "src/runtime/NEON/functions/NEConvertFullyConnectedWeights.cpp",
1530 "src/runtime/NEON/functions/NEFullyConnectedLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001531 ]
1532 }
1533 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001534 "Gather": {
Michalis Spyrou20fca522021-06-07 14:23:57 +01001535 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001536 "common": [
1537 "src/core/NEON/kernels/NEGatherKernel.cpp",
1538 "src/runtime/NEON/functions/NEGather.cpp"
1539 ]
1540 }
1541 },
1542 "Gemm": {
Freddie Liardet487d3902021-09-21 12:36:43 +01001543 "deps": [ "Quantize", "Add"],
Francesco.Petrogalli@arm.com5fcf22d2022-04-05 10:31:08 +00001544 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001545 "common": [
1546 "src/cpu/kernels/CpuConvertQuantizedSignednessKernel.cpp",
Georgios Pinitas7891a732021-08-20 21:39:25 +01001547 "src/cpu/kernels/CpuGemmMatrixAdditionKernel.cpp",
1548 "src/cpu/kernels/CpuGemmMatrixMultiplyKernel.cpp",
1549 "src/cpu/kernels/CpuGemmTranspose1xWKernel.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001550 "src/cpu/kernels/CpuGemmInterleave4x4Kernel.cpp",
Georgios Pinitas7891a732021-08-20 21:39:25 +01001551 "src/cpu/kernels/CpuGemmLowpQuantizeDownInt32ScaleKernel.cpp",
1552 "src/cpu/kernels/CpuGemmLowpQuantizeDownInt32ToInt16ScaleByFixedPointKernel.cpp",
1553 "src/cpu/kernels/CpuGemmLowpQuantizeDownInt32ToInt8ScaleByFixedPointKernel.cpp",
1554 "src/cpu/kernels/CpuGemmLowpQuantizeDownInt32ToUint8ScaleByFixedPointKernel.cpp",
1555 "src/cpu/kernels/CpuGemmLowpMatrixMultiplyKernel.cpp",
1556 "src/cpu/kernels/CpuGemmLowpMatrixReductionKernel.cpp",
1557 "src/cpu/kernels/CpuGemmLowpOffsetContributionOutputStageKernel.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001558 "src/cpu/kernels/CpuGemmLowpOffsetContributionKernel.cpp",
1559 "src/cpu/operators/CpuGemm.cpp",
1560 "src/cpu/operators/CpuGemmLowpOutputStage.cpp",
1561 "src/cpu/operators/CpuGemmLowpMatrixMultiplyCore.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001562 "src/runtime/NEON/functions/NEGEMM.cpp",
1563 "src/runtime/NEON/functions/NEGEMMLowpMatrixMultiplyCore.cpp",
Motti Gondabi9d9ad332022-01-23 12:42:24 +02001564 "src/runtime/NEON/functions/NEGEMMLowpOutputStage.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001565 ],
1566 "neon": {
Motti Gondabi9d9ad332022-01-23 12:42:24 +02001567 "common": [
1568 "src/core/NEON/kernels/arm_gemm/gemm_bf16.cpp",
1569 "src/core/NEON/kernels/arm_gemm/gemm_fp16.cpp",
1570 "src/core/NEON/kernels/arm_gemm/gemm_fp32.cpp",
1571 "src/core/NEON/kernels/arm_gemm/gemm_int16.cpp",
1572 "src/core/NEON/kernels/arm_gemm/gemm_int8.cpp",
1573 "src/core/NEON/kernels/arm_gemm/gemm_qint8.cpp",
1574 "src/core/NEON/kernels/arm_gemm/gemm_quint8.cpp",
1575 "src/core/NEON/kernels/arm_gemm/gemm_uint16.cpp",
1576 "src/core/NEON/kernels/arm_gemm/gemm_uint8.cpp",
1577 "src/core/NEON/kernels/arm_gemm/interleave_indirect.cpp",
1578 "src/core/NEON/kernels/arm_gemm/mergeresults-fp16.cpp",
1579 "src/core/NEON/kernels/arm_gemm/mergeresults.cpp",
1580 "src/core/NEON/kernels/arm_gemm/misc.cpp",
1581 "src/core/NEON/kernels/arm_gemm/quantized.cpp",
1582 "src/core/NEON/kernels/arm_gemm/rowsum_indirect_s8.cpp",
1583 "src/core/NEON/kernels/arm_gemm/rowsum_indirect_u8.cpp",
1584 "src/core/NEON/kernels/arm_gemm/transform.cpp",
1585 "src/core/NEON/kernels/arm_gemm/kernels/a64_gemm_s16_8x12/generic.cpp",
1586 "src/core/NEON/kernels/arm_gemm/kernels/a64_gemm_s8_4x4/generic.cpp",
1587 "src/core/NEON/kernels/arm_gemm/kernels/a64_gemm_s8_8x12/a55r1.cpp",
1588 "src/core/NEON/kernels/arm_gemm/kernels/a64_gemm_s8_8x12/generic.cpp",
1589 "src/core/NEON/kernels/arm_gemm/kernels/a64_gemm_s8_8x12/x1.cpp",
1590 "src/core/NEON/kernels/arm_gemm/kernels/a64_gemm_u16_8x12/generic.cpp",
1591 "src/core/NEON/kernels/arm_gemm/kernels/a64_gemm_u8_4x4/generic.cpp",
1592 "src/core/NEON/kernels/arm_gemm/kernels/a64_gemm_u8_8x12/a55r1.cpp",
1593 "src/core/NEON/kernels/arm_gemm/kernels/a64_gemm_u8_8x12/generic.cpp",
1594 "src/core/NEON/kernels/arm_gemm/kernels/a64_gemm_u8_8x12/x1.cpp",
1595 "src/core/NEON/kernels/arm_gemm/kernels/a64_hgemm_8x24/a55r1.cpp",
1596 "src/core/NEON/kernels/arm_gemm/kernels/a64_hgemm_8x24/generic.cpp",
1597 "src/core/NEON/kernels/arm_gemm/kernels/a64_hgemm_8x24/x1.cpp",
1598 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_bf16fp32_dot_6x16/generic.cpp",
1599 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_bf16fp32_mmla_6x16/generic.cpp",
1600 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_fp16_mla_6x32/a55.cpp",
1601 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_fp16_mla_6x32/generic.cpp",
1602 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_fp32_mla_4x24/a55.cpp",
1603 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_fp32_mla_4x24/generic.cpp",
1604 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_fp32_mla_6x16/a55.cpp",
1605 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_fp32_mla_6x16/generic.cpp",
1606 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_fp32_mla_8x4/a55.cpp",
1607 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_fp32_mla_8x4/generic.cpp",
1608 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_fp32bf16fp32_mmla_4x24/generic.cpp",
1609 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_fp32bf16fp32_mmla_6x16/generic.cpp",
1610 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_s8qa_dot_4x16/a55.cpp",
1611 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_s8qa_dot_4x16/generic.cpp",
1612 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_s8qa_mmla_4x16/generic.cpp",
1613 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_s8qs_dot_6x16/a55.cpp",
1614 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_s8qs_dot_6x16/generic.cpp",
1615 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_s8qs_mmla_6x16/generic.cpp",
1616 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_s8s32_dot_6x16/a55.cpp",
1617 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_s8s32_dot_6x16/generic.cpp",
1618 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_s8s32_mmla_6x16/generic.cpp",
1619 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_u8qa_dot_4x16/a55.cpp",
1620 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_u8qa_dot_4x16/generic.cpp",
1621 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_u8qa_mmla_4x16/generic.cpp",
1622 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_u8u32_dot_6x16/a55.cpp",
1623 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_u8u32_dot_6x16/generic.cpp",
1624 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_u8u32_mmla_6x16/generic.cpp",
1625 "src/core/NEON/kernels/arm_gemm/kernels/a64_interleaved_bf16fp32_dot_8x12/generic.cpp",
1626 "src/core/NEON/kernels/arm_gemm/kernels/a64_interleaved_bf16fp32_dot_8x12/x1.cpp",
1627 "src/core/NEON/kernels/arm_gemm/kernels/a64_interleaved_bf16fp32_mmla_8x12/generic.cpp",
1628 "src/core/NEON/kernels/arm_gemm/kernels/a64_interleaved_bf16fp32_mmla_8x12/a510.cpp",
1629 "src/core/NEON/kernels/arm_gemm/kernels/a64_interleaved_s8s32_mmla_8x12/generic.cpp",
1630 "src/core/NEON/kernels/arm_gemm/kernels/a64_interleaved_s8s32_mmla_8x12/a510.cpp",
1631 "src/core/NEON/kernels/arm_gemm/kernels/a64_interleaved_u8u32_mmla_8x12/generic.cpp",
1632 "src/core/NEON/kernels/arm_gemm/kernels/a64_interleaved_u8u32_mmla_8x12/a510.cpp",
1633 "src/core/NEON/kernels/arm_gemm/kernels/a64_sgemm_8x12/a53.cpp",
1634 "src/core/NEON/kernels/arm_gemm/kernels/a64_sgemm_8x12/a55.cpp",
1635 "src/core/NEON/kernels/arm_gemm/kernels/a64_sgemm_8x12/a55r1.cpp",
1636 "src/core/NEON/kernels/arm_gemm/kernels/a64_sgemm_8x12/generic.cpp",
1637 "src/core/NEON/kernels/arm_gemm/kernels/a64_sgemm_8x12/x1.cpp",
1638 "src/core/NEON/kernels/arm_gemm/kernels/a64_sgemm_8x6/generic.cpp",
1639 "src/core/NEON/kernels/arm_gemm/kernels/a64_smallK_hybrid_fp32_mla_6x4/generic.cpp",
1640 "src/core/NEON/kernels/arm_gemm/kernels/a64_smallK_hybrid_fp32_mla_8x4/generic.cpp",
1641 "src/core/NEON/kernels/arm_gemm/kernels/a64_smallK_hybrid_s8s32_dot_6x4/a55.cpp",
1642 "src/core/NEON/kernels/arm_gemm/kernels/a64_smallK_hybrid_s8s32_dot_6x4/generic.cpp",
1643 "src/core/NEON/kernels/arm_gemm/kernels/a64_smallK_hybrid_s8s32_dot_8x4/a55.cpp",
1644 "src/core/NEON/kernels/arm_gemm/kernels/a64_smallK_hybrid_s8s32_dot_8x4/generic.cpp",
1645 "src/core/NEON/kernels/arm_gemm/kernels/a64_smallK_hybrid_u8u32_dot_6x4/a55.cpp",
1646 "src/core/NEON/kernels/arm_gemm/kernels/a64_smallK_hybrid_u8u32_dot_6x4/generic.cpp",
1647 "src/core/NEON/kernels/arm_gemm/kernels/a64_smallK_hybrid_u8u32_dot_8x4/a55.cpp",
ramelg01a1f78512022-06-29 16:28:10 +01001648 "src/core/NEON/kernels/arm_gemm/kernels/a64_smallK_hybrid_u8u32_dot_8x4/generic.cpp",
Dana Zlotnik256ac622022-02-02 15:06:11 +02001649 "src/cpu/kernels/gemm_matrix_mul/generic/neon/impl.cpp",
1650 "src/cpu/kernels/gemm_matrix_add/generic/neon/impl.cpp"
Motti Gondabi9d9ad332022-01-23 12:42:24 +02001651 ],
Dana Zlotnik256ac622022-02-02 15:06:11 +02001652 "fp32":["src/cpu/kernels/gemm_matrix_mul/generic/neon/fp32.cpp",
1653 "src/cpu/kernels/gemm_matrix_add/generic/neon/fp32.cpp"],
1654 "fp16":["src/cpu/kernels/gemm_matrix_mul/generic/neon/fp16.cpp",
1655 "src/cpu/kernels/gemm_matrix_add/generic/neon/fp16.cpp"],
Michalis Spyrou20fca522021-06-07 14:23:57 +01001656 "estate32": [
1657 "src/core/NEON/kernels/arm_gemm/kernels/a32_sgemm_8x6/a53.cpp",
1658 "src/core/NEON/kernels/arm_gemm/kernels/a32_sgemm_8x6/a55r1.cpp",
1659 "src/core/NEON/kernels/arm_gemm/kernels/a32_sgemm_8x6/generic.cpp"
1660 ],
1661 "estate64": [
Freddie Liardet487d3902021-09-21 12:36:43 +01001662 "src/core/NEON/kernels/arm_gemm/kernels/a64_sgemv_pretransposed/generic.cpp"
Francesco.Petrogalli@arm.com5fcf22d2022-04-05 10:31:08 +00001663 ],
Nathan John Sircombed7113e42023-04-26 15:02:43 +01001664 "fixed_format_kernels": [
Francesco.Petrogalli@arm.com5fcf22d2022-04-05 10:31:08 +00001665 "src/core/NEON/kernels/arm_gemm/kernels/a64_ffhybrid_bf16fp32_mmla_6x16/generic.cpp",
1666 "src/core/NEON/kernels/arm_gemm/kernels/a64_ffhybrid_fp16_mla_6x32/generic.cpp",
1667 "src/core/NEON/kernels/arm_gemm/kernels/a64_ffhybrid_fp32_mla_6x16/generic.cpp",
1668 "src/core/NEON/kernels/arm_gemm/kernels/a64_ffhybrid_fp32bf16fp32_mmla_4x24/generic.cpp",
1669 "src/core/NEON/kernels/arm_gemm/kernels/a64_ffinterleaved_bf16fp32_dot_8x12/generic.cpp",
1670 "src/core/NEON/kernels/arm_gemm/kernels/a64_ffinterleaved_bf16fp32_mmla_8x12/generic.cpp",
1671 "src/core/NEON/kernels/arm_gemm/kernels/a64_ffinterleaved_fp16_mla_8x24/generic.cpp",
1672 "src/core/NEON/kernels/arm_gemm/kernels/a64_ffinterleaved_fp32_mla_8x12/generic.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001673 ]
1674 },
1675 "sve": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001676 "common": [
Viet-Hoa Do03b29712022-06-01 11:47:14 +01001677 "src/core/NEON/kernels/arm_gemm/interleave_indirect-sve.cpp",
1678 "src/core/NEON/kernels/arm_gemm/kernels/sme2_gemv_bf16fp32_dot_16VL/generic.cpp",
1679 "src/core/NEON/kernels/arm_gemm/kernels/sme2_gemv_fp32_mla_16VL/generic.cpp",
1680 "src/core/NEON/kernels/arm_gemm/kernels/sme2_gemv_fp32bf16fp32_dot_16VL/generic.cpp",
1681 "src/core/NEON/kernels/arm_gemm/kernels/sme2_gemv_s8qa_dot_16VL/generic.cpp",
1682 "src/core/NEON/kernels/arm_gemm/kernels/sme2_gemv_u8qa_dot_16VL/generic.cpp",
1683 "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_bf16fp32_mopa_1VLx4VL/generic.cpp",
1684 "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_bf16fp32_mopa_2VLx2VL/generic.cpp",
1685 "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_bf16fp32_mopa_4VLx1VL/generic.cpp",
David Mansellaaa9da12023-03-10 13:48:50 +00001686 "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_fp16fp32fp16_mopa_1VLx4VL/generic.cpp",
1687 "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_fp16fp32fp16_mopa_2VLx2VL/generic.cpp",
1688 "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_fp16fp32fp16_mopa_4VLx1VL/generic.cpp",
Viet-Hoa Do03b29712022-06-01 11:47:14 +01001689 "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_fp32_mopa_1VLx4VL/generic.cpp",
1690 "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_fp32_mopa_2VLx2VL/generic.cpp",
1691 "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_fp32_mopa_4VLx1VL/generic.cpp",
1692 "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_s8q_mopa_1VLx4VL/generic.cpp",
1693 "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_s8q_mopa_2VLx2VL/generic.cpp",
1694 "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_s8q_mopa_4VLx1VL/generic.cpp",
1695 "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_s8s32_mopa_1VLx4VL/generic.cpp",
1696 "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_s8s32_mopa_2VLx2VL/generic.cpp",
1697 "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_s8s32_mopa_4VLx1VL/generic.cpp",
1698 "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_u8q_mopa_1VLx4VL/generic.cpp",
1699 "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_u8q_mopa_2VLx2VL/generic.cpp",
1700 "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_u8q_mopa_4VLx1VL/generic.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +01001701 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_bf16fp32_dot_6x4VL/generic.cpp",
Georgios Pinitas4ee8b152021-07-16 16:16:43 +01001702 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_bf16fp32_mmla_6x4VL/generic.cpp",
1703 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_fp16_mla_6x4VL/a64fx.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +01001704 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_fp16_mla_6x4VL/generic.cpp",
Georgios Pinitas4ee8b152021-07-16 16:16:43 +01001705 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_fp32_mla_6x4VL/a64fx.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +01001706 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_fp32_mla_6x4VL/generic.cpp",
Georgios Pinitas4ee8b152021-07-16 16:16:43 +01001707 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_fp32_mla_8x1VL/a64fx.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +01001708 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_fp32_mla_8x1VL/generic.cpp",
Georgios Pinitas4ee8b152021-07-16 16:16:43 +01001709 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_fp32bf16fp32_mmla_4x6VL/generic.cpp",
1710 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_fp32bf16fp32_mmla_6x4VL/generic.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +01001711 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_s8qa_dot_4x4VL/generic.cpp",
Georgios Pinitas4ee8b152021-07-16 16:16:43 +01001712 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_s8qa_mmla_4x4VL/generic.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +01001713 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_s8qs_dot_6x4VL/generic.cpp",
Georgios Pinitas4ee8b152021-07-16 16:16:43 +01001714 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_s8qs_mmla_6x4VL/generic.cpp",
1715 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_s8s32_dot_6x4VL/a64fx.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +01001716 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_s8s32_dot_6x4VL/generic.cpp",
Georgios Pinitas4ee8b152021-07-16 16:16:43 +01001717 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_s8s32_mmla_6x4VL/generic.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +01001718 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_u8qa_dot_4x4VL/generic.cpp",
Georgios Pinitas4ee8b152021-07-16 16:16:43 +01001719 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_u8qa_mmla_4x4VL/generic.cpp",
1720 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_u8u32_dot_6x4VL/a64fx.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +01001721 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_u8u32_dot_6x4VL/generic.cpp",
Georgios Pinitas4ee8b152021-07-16 16:16:43 +01001722 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_u8u32_mmla_6x4VL/generic.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +01001723 "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_bf16fp32_dot_8x3VL/generic.cpp",
1724 "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_bf16fp32_mmla_8x3VL/generic.cpp",
Georgios Pinitas4ee8b152021-07-16 16:16:43 +01001725 "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_fp16_mla_8x3VL/a64fx.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +01001726 "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_fp16_mla_8x3VL/generic.cpp",
Georgios Pinitas4ee8b152021-07-16 16:16:43 +01001727 "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_fp32_mla_8x3VL/a64fx.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +01001728 "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_fp32_mla_8x3VL/generic.cpp",
1729 "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_fp32_mmla_8x3VL/generic.cpp",
Georgios Pinitas4ee8b152021-07-16 16:16:43 +01001730 "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_s8s32_dot_8x3VL/a64fx.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +01001731 "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_s8s32_dot_8x3VL/generic.cpp",
1732 "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_s8s32_mmla_8x3VL/generic.cpp",
Georgios Pinitas4ee8b152021-07-16 16:16:43 +01001733 "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_u8u32_dot_8x3VL/a64fx.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +01001734 "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_u8u32_dot_8x3VL/generic.cpp",
1735 "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_u8u32_mmla_8x3VL/generic.cpp",
Georgios Pinitas4ee8b152021-07-16 16:16:43 +01001736 "src/core/NEON/kernels/arm_gemm/mergeresults-sve.cpp",
Viet-Hoa Do03b29712022-06-01 11:47:14 +01001737 "src/core/NEON/kernels/arm_gemm/transform-sve.cpp",
1738 "src/core/NEON/kernels/arm_gemm/misc-sve.cpp"
Francesco.Petrogalli@arm.com5fcf22d2022-04-05 10:31:08 +00001739 ],
Nathan John Sircombed7113e42023-04-26 15:02:43 +01001740 "fixed_format_kernels": [
Francesco.Petrogalli@arm.com5fcf22d2022-04-05 10:31:08 +00001741 "src/core/NEON/kernels/arm_gemm/kernels/sve_ffhybrid_bf16fp32_mmla_6x4VL/generic.cpp",
1742 "src/core/NEON/kernels/arm_gemm/kernels/sve_ffhybrid_fp16_mla_6x4VL/a64fx.cpp",
1743 "src/core/NEON/kernels/arm_gemm/kernels/sve_ffhybrid_fp16_mla_6x4VL/generic.cpp",
1744 "src/core/NEON/kernels/arm_gemm/kernels/sve_ffhybrid_fp32_mla_6x4VL/a64fx.cpp",
1745 "src/core/NEON/kernels/arm_gemm/kernels/sve_ffhybrid_fp32_mla_6x4VL/generic.cpp",
1746 "src/core/NEON/kernels/arm_gemm/kernels/sve_ffhybrid_fp32bf16fp32_mmla_4x6VL/generic.cpp",
1747 "src/core/NEON/kernels/arm_gemm/kernels/sve_ffinterleaved_bf16fp32_mmla_8x3VL/generic.cpp",
1748 "src/core/NEON/kernels/arm_gemm/kernels/sve_ffinterleaved_fp16_mla_8x3VL/a64fx.cpp",
1749 "src/core/NEON/kernels/arm_gemm/kernels/sve_ffinterleaved_fp16_mla_8x3VL/generic.cpp",
1750 "src/core/NEON/kernels/arm_gemm/kernels/sve_ffinterleaved_fp32_mla_8x3VL/a64fx.cpp",
1751 "src/core/NEON/kernels/arm_gemm/kernels/sve_ffinterleaved_fp32_mla_8x3VL/generic.cpp"
1752 ]
Michalis Spyrou20fca522021-06-07 14:23:57 +01001753 }
1754 }
1755 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001756 "GenerateProposals": {
1757 "deps": [ "BoundingBoxTransform", "Dequantize", "Pad", "Permute", "Quantize", "Reshape" ],
Michalis Spyrou20fca522021-06-07 14:23:57 +01001758 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001759 "common": [
1760 "src/core/NEON/kernels/NEGenerateProposalsLayerKernel.cpp",
1761 "src/runtime/NEON/functions/NEGenerateProposalsLayer.cpp"
Dana Zlotnik50ce2772021-12-29 13:55:56 +02001762 ],
1763 "neon":{
1764 "common":["src/cpu/kernels/genproposals/generic/neon/impl.cpp"],
1765 "fp16":["src/cpu/kernels/genproposals/generic/neon/fp16.cpp"],
1766 "fp32":["src/cpu/kernels/genproposals/generic/neon/fp32.cpp"],
1767 "qsymm16":["src/cpu/kernels/genproposals/generic/neon/qsymm16.cpp"]
1768 }
Michalis Spyrou20fca522021-06-07 14:23:57 +01001769 }
1770 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001771 "InstanceNormalize": {
1772 "deps": [ "Permute", "Reduction" ],
Michalis Spyrou20fca522021-06-07 14:23:57 +01001773 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001774 "common": [
1775 "src/core/NEON/kernels/NEInstanceNormalizationLayerKernel.cpp",
1776 "src/runtime/NEON/functions/NEInstanceNormalizationLayer.cpp"
ramelg01a1f78512022-06-29 16:28:10 +01001777 ],
Dana Zlotnikd7e2ec52022-01-03 10:59:41 +02001778 "neon":{
1779 "common":["src/cpu/kernels/instancenorm/generic/neon/impl.cpp"],
1780 "fp16":["src/cpu/kernels/instancenorm/generic/neon/fp16.cpp"],
1781 "fp32":["src/cpu/kernels/instancenorm/generic/neon/fp32.cpp"]
1782 }
Michalis Spyrou20fca522021-06-07 14:23:57 +01001783 }
1784 },
1785 "L2Normalize": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001786 "deps": [ "Reduction" ],
Michalis Spyrou20fca522021-06-07 14:23:57 +01001787 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001788 "common": [
1789 "src/core/NEON/kernels/NEL2NormalizeLayerKernel.cpp",
1790 "src/runtime/NEON/functions/NEL2NormalizeLayer.cpp"
Yair Schwarzbaum5e993182022-01-10 15:11:07 +02001791 ],
1792 "neon":{
1793 "common":["src/cpu/kernels/l2normlayer/generic/neon/impl.cpp"],
1794 "fp32":["src/cpu/kernels/l2normlayer/generic/neon/fp32.cpp"],
1795 "fp16":["src/cpu/kernels/l2normlayer/generic/neon/fp16.cpp"]
1796 }
Michalis Spyrou20fca522021-06-07 14:23:57 +01001797 }
1798 },
1799 "Logical": {
1800 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001801 "common": [
1802 "src/core/NEON/kernels/NELogicalKernel.cpp",
1803 "src/runtime/NEON/functions/NELogical.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001804 ]
1805 }
1806 },
Viet-Hoa Dofd472f02023-03-15 14:05:06 +00001807 "LUT": {
1808 "files": {
1809 "common": [],
1810 "neon":{
1811 "qasymm8": ["src/cpu/kernels/lut/generic/neon/u8.cpp"],
1812 "qasymm8_signed": ["src/cpu/kernels/lut/generic/neon/u8.cpp"]
1813 },
SiCong Lic0463a22023-05-17 13:46:13 +01001814 "sve2": {
1815 "qasymm8": ["src/cpu/kernels/lut/generic/sve2/u8.cpp"],
1816 "qasymm8_signed": ["src/cpu/kernels/lut/generic/sve2/u8.cpp"]
Viet-Hoa Dofd472f02023-03-15 14:05:06 +00001817 }
1818 }
1819 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001820 "LSTM": {
Michalis Spyrou20fca522021-06-07 14:23:57 +01001821 "deps": [
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001822 "Activation",
1823 "Concatenate",
1824 "Copy",
1825 "Dequantize",
1826 "ElementwiseBinary",
1827 "Fill",
1828 "FullyConnected",
1829 "Gemm",
1830 "MeanStdDevNormalize",
1831 "Mul",
1832 "Quantize",
1833 "Slice",
1834 "Transpose"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001835 ],
1836 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001837 "common": [
1838 "src/core/NEON/kernels/NEQLSTMLayerNormalizationKernel.cpp",
1839 "src/runtime/NEON/functions/NELSTMLayer.cpp",
1840 "src/runtime/NEON/functions/NELSTMLayerQuantized.cpp",
1841 "src/runtime/NEON/functions/NEQLSTMLayer.cpp"
1842 ]
1843 }
1844 },
1845 "MaxUnpool2d": {
1846 "deps": [ "Fill" ],
1847 "files": {
1848 "common": [
Dana Zlotnik149203b2022-01-26 12:38:03 +02001849 "src/cpu/kernels/CpuMaxUnpoolingLayerKernel.cpp",
ramelg01a1f78512022-06-29 16:28:10 +01001850 "src/runtime/NEON/functions/NEMaxUnpoolingLayer.cpp",
Dana Zlotnik149203b2022-01-26 12:38:03 +02001851 "src/cpu/operators/CpuMaxUnpooling.cpp"
Dana Zlotnik143310c2021-12-30 13:24:52 +02001852 ],
1853 "neon":{
Dana Zlotnik143310c2021-12-30 13:24:52 +02001854 "fp32":["src/cpu/kernels/maxunpool/generic/neon/fp32.cpp"],
1855 "fp16":["src/cpu/kernels/maxunpool/generic/neon/fp16.cpp"],
1856 "qasymm8":["src/cpu/kernels/maxunpool/generic/neon/qasymm8.cpp"],
Dana Zlotnik149203b2022-01-26 12:38:03 +02001857 "qasymm8_signed":[ "src/cpu/kernels/maxunpool/generic/neon/qasymm8_signed.cpp"],
1858 "common":["src/cpu/kernels/maxunpool/generic/neon/impl.cpp"]
Dana Zlotnik143310c2021-12-30 13:24:52 +02001859 }
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001860 }
1861 },
1862 "Mean": {
1863 "deps" : [ "Reduction" ],
1864 "files": {
1865 "common": [ "src/runtime/NEON/functions/NEReduceMean.cpp" ]
1866 }
1867 },
1868 "MeanStdDevNormalize": {
1869 "files": {
1870 "common": [
1871 "src/core/NEON/kernels/NEMeanStdDevNormalizationKernel.cpp",
1872 "src/runtime/NEON/functions/NEMeanStdDevNormalizationLayer.cpp"
Dana Zlotnik027bcef2021-12-27 17:35:00 +02001873 ],
1874 "neon":{
1875 "common":["src/cpu/kernels/meanstddevnorm/generic/neon/impl.cpp"],
1876 "fp32":["src/cpu/kernels/meanstddevnorm/generic/neon/fp32.cpp"],
Murray Kornelsen6e09e142022-07-13 21:40:26 -04001877 "fp16":["src/cpu/kernels/meanstddevnorm/generic/neon/fp16.cpp"],
1878 "qasymm8":["src/cpu/kernels/meanstddevnorm/generic/neon/qasymm8.cpp"]
Dana Zlotnik027bcef2021-12-27 17:35:00 +02001879 }
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001880 }
1881 },
Mohammed Suhail Munshia1b1e412023-03-23 22:21:31 +00001882 "MatMul" : {
Viet-Hoa Do99b6fd22023-04-27 17:06:10 +01001883 "deps": [ "Transpose" ],
Mohammed Suhail Munshia1b1e412023-03-23 22:21:31 +00001884 "files": {
1885 "common": [
1886 "src/cpu/operators/CpuMatMul.cpp",
1887 "src/runtime/NEON/functions/NEMatMul.cpp"
1888 ]
1889 }
1890 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001891 "Mul": {
1892 "files": {
1893 "common": [
1894 "src/cpu/operators/CpuMul.cpp",
1895 "src/cpu/kernels/CpuMulKernel.cpp",
1896 "src/runtime/NEON/functions/NEPixelWiseMultiplication.cpp"
1897 ]
1898 }
1899 },
1900 "Normalize": {
1901 "deps": [ "Mul" ],
1902 "files": {
1903 "common": [
1904 "src/core/NEON/kernels/NENormalizationLayerKernel.cpp",
1905 "src/runtime/NEON/functions/NENormalizationLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001906 ]
1907 }
1908 },
1909 "Pad": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001910 "deps": [ "Concatenate", "Copy", "StridedSlice" ],
Michalis Spyrou20fca522021-06-07 14:23:57 +01001911 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001912 "common": [
1913 "src/core/NEON/kernels/NEPadLayerKernel.cpp",
1914 "src/runtime/NEON/functions/NEPadLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001915 ]
1916 }
1917 },
1918 "Permute": {
1919 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001920 "common": [
1921 "src/cpu/operators/CpuPermute.cpp",
1922 "src/cpu/kernels/CpuPermuteKernel.cpp",
1923 "src/runtime/NEON/functions/NEPermute.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001924 ]
1925 }
1926 },
1927 "Pool2d": {
1928 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001929 "common": [
1930 "src/cpu/operators/CpuPool2d.cpp",
Georgios Pinitas7891a732021-08-20 21:39:25 +01001931 "src/cpu/kernels/CpuPool2dKernel.cpp",
1932 "src/cpu/kernels/internal/CpuPool2dAssemblyWrapperKernel.cpp",
Motti Gondabi9d9ad332022-01-23 12:42:24 +02001933 "src/runtime/NEON/functions/NEPoolingLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001934 ],
1935 "neon": {
Motti Gondabi9d9ad332022-01-23 12:42:24 +02001936 "common": [
1937 "src/core/NEON/kernels/arm_conv/pooling/kernels/cpp_nhwc_1x1_stride_any_depthfirst/generic.cpp",
1938 "src/core/NEON/kernels/arm_conv/pooling/pooling_fp16.cpp",
1939 "src/core/NEON/kernels/arm_conv/pooling/pooling_fp32.cpp",
1940 "src/core/NEON/kernels/arm_conv/pooling/pooling_s8.cpp",
1941 "src/core/NEON/kernels/arm_conv/pooling/pooling_s8q.cpp",
1942 "src/core/NEON/kernels/arm_conv/pooling/pooling_u8.cpp",
1943 "src/core/NEON/kernels/arm_conv/pooling/pooling_u8q.cpp",
1944 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_fp16_nhwc_avg_3x3_s1_output2x2_depthfirst/generic.cpp",
1945 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_fp16_nhwc_avg_generic_depthfirst/generic.cpp",
1946 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_fp16_nhwc_max_2x2_s1_output2x2_depthfirst/generic.cpp",
1947 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_fp16_nhwc_max_generic_depthfirst/generic.cpp",
1948 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_fp32_nhwc_avg_3x3_s1_output2x2_depthfirst/generic.cpp",
1949 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_fp32_nhwc_avg_generic_depthfirst/generic.cpp",
1950 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_fp32_nhwc_max_2x2_s1_output2x2_depthfirst/generic.cpp",
1951 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_fp32_nhwc_max_generic_depthfirst/generic.cpp",
1952 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_s8_nhwc_avg_generic_depthfirst/generic.cpp",
1953 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_s8_nhwc_max_2x2_s1_output2x2_depthfirst/generic.cpp",
1954 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_s8_nhwc_max_generic_depthfirst/generic.cpp",
1955 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_s8q_nhwc_avg_generic_depthfirst/generic.cpp",
1956 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_s8q_nhwc_max_generic_depthfirst/generic.cpp",
1957 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_u8_nhwc_avg_generic_depthfirst/generic.cpp",
1958 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_u8_nhwc_max_2x2_s1_output2x2_depthfirst/generic.cpp",
1959 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_u8_nhwc_max_generic_depthfirst/generic.cpp",
1960 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_u8q_nhwc_avg_generic_depthfirst/generic.cpp",
ramelg01a1f78512022-06-29 16:28:10 +01001961 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_u8q_nhwc_max_generic_depthfirst/generic.cpp"
Motti Gondabi9d9ad332022-01-23 12:42:24 +02001962 ],
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001963 "nchw": [ "src/cpu/kernels/pool2d/neon/nchw/all.cpp" ],
1964 "fp16": [ "src/cpu/kernels/pool2d/neon/fp16.cpp" ],
ramelg01a1f78512022-06-29 16:28:10 +01001965 "fp32": [ "src/cpu/kernels/pool2d/neon/fp32.cpp" ],
1966 "qasymm8":[ "src/cpu/kernels/pool2d/neon/qasymm8.cpp" ],
Dana Zlotnika538ae52022-02-21 13:12:41 +02001967 "qasymm8_signed":["src/cpu/kernels/pool2d/neon/qasymm8_signed.cpp"]
Michalis Spyrou20fca522021-06-07 14:23:57 +01001968 },
1969 "sve": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001970 "common": [
Michalis Spyrou20fca522021-06-07 14:23:57 +01001971 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_fp16_nhwc_avg_3x3_s1_output2x2_depthfirst/generic.cpp",
1972 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_fp16_nhwc_avg_generic_depthfirst/generic.cpp",
1973 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_fp16_nhwc_max_2x2_s1_output2x2_depthfirst/generic.cpp",
1974 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_fp16_nhwc_max_generic_depthfirst/generic.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001975 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_fp32_nhwc_avg_3x3_s1_output2x2_depthfirst/generic.cpp",
1976 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_fp32_nhwc_avg_generic_depthfirst/generic.cpp",
1977 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_fp32_nhwc_max_2x2_s1_output2x2_depthfirst/generic.cpp",
1978 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_fp32_nhwc_max_generic_depthfirst/generic.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +01001979 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_s8_nhwc_avg_generic_depthfirst/generic.cpp",
1980 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_s8_nhwc_max_2x2_s1_output2x2_depthfirst/generic.cpp",
1981 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_s8_nhwc_max_generic_depthfirst/generic.cpp",
1982 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_s8q_nhwc_avg_generic_depthfirst/generic.cpp",
1983 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_s8q_nhwc_max_generic_depthfirst/generic.cpp",
1984 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_u8_nhwc_avg_generic_depthfirst/generic.cpp",
1985 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_u8_nhwc_max_2x2_s1_output2x2_depthfirst/generic.cpp",
1986 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_u8_nhwc_max_generic_depthfirst/generic.cpp",
1987 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_u8q_nhwc_avg_generic_depthfirst/generic.cpp",
Viet-Hoa Do03b29712022-06-01 11:47:14 +01001988 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_u8q_nhwc_max_generic_depthfirst/generic.cpp",
1989 "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_fp16_nhwc_avg_3x3_s1_output2x2_depthfirst/generic.cpp",
1990 "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_fp16_nhwc_avg_generic_depthfirst/generic.cpp",
1991 "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_fp16_nhwc_max_2x2_s1_output2x2_depthfirst/generic.cpp",
1992 "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_fp16_nhwc_max_generic_depthfirst/generic.cpp",
1993 "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_fp32_nhwc_avg_3x3_s1_output2x2_depthfirst/generic.cpp",
1994 "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_fp32_nhwc_avg_generic_depthfirst/generic.cpp",
1995 "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_fp32_nhwc_max_2x2_s1_output2x2_depthfirst/generic.cpp",
1996 "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_fp32_nhwc_max_generic_depthfirst/generic.cpp",
1997 "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_s8_nhwc_avg_generic_depthfirst/generic.cpp",
1998 "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_s8_nhwc_max_2x2_s1_output2x2_depthfirst/generic.cpp",
1999 "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_s8_nhwc_max_generic_depthfirst/generic.cpp",
2000 "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_s8q_nhwc_avg_generic_depthfirst/generic.cpp",
2001 "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_s8q_nhwc_max_generic_depthfirst/generic.cpp",
2002 "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_u8_nhwc_avg_generic_depthfirst/generic.cpp",
2003 "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_u8_nhwc_max_2x2_s1_output2x2_depthfirst/generic.cpp",
2004 "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_u8_nhwc_max_generic_depthfirst/generic.cpp",
2005 "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_u8q_nhwc_avg_generic_depthfirst/generic.cpp",
2006 "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_u8q_nhwc_max_generic_depthfirst/generic.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01002007 ]
2008 }
2009 }
2010 },
Adnan AlSinan171fc3d2022-03-15 18:46:42 +00002011 "Pool3d": {
2012 "files": {
2013 "common": [
2014 "src/cpu/operators/CpuPool3d.cpp",
2015 "src/cpu/kernels/CpuPool3dKernel.cpp",
2016 "src/runtime/NEON/functions/NEPooling3dLayer.cpp"
2017 ],
2018 "neon": {
Adnan AlSinan9104cd52022-04-06 16:19:31 +01002019 "fp16": [ "src/cpu/kernels/pool3d/neon/fp16.cpp" ],
2020 "fp32": [ "src/cpu/kernels/pool3d/neon/fp32.cpp" ],
2021 "qasymm8": [ "src/cpu/kernels/pool3d/neon/qasymm8.cpp" ],
2022 "qasymm8_signed": [ "src/cpu/kernels/pool3d/neon/qasymm8_signed.cpp" ]
Adnan AlSinan171fc3d2022-03-15 18:46:42 +00002023 }
2024 }
2025 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002026 "PRelu": {
2027 "deps": [ "ElementwiseBinary" ],
Michalis Spyrou20fca522021-06-07 14:23:57 +01002028 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002029 "common": [
2030 "src/runtime/NEON/functions/NEPReluLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01002031 ]
2032 }
2033 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002034 "PriorBox": {
Michalis Spyrou20fca522021-06-07 14:23:57 +01002035 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002036 "common": [
2037 "src/core/NEON/kernels/NEPriorBoxLayerKernel.cpp",
2038 "src/runtime/NEON/functions/NEPriorBoxLayer.cpp"
2039 ]
2040 }
2041 },
2042 "Quantize": {
2043 "files": {
2044 "common": [
2045 "src/cpu/operators/CpuQuantize.cpp",
2046 "src/cpu/kernels/CpuQuantizeKernel.cpp",
2047 "src/runtime/NEON/functions/NEQuantizationLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01002048 ]
2049 }
2050 },
2051 "Range": {
2052 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002053 "common": [
2054 "src/core/NEON/kernels/NERangeKernel.cpp",
2055 "src/runtime/NEON/functions/NERange.cpp"
Yair Schwarzbaum9e8a7702021-11-08 10:58:06 +02002056 ],
2057 "neon": {
2058 "common": [ "src/cpu/kernels/range/generic/neon/impl.cpp" ],
2059 "fp32": [ "src/cpu/kernels/range/generic/neon/fp32.cpp" ],
2060 "fp16": [ "src/cpu/kernels/range/generic/neon/fp16.cpp" ],
2061 "integer": [ "src/cpu/kernels/range/generic/neon/integer.cpp" ]
2062 }
Michalis Spyrou20fca522021-06-07 14:23:57 +01002063 }
2064 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002065 "Reduction":{
2066 "deps": [ "Reshape" ],
Michalis Spyrou20fca522021-06-07 14:23:57 +01002067 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002068 "common": [
2069 "src/core/NEON/kernels/NEReductionOperationKernel.cpp",
2070 "src/runtime/NEON/functions/NEReductionOperation.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01002071 ]
2072 }
2073 },
Michalis Spyrou20fca522021-06-07 14:23:57 +01002074 "Reorg": {
2075 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002076 "common": [
2077 "src/core/NEON/kernels/NEReorgLayerKernel.cpp",
2078 "src/runtime/NEON/functions/NEReorgLayer.cpp"
2079 ]
2080 }
2081 },
2082 "Reshape": {
2083 "files": {
2084 "common": [
2085 "src/cpu/operators/CpuReshape.cpp",
2086 "src/cpu/kernels/CpuReshapeKernel.cpp",
2087 "src/runtime/NEON/functions/NEReshapeLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01002088 ]
2089 }
2090 },
David Svantesson3b162e52023-03-28 14:13:32 +00002091 "Reorder": {
2092 "files": {
2093 "common": [
David Svantessonf0ff76d2023-04-28 16:34:52 +00002094 "src/runtime/NEON/functions/NEReorderLayer.cpp",
David Svantesson3b162e52023-03-28 14:13:32 +00002095 "src/core/NEON/kernels/NEReorderKernel.cpp"
2096 ]
2097 }
2098 },
Michalis Spyrou20fca522021-06-07 14:23:57 +01002099 "Reverse": {
2100 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002101 "common": [
2102 "src/core/NEON/kernels/NEReverseKernel.cpp",
2103 "src/runtime/NEON/functions/NEReverse.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01002104 ]
2105 }
2106 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002107 "RNN": {
2108 "deps": [ "Activation", "Add", "FullyConnected", "Gemm"],
2109 "files": {
2110 "common": [ "src/runtime/NEON/functions/NERNNLayer.cpp" ]
2111 }
2112 },
Michalis Spyrou20fca522021-06-07 14:23:57 +01002113 "ROIAlign": {
2114 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002115 "common": [
2116 "src/core/NEON/kernels/NEROIAlignLayerKernel.cpp",
2117 "src/runtime/NEON/functions/NEROIAlignLayer.cpp"
Dana Zlotnik9ae5a4e2022-01-03 16:22:47 +02002118 ],
2119 "neon":{
Dana Zlotnik9ae5a4e2022-01-03 16:22:47 +02002120 "fp32":["src/cpu/kernels/roialign/generic/neon/fp32.cpp"],
2121 "fp16":["src/cpu/kernels/roialign/generic/neon/fp16.cpp"],
2122 "qasymm8":["src/cpu/kernels/roialign/generic/neon/qasymm8.cpp"],
2123 "qasymm8_signed":["src/cpu/kernels/roialign/generic/neon/qasymm8_signed.cpp"]
2124 }
Michalis Spyrou20fca522021-06-07 14:23:57 +01002125 }
2126 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002127 "ROIPool2d": {
Michalis Spyrou20fca522021-06-07 14:23:57 +01002128 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002129 "common": [
2130 "src/core/NEON/kernels/NEROIPoolingLayerKernel.cpp",
2131 "src/runtime/NEON/functions/NEROIPoolingLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01002132 ]
2133 }
2134 },
2135 "Scale": {
2136 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002137 "common": [
2138 "src/cpu/operators/CpuScale.cpp",
2139 "src/cpu/kernels/CpuScaleKernel.cpp",
2140 "src/runtime/NEON/functions/NEScale.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01002141 ],
2142 "sve": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002143 "fp16": [ "src/cpu/kernels/scale/sve/fp16.cpp" ],
2144 "fp32": [ "src/cpu/kernels/scale/sve/fp32.cpp" ],
2145 "integer": [ "src/cpu/kernels/scale/sve/integer.cpp" ],
2146 "qasymm8": [ "src/cpu/kernels/scale/sve/qasymm8.cpp" ],
2147 "qasymm8_signed": [ "src/cpu/kernels/scale/sve/qasymm8_signed.cpp" ]
Michalis Spyrou20fca522021-06-07 14:23:57 +01002148 },
2149 "neon": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002150 "fp16": [ "src/cpu/kernels/scale/neon/fp16.cpp" ],
2151 "integer": [ "src/cpu/kernels/scale/neon/integer.cpp" ],
Gunes Bayirc4f27432022-09-11 15:59:19 +01002152 "qasymm8": [ "src/cpu/kernels/scale/neon/qasymm8.cpp", "src/cpu/kernels/scale/neon/integer.cpp" ],
2153 "qasymm8_signed": [ "src/cpu/kernels/scale/neon/qasymm8_signed.cpp", "src/cpu/kernels/scale/neon/integer.cpp" ]
Michalis Spyrou20fca522021-06-07 14:23:57 +01002154 }
2155 }
2156 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002157 "Select": {
2158 "files": {
2159 "common": [
2160 "src/core/NEON/kernels/NESelectKernel.cpp",
2161 "src/runtime/NEON/functions/NESelect.cpp"
Anton Vainer8a9a0fb2022-01-09 14:37:12 +02002162 ],
2163 "neon": {
2164 "common": [ "src/cpu/kernels/select/generic/neon/impl.cpp" ],
2165 "fp32": [ "src/cpu/kernels/select/generic/neon/fp32.cpp" ],
2166 "fp16": [ "src/cpu/kernels/select/generic/neon/fp16.cpp" ],
2167 "integer": [ "src/cpu/kernels/select/generic/neon/integer.cpp" ]
2168 }
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002169 }
2170 },
2171 "Slice": {
2172 "deps": [ "StridedSlice" ],
2173 "files": {
2174 "common": [ "src/runtime/NEON/functions/NESlice.cpp" ]
2175 }
2176 },
Michalis Spyrou20fca522021-06-07 14:23:57 +01002177 "Softmax": {
2178 "deps": [
2179 "Permute"
2180 ],
2181 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002182 "common": [
2183 "src/cpu/operators/CpuSoftmax.cpp",
2184 "src/cpu/kernels/CpuSoftmaxKernel.cpp",
2185 "src/runtime/NEON/functions/NESoftmaxLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01002186 ],
Dana Zlotnikc48a3e52021-12-21 13:34:42 +02002187 "neon":{
Dana Zlotnika538ae52022-02-21 13:12:41 +02002188 "common":["src/cpu/kernels/softmax/generic/neon/impl.cpp"],
Dana Zlotnikc48a3e52021-12-21 13:34:42 +02002189 "fp32": ["src/cpu/kernels/softmax/generic/neon/fp32.cpp"],
ramelg01a1f78512022-06-29 16:28:10 +01002190 "fp16": ["src/cpu/kernels/softmax/generic/neon/fp16.cpp"],
2191 "qasymm8":[ "src/cpu/kernels/softmax/generic/neon/qasymm8.cpp"],
Dana Zlotnik6a2df882022-01-17 09:54:26 +02002192 "qasymm8_signed":["src/cpu/kernels/softmax/generic/neon/qasymm8_signed.cpp"]
Dana Zlotnikc48a3e52021-12-21 13:34:42 +02002193 },
Michalis Spyrou20fca522021-06-07 14:23:57 +01002194 "sve": {
Dana Zlotnikc48a3e52021-12-21 13:34:42 +02002195 "common": [ "src/cpu/kernels/softmax/generic/sve/impl.cpp" ],
2196 "fp32": ["src/cpu/kernels/softmax/generic/sve/fp32.cpp"],
2197 "fp16": ["src/cpu/kernels/softmax/generic/sve/fp16.cpp"],
Dana Zlotnik6a2df882022-01-17 09:54:26 +02002198 "qasymm8": ["src/cpu/kernels/softmax/generic/sve/qasymm8.cpp" ],
2199 "qasymm8_signed": ["src/cpu/kernels/softmax/generic/sve/qasymm8_signed.cpp"]
2200 },
2201 "sve2":{
Dana Zlotnika538ae52022-02-21 13:12:41 +02002202 "common" :["src/cpu/kernels/softmax/generic/sve2/impl.cpp"],
ramelg01a1f78512022-06-29 16:28:10 +01002203 "qasymm8":[ "src/cpu/kernels/softmax/generic/sve2/qasymm8.cpp"],
Dana Zlotnik6a2df882022-01-17 09:54:26 +02002204 "qasymm8_signed":["src/cpu/kernels/softmax/generic/sve2/qasymm8_signed.cpp"]
Michalis Spyrou20fca522021-06-07 14:23:57 +01002205 }
2206 }
2207 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002208 "SpaceToBatch": {
2209 "files": {
2210 "common": [
2211 "src/core/NEON/kernels/NESpaceToBatchLayerKernel.cpp",
2212 "src/runtime/NEON/functions/NESpaceToBatchLayer.cpp"
2213 ]
2214 }
2215 },
2216 "SpaceToDepth": {
2217 "files": {
2218 "common": [
2219 "src/core/NEON/kernels/NESpaceToDepthLayerKernel.cpp",
2220 "src/runtime/NEON/functions/NESpaceToDepthLayer.cpp"
2221 ]
2222 }
2223 },
2224 "Split": {
2225 "deps": [ "StridedSlice" ],
2226 "files": {
2227 "common": [
2228 "src/runtime/NEON/functions/NESplit.cpp"
2229 ]
2230 }
2231 },
2232 "Stack": {
2233 "files": {
2234 "common": [
2235 "src/core/NEON/kernels/NEStackLayerKernel.cpp",
2236 "src/runtime/NEON/functions/NEStackLayer.cpp"
2237 ]
2238 }
2239 },
2240 "StridedSlice": {
2241 "files": {
2242 "common": [
2243 "src/core/NEON/kernels/NEStridedSliceKernel.cpp",
2244 "src/runtime/NEON/functions/NEStridedSlice.cpp"
2245 ]
2246 }
2247 },
Michalis Spyrou20fca522021-06-07 14:23:57 +01002248 "Sub": {
2249 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002250 "common": [
2251 "src/cpu/operators/CpuSub.cpp",
2252 "src/cpu/kernels/CpuSubKernel.cpp",
Freddie Liardet487d3902021-09-21 12:36:43 +01002253 "src/runtime/NEON/functions/NEArithmeticSubtraction.cpp",
2254 "src/cpu/kernels/sub/neon/qasymm8.cpp",
2255 "src/cpu/kernels/sub/neon/qasymm8_signed.cpp",
2256 "src/cpu/kernels/sub/neon/qsymm16.cpp"
2257 ]
Michalis Spyrou20fca522021-06-07 14:23:57 +01002258 }
2259 },
Michalis Spyrou20fca522021-06-07 14:23:57 +01002260 "Tile": {
2261 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002262 "common": [
2263 "src/core/NEON/kernels/NETileKernel.cpp",
2264 "src/runtime/NEON/functions/NETile.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01002265 ]
2266 }
2267 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002268 "Transpose": {
Michalis Spyrou20fca522021-06-07 14:23:57 +01002269 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002270 "common": [
2271 "src/cpu/kernels/CpuTransposeKernel.cpp",
2272 "src/cpu/operators/CpuTranspose.cpp",
2273 "src/runtime/NEON/functions/NETranspose.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01002274 ]
2275 }
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002276 },
2277 "Unstack": {
2278 "deps": [ "StridedSlice" ],
2279 "files": {
2280 "common": [ "src/runtime/NEON/functions/NEUnstack.cpp" ]
2281 }
Michalis Spyrou20fca522021-06-07 14:23:57 +01002282 }
2283 }
Giorgio Arena232c4522022-03-03 10:09:01 +00002284 },
2285 "experimental": {
SiCong Li23882a92023-06-28 09:49:45 +01002286 "dynamic_fusion": {
2287 "common": [
2288 "src/dynamic_fusion/runtime/gpu/cl/ClKernelRuntime.cpp",
2289 "src/dynamic_fusion/runtime/gpu/cl/ClWorkloadRuntime.cpp",
2290 "src/dynamic_fusion/sketch/attributes/CastAttributes.cpp",
2291 "src/dynamic_fusion/sketch/attributes/ClampAttributes.cpp",
2292 "src/dynamic_fusion/sketch/attributes/Conv2dAttributes.cpp",
2293 "src/dynamic_fusion/sketch/attributes/DepthwiseConv2dAttributes.cpp",
2294 "src/dynamic_fusion/sketch/attributes/Pool2dAttributes.cpp",
2295 "src/dynamic_fusion/sketch/attributes/ResizeAttributes.cpp",
2296 "src/dynamic_fusion/sketch/attributes/SoftmaxAttributes.cpp",
2297 "src/dynamic_fusion/sketch/attributes/ReshapeAttributes.cpp",
2298 "src/dynamic_fusion/sketch/gpu/GpuKernelArgument.cpp",
2299 "src/dynamic_fusion/sketch/gpu/GpuKernelComponentGraph.cpp",
2300 "src/dynamic_fusion/sketch/gpu/GpuKernelComponentGroup.cpp",
2301 "src/dynamic_fusion/sketch/gpu/GpuKernelComponentStream.cpp",
2302 "src/dynamic_fusion/sketch/gpu/GpuLogicalKernel.cpp",
2303 "src/dynamic_fusion/sketch/gpu/GpuOperatorGroup.cpp",
2304 "src/dynamic_fusion/sketch/gpu/GpuWorkloadContext.cpp",
2305 "src/dynamic_fusion/sketch/gpu/GpuWorkloadSketch.cpp",
2306 "src/dynamic_fusion/sketch/gpu/components/cl/ClComponentActivation.cpp",
2307 "src/dynamic_fusion/sketch/gpu/components/cl/ClComponentCast.cpp",
2308 "src/dynamic_fusion/sketch/gpu/components/cl/ClComponentDepthwiseConv2d.cpp",
2309 "src/dynamic_fusion/sketch/gpu/components/cl/ClComponentDirectConv2d.cpp",
2310 "src/dynamic_fusion/sketch/gpu/components/cl/ClComponentPool2d.cpp",
2311 "src/dynamic_fusion/sketch/gpu/components/cl/ClComponentElementwiseBinary.cpp",
2312 "src/dynamic_fusion/sketch/gpu/components/cl/ClComponentLogits1DMaxShiftExpSum.cpp",
2313 "src/dynamic_fusion/sketch/gpu/components/cl/ClComponentLogits1DNorm.cpp",
2314 "src/dynamic_fusion/sketch/gpu/components/cl/ClComponentReshape.cpp",
2315 "src/dynamic_fusion/sketch/gpu/components/cl/ClComponentResize.cpp",
2316 "src/dynamic_fusion/sketch/gpu/components/cl/ClComponentStore.cpp",
2317 "src/dynamic_fusion/sketch/gpu/operators/GpuAdd.cpp",
2318 "src/dynamic_fusion/sketch/gpu/operators/GpuCast.cpp",
2319 "src/dynamic_fusion/sketch/gpu/operators/GpuClamp.cpp",
2320 "src/dynamic_fusion/sketch/gpu/operators/GpuConv2d.cpp",
2321 "src/dynamic_fusion/sketch/gpu/operators/GpuDepthwiseConv2d.cpp",
2322 "src/dynamic_fusion/sketch/gpu/operators/GpuMul.cpp",
2323 "src/dynamic_fusion/sketch/gpu/operators/GpuReshape.cpp",
2324 "src/dynamic_fusion/sketch/gpu/operators/GpuPool2d.cpp",
2325 "src/dynamic_fusion/sketch/gpu/operators/GpuOutput.cpp",
2326 "src/dynamic_fusion/sketch/gpu/operators/GpuResize.cpp",
2327 "src/dynamic_fusion/sketch/gpu/operators/GpuSigmoid.cpp",
2328 "src/dynamic_fusion/sketch/gpu/operators/GpuSoftmax.cpp",
2329 "src/dynamic_fusion/sketch/gpu/operators/GpuSub.cpp",
2330 "src/dynamic_fusion/sketch/gpu/operators/GpuTanh.cpp",
2331 "src/dynamic_fusion/sketch/gpu/operators/internal/GpuElementwiseBinaryCommon.cpp"
2332 ],
2333 "template_writer": [
2334 "src/dynamic_fusion/sketch/gpu/template_writer/cl/ClTemplateActivation.cpp",
2335 "src/dynamic_fusion/sketch/gpu/template_writer/cl/ClTemplateCast.cpp",
2336 "src/dynamic_fusion/sketch/gpu/template_writer/cl/ClTemplateDepthwiseConv2d.cpp",
2337 "src/dynamic_fusion/sketch/gpu/template_writer/cl/ClTemplateDirectConv2d.cpp",
2338 "src/dynamic_fusion/sketch/gpu/template_writer/cl/ClTemplatePool2d.cpp",
2339 "src/dynamic_fusion/sketch/gpu/template_writer/cl/ClTemplateElementwiseBinary.cpp",
2340 "src/dynamic_fusion/sketch/gpu/template_writer/cl/ClTemplateLogits1DMaxShiftExpSum.cpp",
2341 "src/dynamic_fusion/sketch/gpu/template_writer/cl/ClTemplateLogits1DNorm.cpp",
2342 "src/dynamic_fusion/sketch/gpu/template_writer/cl/ClTemplateReshape.cpp",
2343 "src/dynamic_fusion/sketch/gpu/template_writer/cl/ClTemplateResize.cpp",
2344 "src/dynamic_fusion/sketch/gpu/template_writer/cl/ClTemplateStore.cpp",
2345 "src/dynamic_fusion/sketch/gpu/template_writer/cl/ClTemplateWriter.cpp",
2346 "src/dynamic_fusion/sketch/gpu/template_writer/GpuKernelVariableTable.cpp"
2347 ],
2348 "ckw_driver": [
2349 "src/dynamic_fusion/sketch/gpu/ckw_driver/GpuCkwComponentArgument.cpp",
2350 "src/dynamic_fusion/sketch/gpu/ckw_driver/GpuCkwDriver.cpp",
2351 "src/dynamic_fusion/sketch/gpu/ckw_driver/components/GpuCkwActivation.cpp",
2352 "src/dynamic_fusion/sketch/gpu/ckw_driver/components/GpuCkwCast.cpp",
Jakub Sujake1c96e72023-07-31 13:36:58 +01002353 "src/dynamic_fusion/sketch/gpu/ckw_driver/components/GpuCkwDirectConv2d.cpp",
SiCong Li23882a92023-06-28 09:49:45 +01002354 "src/dynamic_fusion/sketch/gpu/ckw_driver/components/GpuCkwElementwiseBinary.cpp",
Adnan AlSinan2e6d6592023-08-21 13:54:27 +01002355 "src/dynamic_fusion/sketch/gpu/ckw_driver/components/GpuCkwPool2d.cpp",
Gunes Bayir91cb7332023-07-25 17:00:33 +01002356 "src/dynamic_fusion/sketch/gpu/ckw_driver/components/GpuCkwResize.cpp",
SiCong Li23882a92023-06-28 09:49:45 +01002357 "src/dynamic_fusion/sketch/gpu/ckw_driver/components/GpuCkwStore.cpp",
2358 "src/dynamic_fusion/sketch/gpu/ckw_driver/GpuCkwKernelWriter.cpp",
2359 "src/dynamic_fusion/sketch/gpu/ckw_driver/GpuCkwScopedKernelWriter.cpp",
2360 "src/dynamic_fusion/sketch/gpu/ckw_driver/GpuCkwVariableTable.cpp",
2361 "src/dynamic_fusion/runtime/gpu/cl/ckw_driver/GpuCkwKernelArgumentsHelpers.cpp"
2362 ]
2363 }
Michalis Spyrou20fca522021-06-07 14:23:57 +01002364 }
ramelg018a164882022-04-07 02:42:52 +01002365}