blob: 6c5b78f77897d20ed341d23fd60b52b75bc832d3 [file] [log] [blame]
Georgios Pinitasbdcdc392021-04-22 16:42:03 +01001{
Michalis Spyrou20fca522021-06-07 14:23:57 +01002 "common": [
3 "src/common/cpuinfo/CpuInfo.cpp",
4 "src/common/cpuinfo/CpuModel.cpp",
5 "src/common/cpuinfo/CpuIsaInfo.cpp",
6 "src/common/utils/LegacySupport.cpp",
7 "src/common/AllocatorWrapper.cpp",
8 "src/common/ITensorV2.cpp",
Georgios Pinitas41648142021-08-03 08:24:00 +01009 "src/common/TensorPack.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +010010 "src/common/IOperator.cpp",
11 "src/core/AccessWindowAutoPadding.cpp",
12 "src/core/AccessWindowStatic.cpp",
13 "src/core/AccessWindowTranspose.cpp",
14 "src/core/Error.cpp",
15 "src/core/GPUTarget.cpp",
16 "src/core/Helpers.cpp",
17 "src/core/IAccessWindow.cpp",
18 "src/core/IKernel.cpp",
19 "src/core/ITensor.cpp",
20 "src/core/ITensorPack.cpp",
21 "src/core/Rounding.cpp",
22 "src/core/Size2D.cpp",
23 "src/core/SubTensorInfo.cpp",
24 "src/core/TensorInfo.cpp",
25 "src/core/Utils.cpp",
26 "src/core/Validate.cpp",
27 "src/core/Version.cpp",
28 "src/core/helpers/SoftmaxHelpers.cpp",
29 "src/core/helpers/WindowHelpers.cpp",
30 "src/core/utils/AssemblyUtils.cpp",
31 "src/core/utils/ScaleUtils.cpp",
32 "src/core/utils/helpers/fft.cpp",
33 "src/core/utils/helpers/tensor_transform.cpp",
34 "src/core/utils/io/FileHandler.cpp",
35 "src/core/utils/misc/MMappedFile.cpp",
36 "src/core/utils/quantization/AsymmHelpers.cpp",
37 "src/core/CPP/CPPTypes.cpp",
38 "src/core/CPP/kernels/CPPBoxWithNonMaximaSuppressionLimitKernel.cpp",
39 "src/core/CPP/kernels/CPPNonMaximumSuppressionKernel.cpp",
40 "src/core/CPP/kernels/CPPPermuteKernel.cpp",
41 "src/core/CPP/kernels/CPPTopKVKernel.cpp",
42 "src/core/CPP/kernels/CPPUpsampleKernel.cpp",
43 "src/runtime/Allocator.cpp",
44 "src/runtime/BlobLifetimeManager.cpp",
45 "src/runtime/BlobMemoryPool.cpp",
46 "src/runtime/ISimpleLifetimeManager.cpp",
47 "src/runtime/ITensorAllocator.cpp",
48 "src/runtime/IWeightsManager.cpp",
49 "src/runtime/IScheduler.cpp",
50 "src/runtime/Memory.cpp",
51 "src/runtime/MemoryManagerOnDemand.cpp",
52 "src/runtime/OffsetLifetimeManager.cpp",
53 "src/runtime/OffsetMemoryPool.cpp",
54 "src/runtime/OperatorTensor.cpp",
55 "src/runtime/PoolManager.cpp",
56 "src/runtime/RuntimeContext.cpp",
57 "src/runtime/Scheduler.cpp",
58 "src/runtime/SchedulerFactory.cpp",
59 "src/runtime/SchedulerUtils.cpp",
60 "src/runtime/SubTensor.cpp",
61 "src/runtime/Tensor.cpp",
62 "src/runtime/TensorAllocator.cpp",
63 "src/runtime/Utils.cpp",
64 "src/runtime/CPP/ICPPSimpleFunction.cpp",
65 "src/runtime/CPP/functions/CPPBoxWithNonMaximaSuppressionLimit.cpp",
66 "src/runtime/CPP/functions/CPPDetectionOutputLayer.cpp",
67 "src/runtime/CPP/functions/CPPDetectionPostProcessLayer.cpp",
68 "src/runtime/CPP/functions/CPPNonMaximumSuppression.cpp",
69 "src/runtime/CPP/functions/CPPPermute.cpp",
70 "src/runtime/CPP/functions/CPPTopKV.cpp",
71 "src/runtime/CPP/functions/CPPUpsample.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +010072 ],
Georgios Pinitasb6af4822021-09-14 12:33:34 +010073 "logging": [
74 "src/core/utils/logging/FilePrinter.cpp",
75 "src/core/utils/logging/Helpers.cpp",
76 "src/core/utils/logging/Logger.cpp",
77 "src/core/utils/logging/LoggerRegistry.cpp"
78 ],
79 "scheduler": {
80 "single": [ "src/runtime/CPP/SingleThreadScheduler.cpp" ],
81 "threads": [ "src/runtime/CPP/CPPScheduler.cpp" ],
82 "omp": [ "src/runtime/OMP/OMPScheduler.cpp"]
83 },
Michalis Spyrou20fca522021-06-07 14:23:57 +010084 "c_api": {
Georgios Pinitas13ef1762021-07-14 17:14:43 +010085 "common": [
Michalis Spyrou20fca522021-06-07 14:23:57 +010086 "src/c/AclContext.cpp",
Georgios Pinitas06ac6e42021-07-05 08:08:52 +010087 "src/c/AclOperator.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +010088 "src/c/AclQueue.cpp",
89 "src/c/AclTensor.cpp",
90 "src/c/AclTensorPack.cpp",
91 "src/c/AclVersion.cpp"
Georgios Pinitasbdcdc392021-04-22 16:42:03 +010092 ],
Georgios Pinitas13ef1762021-07-14 17:14:43 +010093 "cpu": [
94 ],
Michalis Spyrou20fca522021-06-07 14:23:57 +010095 "gpu": [
96 "src/c/cl/AclOpenClExt.cpp"
Georgios Pinitas41648142021-08-03 08:24:00 +010097 ],
98 "operators":
99 [
100 "src/c/operators/AclActivation.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +0100101 ]
102 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100103 "high_priority": [
104 "Activation",
105 "DepthwiseConv2d",
106 "Conv2d",
107 "Permute",
108 "Pool2d",
SiCong Li83d06742023-05-11 11:54:22 +0100109 "Reshape",
110 "MatMul"
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100111 ],
Michalis Spyrou20fca522021-06-07 14:23:57 +0100112 "gpu": {
Georgios Pinitas13ef1762021-07-14 17:14:43 +0100113 "common": [
114 "src/core/CL/CLCompileContext.cpp",
Giorgio Arenaba2dd822021-07-28 16:10:03 +0100115 "src/core/CL/DefaultLWSHeuristics.cpp",
Georgios Pinitas13ef1762021-07-14 17:14:43 +0100116 "src/core/CL/CLHelpers.cpp",
117 "src/core/CL/CLKernelLibrary.cpp",
118 "src/core/CL/CLUtils.cpp",
119 "src/core/CL/ICLKernel.cpp",
120 "src/core/CL/ICLSimple2DKernel.cpp",
121 "src/core/CL/ICLSimple3DKernel.cpp",
122 "src/core/CL/ICLSimpleKernel.cpp",
123 "src/core/CL/ICLTensor.cpp",
124 "src/core/CL/OpenCL.cpp",
Georgios Pinitas13ef1762021-07-14 17:14:43 +0100125 "src/gpu/cl/ClContext.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100126 "src/gpu/cl/ClKernelLibrary.cpp",
Georgios Pinitas13ef1762021-07-14 17:14:43 +0100127 "src/gpu/cl/ClQueue.cpp",
128 "src/gpu/cl/ClTensor.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100129 "src/core/CL/kernels/CLFillBorderKernel.cpp",
Georgios Pinitas13ef1762021-07-14 17:14:43 +0100130 "src/runtime/CL/CLBufferAllocator.cpp",
131 "src/runtime/CL/CLGEMMHeuristicsHandle.cpp",
132 "src/runtime/CL/CLHelpers.cpp",
133 "src/runtime/CL/CLMemory.cpp",
134 "src/runtime/CL/CLMemoryRegion.cpp",
135 "src/runtime/CL/CLOperator.cpp",
136 "src/runtime/CL/CLRuntimeContext.cpp",
137 "src/runtime/CL/CLScheduler.cpp",
138 "src/runtime/CL/CLSubTensor.cpp",
139 "src/runtime/CL/CLTensor.cpp",
140 "src/runtime/CL/CLTensorAllocator.cpp",
141 "src/runtime/CL/CLTuner.cpp",
142 "src/runtime/CL/ICLSimpleFunction.cpp",
143 "src/runtime/CL/Utils.cpp",
Georgios Pinitas13ef1762021-07-14 17:14:43 +0100144 "src/runtime/CL/mlgo/HeuristicTree.cpp",
145 "src/runtime/CL/mlgo/MLGOHeuristics.cpp",
146 "src/runtime/CL/mlgo/MLGOParser.cpp",
147 "src/runtime/CL/mlgo/Utils.cpp",
148 "src/runtime/CL/tuners/CLTuningParametersList.cpp"
149 ],
Michalis Spyrou20fca522021-06-07 14:23:57 +0100150 "operators": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100151 "Activation":{
152 "files": {
153 "common": [
154 "src/gpu/cl/kernels/ClActivationKernel.cpp",
155 "src/gpu/cl/operators/ClActivation.cpp",
156 "src/runtime/CL/functions/CLActivationLayer.cpp"
157 ]
158 }
159 },
160 "ArgMinMax": {
161 "deps": [ "Reshape" ],
162 "files": {
163 "common": [
164 "src/core/CL/kernels/CLArgMinMaxLayerKernel.cpp",
165 "src/runtime/CL/functions/CLArgMinMaxLayer.cpp"
166 ]
167 }
168 },
169 "Add": {
170 "files": {
171 "common": [
172 "src/gpu/cl/kernels/ClElementwiseKernel.cpp",
173 "src/gpu/cl/operators/ClAdd.cpp"
174 ]
175 }
176 },
177 "BatchNormalization": {
178 "files": {
179 "common": [
180 "src/core/CL/kernels/CLBatchNormalizationLayerKernel.cpp",
181 "src/core/CL/kernels/CLFuseBatchNormalizationKernel.cpp",
182 "src/runtime/CL/functions/CLBatchNormalizationLayer.cpp",
183 "src/runtime/CL/functions/CLFuseBatchNormalization.cpp"
184 ]
185 }
186 },
187 "BatchToSpace": {
188 "files": {
189 "common": [
190 "src/core/CL/kernels/CLBatchToSpaceLayerKernel.cpp",
191 "src/runtime/CL/functions/CLBatchToSpaceLayer.cpp"
192 ]
193 }
194 },
195 "Bitwise": {
196 "files": {
197 "common": [ "src/core/CL/kernels/CLBitwiseKernel.cpp" ]
198 }
199 },
200 "BitwiseAnd": {
201 "deps": [ "Bitwise" ],
202 "files": {
203 "common": [ "src/runtime/CL/functions/CLBitwiseAnd.cpp" ]
204 }
205 },
206 "BitwiseNot": {
207 "deps": [ "Bitwise" ],
208 "files": {
209 "common": [ "src/runtime/CL/functions/CLBitwiseNot.cpp" ]
210 }
211 },
212 "BitwiseOr": {
213 "deps": [ "Bitwise" ],
214 "files": {
215 "common": [ "src/runtime/CL/functions/CLBitwiseOr.cpp" ]
216 }
217 },
218 "BitwiseXor": {
219 "deps": [ "Bitwise" ],
220 "files": {
221 "common": [ "src/runtime/CL/functions/CLBitwiseXor.cpp" ]
222 }
223 },
224 "BoundingBoxTransform": {
225 "files": {
226 "common": [
227 "src/core/CL/kernels/CLBoundingBoxTransformKernel.cpp",
228 "src/runtime/CL/functions/CLBoundingBoxTransform.cpp"
229 ]
230 }
231 },
232 "Cast": {
233 "files": {
234 "common": [
235 "src/gpu/cl/kernels/ClCastKernel.cpp",
236 "src/gpu/cl/operators/ClCast.cpp",
237 "src/runtime/CL/functions/CLCast.cpp"
238 ]
239 }
240 },
241 "ChannelShuffle": {
242 "files": {
243 "common": [
244 "src/core/CL/kernels/CLChannelShuffleLayerKernel.cpp",
245 "src/runtime/CL/functions/CLChannelShuffleLayer.cpp"
246 ]
247 }
248 },
249 "Comparison": {
250 "files": {
251 "common": [
252 "src/core/CL/kernels/CLComparisonKernel.cpp",
253 "src/runtime/CL/functions/CLComparison.cpp"
254 ]
255 }
256 },
257 "Concatenate": {
258 "files": {
259 "common": [
260 "src/gpu/cl/kernels/ClBatchConcatenateKernel.cpp",
261 "src/gpu/cl/kernels/ClDepthConcatenateKernel.cpp",
262 "src/gpu/cl/kernels/ClHeightConcatenateKernel.cpp",
263 "src/gpu/cl/kernels/ClWidthConcatenate2TensorsKernel.cpp",
264 "src/gpu/cl/kernels/ClWidthConcatenate4TensorsKernel.cpp",
265 "src/gpu/cl/kernels/ClWidthConcatenateKernel.cpp",
266 "src/gpu/cl/operators/ClConcatenate.cpp",
267 "src/runtime/CL/functions/CLConcatenateLayer.cpp"
268 ]
269 }
270 },
271 "Conv2d": {
272 "deps": [
273 "Activation",
274 "ElementwiseBinary",
275 "FFT2D",
276 "Gemm",
277 "Mul",
278 "Pad",
279 "Permute",
280 "Reduction",
281 "Reshape",
282 "Reverse",
283 "Slice"
284 ],
285 "files": {
286 "common": [
287 "src/gpu/cl/kernels/ClDirectConv2dKernel.cpp",
288 "src/gpu/cl/kernels/ClWinogradFilterTransformKernel.cpp",
289 "src/gpu/cl/kernels/ClWinogradInputTransformKernel.cpp",
290 "src/gpu/cl/kernels/ClWinogradOutputTransformKernel.cpp",
291 "src/gpu/cl/kernels/ClIm2ColKernel.cpp",
Gian Marco Iodice76335eb2022-11-17 11:03:39 +0000292 "src/gpu/cl/kernels/ClIndirectConv2dKernel.cpp",
Gian Marco Iodice5d016812022-11-17 11:03:39 +0000293 "src/gpu/cl/kernels/ClIndirectConv2dAddressPrecalculationKernel.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100294 "src/gpu/cl/kernels/ClCol2ImKernel.cpp",
295 "src/gpu/cl/operators/ClConv2d.cpp",
296 "src/gpu/cl/operators/ClDirectConv2d.cpp",
297 "src/gpu/cl/operators/ClGemmConv2d.cpp",
Gian Marco Iodice76335eb2022-11-17 11:03:39 +0000298 "src/gpu/cl/operators/ClIndirectConv2d.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100299 "src/gpu/cl/operators/ClWinogradConv2d.cpp",
300 "src/gpu/cl/kernels/ClWeightsReshapeKernel.cpp",
301 "src/runtime/CL/functions/CLConvolutionLayer.cpp",
302 "src/runtime/CL/functions/CLDirectConvolutionLayer.cpp",
303 "src/runtime/CL/functions/CLFFTConvolutionLayer.cpp",
304 "src/runtime/CL/functions/CLGEMMConvolutionLayer.cpp",
Gian Marco Iodice76335eb2022-11-17 11:03:39 +0000305 "src/runtime/CL/functions/CLIndirectConvolutionLayer.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100306 "src/runtime/CL/functions/CLWinogradConvolutionLayer.cpp"
307 ]
308 }
309 },
Giorgio Arena273c28c2021-10-14 15:59:15 +0100310 "Conv3d": {
311 "files": {
312 "common": [
313 "src/gpu/cl/kernels/ClDirectConv3dKernel.cpp",
314 "src/gpu/cl/operators/ClDirectConv3d.cpp",
315 "src/runtime/CL/functions/CLConv3D.cpp"
316 ]
317 }
318 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100319 "Copy": {
320 "files": {
321 "common": [
322 "src/gpu/cl/kernels/ClCopyKernel.cpp",
323 "src/gpu/cl/operators/ClCopy.cpp",
324 "src/runtime/CL/functions/CLCopy.cpp"
325 ]
326 }
327 },
328 "CropResize": {
329 "deps": [ "Copy", "Fill", "Scale" ],
330 "files": {
331 "common": [
332 "src/gpu/cl/kernels/ClCropKernel.cpp",
333 "src/gpu/cl/operators/ClCrop.cpp",
334 "src/runtime/CL/functions/CLCrop.cpp",
335 "src/runtime/CL/functions/CLCropResize.cpp"
336 ]
337 }
338 },
339 "Deconv2d": {
340 "deps": [ "Conv2d", "Reverse", "Transpose"],
341 "files": {
342 "common": [
343 "src/core/CL/kernels/CLDeconvolutionLayerUpsampleKernel.cpp",
344 "src/core/CL/kernels/CLDeconvolutionReshapeOutputKernel.cpp",
Gunes Bayirec0113d2022-11-09 09:26:27 +0000345 "src/gpu/cl/kernels/ClTransposedConvolutionKernel.cpp",
346 "src/gpu/cl/operators/ClTransposedConvolution.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100347 "src/runtime/CL/functions/CLDeconvolutionLayer.cpp",
348 "src/runtime/CL/functions/CLDeconvolutionLayerUpsample.cpp",
349 "src/runtime/CL/functions/CLDirectDeconvolutionLayer.cpp",
350 "src/runtime/CL/functions/CLGEMMDeconvolutionLayer.cpp"
351 ]
352 }
353 },
354 "DepthConvert": {
355 "deps": [ "Cast"],
356 "files": {
357 "common": [ "src/runtime/CL/functions/CLDepthConvertLayer.cpp" ]
358 }
359 },
360 "DepthToSpace": {
361 "files": {
362 "common": [
363 "src/core/CL/kernels/CLDepthToSpaceLayerKernel.cpp",
364 "src/runtime/CL/functions/CLDepthToSpaceLayer.cpp"
365 ]
366 }
367 },
368 "DepthwiseConv2d": {
369 "deps": [ "Permute" ],
370 "files": {
371 "common": [
372 "src/core/CL/kernels/CLDepthwiseConvolutionLayerNativeKernel.cpp",
373 "src/runtime/CL/functions/CLDepthwiseConvolutionLayer.cpp"
374 ]
375 }
376 },
377 "Dequantize": {
378 "files": {
379 "common": [
380 "src/gpu/cl/kernels/ClDequantizeKernel.cpp",
381 "src/gpu/cl/operators/ClDequantize.cpp",
382 "src/runtime/CL/functions/CLDequantizationLayer.cpp"
383 ]
384 }
385 },
386 "ElementwiseBinary": {
387 "deps": ["Add", "Sub"],
388 "files": {
389 "common": [
390 "src/gpu/cl/kernels/ClElementwiseKernel.cpp",
391 "src/gpu/cl/operators/ClElementwiseOperations.cpp",
392 "src/runtime/CL/functions/CLElementwiseOperations.cpp"
393 ]
394 }
395 },
396 "ElementwiseUnary":{
397 "files": {
398 "common": [
399 "src/gpu/cl/kernels/ClElementwiseUnaryKernel.cpp",
400 "src/gpu/cl/operators/ClElementwiseUnary.cpp",
401 "src/runtime/CL/functions/CLElementwiseUnaryLayer.cpp"
402 ]
403 }
404 },
405 "FFT1D": {
406 "files": {
407 "common": [
408 "src/core/CL/kernels/CLFFTDigitReverseKernel.cpp",
409 "src/core/CL/kernels/CLFFTRadixStageKernel.cpp",
410 "src/core/CL/kernels/CLFFTScaleKernel.cpp",
411 "src/runtime/CL/functions/CLFFT1D.cpp"
412 ]
413 }
414 },
415 "FFT2D": {
416 "deps": [ "FFT1D" ],
417 "files": {
418 "common": [ "src/runtime/CL/functions/CLFFT2D.cpp" ]
419 }
420 },
421 "Fill": {
422 "files": {
423 "common": [
424 "src/gpu/cl/kernels/ClFillKernel.cpp",
425 "src/gpu/cl/operators/ClFill.cpp",
426 "src/runtime/CL/functions/CLFill.cpp"
427 ]
428 }
429 },
430 "Flatten": {
431 "files": {
432 "common": [
433 "src/gpu/cl/operators/ClFlatten.cpp",
434 "src/runtime/CL/functions/CLFlattenLayer.cpp"
435 ]
436 }
437 },
438 "Floor": {
439 "files": {
440 "common": [
441 "src/gpu/cl/kernels/ClFloorKernel.cpp",
442 "src/gpu/cl/operators/ClFloor.cpp",
443 "src/runtime/CL/functions/CLFloor.cpp"
444 ]
445 }
446 },
447 "FullyConnected": {
448 "deps": [ "Flatten", "Gemm", "Transpose"],
449 "files": {
450 "common": [
451 "src/gpu/cl/kernels/ClConvertFullyConnectedWeightsKernel.cpp",
452 "src/gpu/cl/operators/ClConvertFullyConnectedWeights.cpp",
453 "src/gpu/cl/operators/ClFullyConnected.cpp",
454 "src/runtime/CL/functions/CLConvertFullyConnectedWeights.cpp",
455 "src/runtime/CL/functions/CLFullyConnectedLayer.cpp"
456 ]
457 }
458 },
459 "Gather": {
460 "files": {
461 "common": [
462 "src/core/CL/kernels/CLGatherKernel.cpp",
463 "src/runtime/CL/functions/CLGather.cpp"]
464 }
465 },
466 "Gemm": {
467 "deps": [ "Cast" ],
468 "files": {
469 "common": [
470 "src/gpu/cl/kernels/gemm/ClGemmHelpers.cpp",
471 "src/gpu/cl/kernels/gemm/native/ClGemmDefaultConfigNativeBifrost.cpp",
472 "src/gpu/cl/kernels/gemm/native/ClGemmDefaultConfigNativeMidgard.cpp",
473 "src/gpu/cl/kernels/gemm/native/ClGemmDefaultConfigNativeValhall.cpp",
474 "src/gpu/cl/kernels/gemm/reshaped/ClGemmDefaultConfigReshapedBifrost.cpp",
475 "src/gpu/cl/kernels/gemm/reshaped/ClGemmDefaultConfigReshapedValhall.cpp",
476 "src/gpu/cl/kernels/gemm/reshaped_only_rhs/ClGemmDefaultConfigReshapedRhsOnlyBifrost.cpp",
477 "src/gpu/cl/kernels/gemm/reshaped_only_rhs/ClGemmDefaultConfigReshapedRhsOnlyValhall.cpp",
478 "src/gpu/cl/kernels/ClGemmLowpMatrixMultiplyNativeKernel.cpp",
479 "src/gpu/cl/kernels/ClGemmLowpMatrixMultiplyReshapedKernel.cpp",
480 "src/gpu/cl/kernels/ClGemmLowpMatrixMultiplyReshapedOnlyRhsKernel.cpp",
Freddie Liardete572dff2022-05-16 14:09:10 +0100481 "src/gpu/cl/kernels/ClGemmLowpMatrixMultiplyReshapedOnlyRhsMMULKernel.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100482 "src/gpu/cl/kernels/ClGemmLowpOffsetContributionKernel.cpp",
483 "src/gpu/cl/kernels/ClGemmLowpOffsetContributionOutputStageKernel.cpp",
484 "src/gpu/cl/kernels/ClGemmLowpQuantizeDownInt32ScaleByFixedPointKernel.cpp",
485 "src/gpu/cl/kernels/ClGemmLowpQuantizeDownInt32ScaleByFloatKernel.cpp",
486 "src/gpu/cl/kernels/ClGemmLowpQuantizeDownInt32ScaleKernel.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100487 "src/gpu/cl/kernels/ClGemmMatrixMultiplyNativeKernel.cpp",
Gunes Bayir4bfc70e2021-12-10 16:17:56 +0000488 "src/gpu/cl/kernels/ClGemmMatrixMultiplyReshapedOnlyRhsMMULKernel.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100489 "src/gpu/cl/kernels/ClGemmMatrixMultiplyReshapedKernel.cpp",
490 "src/gpu/cl/kernels/ClGemmMatrixMultiplyReshapedOnlyRhsKernel.cpp",
491 "src/gpu/cl/kernels/ClGemmReshapeLhsMatrixKernel.cpp",
492 "src/gpu/cl/kernels/ClGemmReshapeRhsMatrixKernel.cpp",
493 "src/gpu/cl/kernels/ClGemmLowpReductionKernel.cpp",
494 "src/gpu/cl/operators/ClGemm.cpp",
495 "src/gpu/cl/operators/ClGemmLowpMatrixMultiplyCore.cpp",
496 "src/gpu/cl/operators/ClGemmLowpOutputStage.cpp",
497 "src/runtime/CL/gemm/CLGEMMDefaultTypeBifrost.cpp",
498 "src/runtime/CL/gemm/CLGEMMDefaultTypeMidgard.cpp",
499 "src/runtime/CL/gemm/CLGEMMDefaultTypeValhall.cpp",
500 "src/runtime/CL/gemm_auto_heuristics/CLGEMMAutoHeuristics.cpp",
501 "src/runtime/CL/functions/CLGEMM.cpp",
502 "src/runtime/CL/functions/CLGEMMLowpMatrixMultiplyCore.cpp",
Ramy Elgammaldf6a3b02022-11-30 16:23:10 +0000503 "src/runtime/CL/functions/CLGEMMLowpOutputStage.cpp",
504 "src/runtime/heuristics/direct_conv/ClDirectConvDefaultConfigBifrost.cpp",
Gian Marco Iodicea5cb79f2022-12-28 13:53:51 +0000505 "src/runtime/heuristics/direct_conv/ClDirectConvDefaultConfigValhall.cpp",
Gian Marco Iodice9d3bd412022-12-30 09:45:00 +0000506 "src/runtime/heuristics/dwc_native/ClDWCNativeDefaultConfigBifrost.cpp",
507 "src/runtime/heuristics/dwc_native/ClDWCNativeDefaultConfigValhall.cpp",
508 "src/runtime/heuristics/dwc_native/ClDWCNativeHeuristicsHelpers.cpp",
Ramy Elgammal34a95d12023-05-11 18:23:44 +0100509 "src/runtime/heuristics/indirect_conv/ClIndirectConvDefaultConfigValhall.cpp"
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100510 ]
511 }
512 },
Ramy Elgammal2b6ebfe2023-03-09 21:15:37 +0000513 "MatMul": {
514 "files": {
515 "common": [
Gunes Bayir9d0c4de2023-04-13 18:22:58 +0100516 "src/gpu/cl/kernels/ClMatMulLowpNativeKernel.cpp",
Jakub Sujak1ed6a142023-04-13 21:14:42 +0100517 "src/gpu/cl/kernels/ClMatMulNativeKernel.cpp",
Ramy Elgammalf26ea2f2023-03-24 11:42:03 +0000518 "src/gpu/cl/operators/ClMatMul.cpp",
Ramy Elgammal34a95d12023-05-11 18:23:44 +0100519 "src/runtime/CL/functions/CLMatMul.cpp",
520 "src/runtime/heuristics/matmul_native/ClMatMulNativeDefaultConfigValhall.cpp",
521 "src/runtime/heuristics/matmul_native/ClMatMulNativeHelpers.cpp"
Ramy Elgammal2b6ebfe2023-03-09 21:15:37 +0000522 ]
523 }
524 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100525 "GenerateProposals": {
526 "deps": [ "BoundingBoxTransform", "Dequantize", "Pad", "Permute", "Quantize", "Reshape" ],
527 "files": {
528 "common": [
529 "src/core/CL/kernels/CLGenerateProposalsLayerKernel.cpp",
530 "src/runtime/CL/functions/CLGenerateProposalsLayer.cpp"
531 ]
532 }
533 },
534 "InstanceNormalize": {
535 "files": {
536 "common": [
537 "src/core/CL/kernels/CLInstanceNormalizationLayerKernel.cpp",
538 "src/runtime/CL/functions/CLInstanceNormalizationLayer.cpp"
539 ]
540 }
541 },
542 "L2Normalize": {
543 "deps": [ "Reduction" ],
544 "files": {
545 "common": [
546 "src/core/CL/kernels/CLL2NormalizeLayerKernel.cpp",
547 "src/runtime/CL/functions/CLL2NormalizeLayer.cpp"
548 ]
549 }
550 },
551 "Logical": {
552 "files": {
553 "common": [
554 "src/gpu/cl/operators/ClLogicalNot.cpp",
555 "src/runtime/CL/functions/CLLogicalAnd.cpp",
556 "src/runtime/CL/functions/CLLogicalNot.cpp",
557 "src/runtime/CL/functions/CLLogicalOr.cpp"
558 ]
559 }
560 },
561 "LSTM": {
562 "deps": [
563 "Activation",
564 "Concatenate",
565 "Copy",
566 "Dequantize",
567 "ElementwiseBinary",
568 "Fill",
569 "FullyConnected",
570 "Gemm",
571 "MeanStdDevNormalize",
572 "Mul",
573 "Quantize",
574 "Slice",
575 "Transpose"
576 ],
577 "files": {
578 "common": [
579 "src/core/CL/kernels/CLQLSTMLayerNormalizationKernel.cpp",
580 "src/runtime/CL/functions/CLQLSTMLayer.cpp",
581 "src/runtime/CL/functions/CLLSTMLayer.cpp",
582 "src/runtime/CL/functions/CLLSTMLayerQuantized.cpp"
583 ]
584 }
585 },
586 "MaxUnpool2d": {
587 "deps": [ "Fill" ],
588 "files": {
589 "common": [
590 "src/core/CL/kernels/CLMaxUnpoolingLayerKernel.cpp",
591 "src/runtime/CL/functions/CLMaxUnpoolingLayer.cpp"
592 ]
593 }
594 },
595 "MeanStdDevNormalize": {
596 "deps": [ "Reduction" ],
597 "files": {
598 "common": [
599 "src/core/CL/kernels/CLMeanStdDevNormalizationKernel.cpp",
600 "src/runtime/CL/functions/CLMeanStdDevNormalizationLayer.cpp",
601 "src/runtime/CL/functions/CLReduceMean.cpp"
602 ]
603 }
604 },
605 "Mul": {
606 "files": {
607 "common": [
608 "src/gpu/cl/kernels/ClMulKernel.cpp",
609 "src/gpu/cl/operators/ClMul.cpp",
610 "src/runtime/CL/functions/CLPixelWiseMultiplication.cpp"
611 ]
612 }
613 },
614 "Normalize": {
615 "files": {
616 "common": [
617 "src/core/CL/kernels/CLNormalizationLayerKernel.cpp",
618 "src/runtime/CL/functions/CLNormalizationLayer.cpp"
619 ]
620 }
621 },
622 "Pad": {
623 "deps": [ "Copy" ],
624 "files": {
625 "common": [
626 "src/core/CL/kernels/CLPadLayerKernel.cpp",
627 "src/runtime/CL/functions/CLPadLayer.cpp"
628 ]
629 }
630 },
631 "Permute": {
632 "files": {
633 "common": [
634 "src/gpu/cl/kernels/ClPermuteKernel.cpp",
635 "src/gpu/cl/operators/ClPermute.cpp",
636 "src/runtime/CL/functions/CLPermute.cpp"
637 ]
638 }
639 },
640 "Pool2d": {
641 "files": {
642 "common": [
643 "src/gpu/cl/kernels/ClPool2dKernel.cpp",
644 "src/gpu/cl/operators/ClPool2d.cpp",
645 "src/runtime/CL/functions/CLPoolingLayer.cpp"
646 ]
647 }
648 },
ramelg0137515692022-02-26 22:06:20 +0000649 "Pool3d": {
650 "files": {
651 "common": [
652 "src/gpu/cl/kernels/ClPool3dKernel.cpp",
653 "src/gpu/cl/operators/ClPool3d.cpp",
654 "src/runtime/CL/functions/CLPooling3dLayer.cpp"
655 ]
656 }
657 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100658 "PRelu": {
659 "deps": [ "ElementwiseBinary" ],
660 "files": {
661 "common": [
662 "src/gpu/cl/operators/ClPRelu.cpp",
663 "src/runtime/CL/functions/CLPReluLayer.cpp"
664 ]
665 }
666 },
667 "PriorBox": {
668 "files": {
669 "common": [
670 "src/core/CL/kernels/CLPriorBoxLayerKernel.cpp",
671 "src/runtime/CL/functions/CLPriorBoxLayer.cpp"
672 ]
673 }
674 },
675 "Quantize": {
676 "files": {
677 "common": [
678 "src/gpu/cl/kernels/ClQuantizeKernel.cpp",
679 "src/gpu/cl/operators/ClQuantize.cpp",
680 "src/runtime/CL/functions/CLQuantizationLayer.cpp"
681 ]
682 }
683 },
684 "Range": {
685 "files": {
686 "common": [
687 "src/core/CL/kernels/CLRangeKernel.cpp",
688 "src/runtime/CL/functions/CLRange.cpp"
689 ]
690 }
691 },
692 "Reduction": {
693 "deps": [ "Reshape" ],
694 "files": {
ramelg01a1f78512022-06-29 16:28:10 +0100695 "common": [
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100696 "src/core/CL/kernels/CLReductionOperationKernel.cpp",
697 "src/runtime/CL/functions/CLReductionOperation.cpp"
698 ]
699 }
700 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100701 "Reorg": {
702 "files": {
703 "common": [
704 "src/core/CL/kernels/CLReorgLayerKernel.cpp",
705 "src/runtime/CL/functions/CLReorgLayer.cpp"
706 ]
707 }
708 },
709 "Reshape": {
710 "files": {
711 "common": [
712 "src/gpu/cl/kernels/ClReshapeKernel.cpp",
713 "src/gpu/cl/operators/ClReshape.cpp",
714 "src/runtime/CL/functions/CLReshapeLayer.cpp"
715 ]
716 }
717 },
718 "Reverse": {
719 "files": {
720 "common": [
721 "src/core/CL/kernels/CLReverseKernel.cpp",
722 "src/runtime/CL/functions/CLReverse.cpp"
723 ]
724 }
725 },
726 "RNN": {
727 "deps": [ "Activation", "Cast", "ElementwiseBinary", "FullyConnected", "Gemm"],
728 "files": {
729 "common": [ "src/runtime/CL/functions/CLRNNLayer.cpp" ]
730 }
731 },
732 "ROIAlign": {
733 "files": {
734 "common": [
735 "src/core/CL/kernels/CLROIAlignLayerKernel.cpp",
736 "src/runtime/CL/functions/CLROIAlignLayer.cpp"
737 ]
738 }
739 },
740 "ROIPool2d": {
741 "files": {
742 "common": [
743 "src/core/CL/kernels/CLROIPoolingLayerKernel.cpp",
744 "src/runtime/CL/functions/CLROIPoolingLayer.cpp"
745 ]
746 }
747 },
748 "Scale": {
749 "files": {
750 "common": [
751 "src/gpu/cl/kernels/ClScaleKernel.cpp",
752 "src/gpu/cl/operators/ClScale.cpp",
753 "src/runtime/CL/functions/CLScale.cpp"
754 ]
755 }
756 },
757 "Select": {
758 "files": {
759 "common": [
760 "src/core/CL/kernels/CLSelectKernel.cpp",
761 "src/runtime/CL/functions/CLSelect.cpp"
762 ]
763 }
764 },
765 "Slice": {
766 "deps": [ "StridedSlice" ],
767 "files": {
768 "common": [ "src/runtime/CL/functions/CLSlice.cpp" ]
769 }
770 },
771 "Softmax": {
772 "deps": [ "Permute" ],
773 "files": {
774 "common": [
775 "src/gpu/cl/kernels/ClSoftmaxKernel.cpp",
776 "src/gpu/cl/operators/ClSoftmax.cpp",
777 "src/runtime/CL/functions/CLSoftmaxLayer.cpp"
778 ]
779 }
780 },
781 "SpaceToBatch": {
782 "files": {
783 "common": [
784 "src/core/CL/kernels/CLSpaceToBatchLayerKernel.cpp",
785 "src/runtime/CL/functions/CLSpaceToBatchLayer.cpp"
786 ]
787 }
788 },
789 "SpaceToDepth": {
790 "files": {
791 "common": [
792 "src/core/CL/kernels/CLSpaceToDepthLayerKernel.cpp",
793 "src/runtime/CL/functions/CLSpaceToDepthLayer.cpp"
794 ]
795 }
796 },
797 "Split": {
798 "deps": [ "StridedSlice" ],
799 "files": {
800 "common": [ "src/runtime/CL/functions/CLSplit.cpp" ]
801 }
802 },
803 "Stack": {
804 "files": {
805 "common": [
806 "src/core/CL/kernels/CLStackLayerKernel.cpp",
807 "src/runtime/CL/functions/CLStackLayer.cpp"
808 ]
809 }
810 },
811 "StridedSlice": {
812 "files": {
813 "common": [
814 "src/core/CL/kernels/CLStridedSliceKernel.cpp",
815 "src/runtime/CL/functions/CLStridedSlice.cpp"
816 ]
817 }
818 },
819 "Sub": {
820 "files": {
821 "common": [
822 "src/gpu/cl/kernels/ClElementwiseKernel.cpp",
823 "src/gpu/cl/operators/ClSub.cpp"
824 ]
825 }
826 },
827 "Tile": {
828 "files": {
829 "common": [
830 "src/core/CL/kernels/CLTileKernel.cpp",
831 "src/runtime/CL/functions/CLTile.cpp"
832 ]
833 }
834 },
835 "Transpose": {
836 "files": {
837 "common": [
838 "src/gpu/cl/kernels/ClTransposeKernel.cpp",
839 "src/gpu/cl/operators/ClTranspose.cpp",
840 "src/runtime/CL/functions/CLTranspose.cpp"
841 ]
842 }
843 },
844 "Unstack": {
845 "deps": [ "StridedSlice" ],
846 "files": {
847 "common": [ "src/runtime/CL/functions/CLUnstack.cpp" ]
848 }
849 },
850 "YUVNormalize": {
851 "files": {
852 "common": [
853 "src/core/CL/kernels/CLNormalizePlanarYUVLayerKernel.cpp",
854 "src/runtime/CL/functions/CLNormalizePlanarYUVLayer.cpp"
855 ]
Michalis Spyrou20fca522021-06-07 14:23:57 +0100856 }
Georgios Pinitasbdcdc392021-04-22 16:42:03 +0100857 }
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100858 }
859},
Michalis Spyrou20fca522021-06-07 14:23:57 +0100860 "cpu": {
Georgios Pinitas13ef1762021-07-14 17:14:43 +0100861 "common": [
Michalis Spyrou20fca522021-06-07 14:23:57 +0100862 "src/cpu/CpuContext.cpp",
863 "src/cpu/CpuQueue.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100864 "src/cpu/CpuTensor.cpp",
865 "src/core/NEON/kernels/NEFillBorderKernel.cpp",
866 "src/runtime/NEON/INEOperator.cpp",
867 "src/runtime/NEON/INESimpleFunction.cpp",
868 "src/runtime/NEON/INESimpleFunctionNoBorder.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +0100869 ],
870 "operators": {
871 "Activation": {
Viet-Hoa Dofd472f02023-03-15 14:05:06 +0000872 "deps": [ "LUT" ],
Michalis Spyrou20fca522021-06-07 14:23:57 +0100873 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100874 "common": [
875 "src/cpu/operators/CpuActivation.cpp",
876 "src/cpu/kernels/CpuActivationKernel.cpp",
Dana Zlotnika538ae52022-02-21 13:12:41 +0200877 "src/runtime/NEON/functions/NEActivationLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +0100878 ],
Michalis Spyrou20fca522021-06-07 14:23:57 +0100879 "neon": {
Dana Zlotnik32291712021-11-25 09:58:27 +0200880 "fp16": [ "src/cpu/kernels/activation/generic/neon/fp16.cpp" ],
ramelg01c827e992022-04-08 03:52:28 +0100881 "fp32": [ "src/cpu/kernels/activation/generic/neon/fp32.cpp" ],
Viet-Hoa Do29db3d22022-08-10 11:56:49 +0100882 "qasymm8": [
883 "src/cpu/kernels/activation/generic/neon/qasymm8.cpp",
884 "src/cpu/kernels/activation/generic/neon/lut.cpp"
885 ],
886 "qasymm8_signed": [
887 "src/cpu/kernels/activation/generic/neon/qasymm8_signed.cpp",
888 "src/cpu/kernels/activation/generic/neon/lut.cpp"
889 ],
Dana Zlotnika538ae52022-02-21 13:12:41 +0200890 "qsymm16": [ "src/cpu/kernels/activation/generic/neon/qsymm16.cpp" ]
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100891 },
892 "sve": {
Dana Zlotnik32291712021-11-25 09:58:27 +0200893 "fp16": [ "src/cpu/kernels/activation/generic/sve/fp16.cpp" ],
SiCong Lic0463a22023-05-17 13:46:13 +0100894 "fp32": [ "src/cpu/kernels/activation/generic/sve/fp32.cpp" ]
ramelg01c827e992022-04-08 03:52:28 +0100895 },
alerah01c9e519d2022-01-31 19:04:10 +0200896 "sve2":{
SiCong Lic0463a22023-05-17 13:46:13 +0100897 "qasymm8": [
898 "src/cpu/kernels/activation/generic/sve2/qasymm8.cpp",
899 "src/cpu/kernels/activation/generic/sve2/lut.cpp"
900 ],
Dana Zlotnik32291712021-11-25 09:58:27 +0200901 "qasymm8_signed": [ "src/cpu/kernels/activation/generic/sve2/qasymm8_signed.cpp" ],
902 "qsymm16": [ "src/cpu/kernels/activation/generic/sve2/qsymm16.cpp" ]
Michalis Spyrou20fca522021-06-07 14:23:57 +0100903 }
904 }
905 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100906 "ArgMinMax": {
907 "deps": [ "Reduction" ],
908 "files": {
909 "common": [ "src/runtime/NEON/functions/NEArgMinMaxLayer.cpp" ]
910 }
911 },
Michalis Spyrou20fca522021-06-07 14:23:57 +0100912 "Add": {
913 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100914 "common": [
915 "src/cpu/operators/CpuAdd.cpp",
916 "src/cpu/kernels/CpuAddKernel.cpp",
Motti Gondabi9d9ad332022-01-23 12:42:24 +0200917 "src/runtime/NEON/functions/NEArithmeticAddition.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +0100918 ],
Dana Zlotnikbd2942d2021-11-15 08:46:04 +0200919 "neon": {
Motti Gondabi9d9ad332022-01-23 12:42:24 +0200920 "common": ["src/cpu/kernels/add/generic/neon/impl.cpp"],
Dana Zlotnikbd2942d2021-11-15 08:46:04 +0200921 "fp32":["src/cpu/kernels/add/generic/neon/fp32.cpp"],
922 "fp16":["src/cpu/kernels/add/generic/neon/fp16.cpp"],
Motti Gondabi9d9ad332022-01-23 12:42:24 +0200923 "integer":["src/cpu/kernels/add/generic/neon/integer.cpp"],
924 "qasymm8": ["src/cpu/kernels/add/generic/neon/qasymm8.cpp"],
925 "qasymm8_signed": ["src/cpu/kernels/add/generic/neon/qasymm8_signed.cpp"],
926 "qsymm16": ["src/cpu/kernels/add/generic/neon/qsymm16.cpp"]
Dana Zlotnikbd2942d2021-11-15 08:46:04 +0200927 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100928 "sve": {
Dana Zlotnikbd2942d2021-11-15 08:46:04 +0200929 "common": [ "src/cpu/kernels/add/generic/sve/impl.cpp" ],
Dana Zlotnikbd2942d2021-11-15 08:46:04 +0200930 "integer":["src/cpu/kernels/add/generic/sve/integer.cpp"],
Motti Gondabi9d9ad332022-01-23 12:42:24 +0200931 "fp32":["src/cpu/kernels/add/generic/sve/fp32.cpp"],
932 "fp16":["src/cpu/kernels/add/generic/sve/fp16.cpp"]
933 },
934 "sve2": {
Dana Zlotnikbd2942d2021-11-15 08:46:04 +0200935 "qasymm8": [ "src/cpu/kernels/add/generic/sve2/qasymm8.cpp" ],
936 "qasymm8_signed": [ "src/cpu/kernels/add/generic/sve2/qasymm8_signed.cpp" ],
937 "qsymm16": [ "src/cpu/kernels/add/generic/sve2/qsymm16.cpp" ]
Michalis Spyrou20fca522021-06-07 14:23:57 +0100938 }
939 }
940 },
Gunes Bayirae72a462023-01-29 13:24:24 +0000941 "AddMulAdd": {
942 "files": {
943 "common": [
944 "src/cpu/operators/CpuAddMulAdd.cpp",
945 "src/cpu/kernels/CpuAddMulAddKernel.cpp",
946 "src/runtime/NEON/functions/NEAddMulAdd.cpp"
947 ],
948 "neon": {
949 "fp32":["src/cpu/kernels/addmuladd/generic/neon/fp32.cpp"],
950 "fp16":["src/cpu/kernels/addmuladd/generic/neon/fp16.cpp"],
951 "qasymm8": ["src/cpu/kernels/addmuladd/generic/neon/qasymm8.cpp"],
952 "qasymm8_signed": ["src/cpu/kernels/addmuladd/generic/neon/qasymm8_signed.cpp"]
953 }
954 }
955 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100956 "BatchNormalize": {
Michalis Spyrou20fca522021-06-07 14:23:57 +0100957 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100958 "common": [
959 "src/core/NEON/kernels/NEBatchNormalizationLayerKernel.cpp",
960 "src/core/NEON/kernels/NEFuseBatchNormalizationKernel.cpp",
961 "src/runtime/NEON/functions/NEBatchNormalizationLayer.cpp",
962 "src/runtime/NEON/functions/NEFuseBatchNormalization.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +0100963 ],
Michalis Spyrou20fca522021-06-07 14:23:57 +0100964 "neon": {
Yair Schwarzbaum41a729e2021-11-15 20:42:47 +0200965 "common": [
966 "src/cpu/kernels/fuse_batch_normalization/generic/impl.cpp",
967 "src/cpu/kernels/fuse_batch_normalization/nchw/all.cpp",
968 "src/cpu/kernels/fuse_batch_normalization/nhwc/neon/impl.cpp"
969 ],
970 "fp16": [
971 "src/cpu/kernels/fuse_batch_normalization/generic/fp16.cpp",
972 "src/core/NEON/kernels/batchnormalization/impl/NEON/fp16.cpp",
973 "src/cpu/kernels/fuse_batch_normalization/nhwc/neon/fp16.cpp"
974 ],
975 "fp32": [
976 "src/cpu/kernels/fuse_batch_normalization/generic/fp32.cpp",
977 "src/core/NEON/kernels/batchnormalization/impl/NEON/fp32.cpp",
978 "src/cpu/kernels/fuse_batch_normalization/nhwc/neon/fp32.cpp"
979 ]
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100980 },
981 "sve": {
982 "fp16": [ "src/core/NEON/kernels/batchnormalization/impl/SVE/fp16.cpp" ],
983 "fp32": [ "src/core/NEON/kernels/batchnormalization/impl/SVE/fp32.cpp" ]
Michalis Spyrou20fca522021-06-07 14:23:57 +0100984 }
985 }
986 },
987 "BatchToSpace": {
988 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100989 "common": [
990 "src/core/NEON/kernels/NEBatchToSpaceLayerKernel.cpp",
991 "src/runtime/NEON/functions/NEBatchToSpaceLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +0100992 ]
993 }
994 },
995 "BitwiseAnd": {
996 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +0100997 "common": [
998 "src/core/NEON/kernels/NEBitwiseAndKernel.cpp",
999 "src/runtime/NEON/functions/NEBitwiseAnd.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001000 ]
1001 }
1002 },
1003 "BitwiseNot": {
1004 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001005 "common": [
1006 "src/core/NEON/kernels/NEBitwiseNotKernel.cpp",
1007 "src/runtime/NEON/functions/NEBitwiseNot.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001008 ]
1009 }
1010 },
1011 "BitwiseOr": {
1012 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001013 "common": [
1014 "src/core/NEON/kernels/NEBitwiseOrKernel.cpp",
1015 "src/runtime/NEON/functions/NEBitwiseOr.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001016 ]
1017 }
1018 },
1019 "BitwiseXor": {
1020 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001021 "common": [
1022 "src/core/NEON/kernels/NEBitwiseXorKernel.cpp",
1023 "src/runtime/NEON/functions/NEBitwiseXor.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001024 ]
1025 }
1026 },
1027 "BoundingBoxTransform": {
1028 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001029 "common": [
1030 "src/core/NEON/kernels/NEBoundingBoxTransformKernel.cpp",
1031 "src/runtime/NEON/functions/NEBoundingBoxTransform.cpp"
Dana Zlotnik3475ffe2022-01-03 14:37:10 +02001032 ],
1033 "neon":{
1034 "common":["src/cpu/kernels/boundingboxtransform/generic/neon/impl.cpp"],
1035 "fp32":["src/cpu/kernels/boundingboxtransform/generic/neon/fp32.cpp"],
1036 "fp16":["src/cpu/kernels/boundingboxtransform/generic/neon/fp16.cpp"],
1037 "qsymm16":["src/cpu/kernels/boundingboxtransform/generic/neon/qsymm16.cpp"]
Dana Zlotnik3475ffe2022-01-03 14:37:10 +02001038 }
Michalis Spyrou20fca522021-06-07 14:23:57 +01001039 }
1040 },
1041 "Cast": {
1042 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001043 "common": [
1044 "src/cpu/operators/CpuCast.cpp",
1045 "src/cpu/kernels/CpuCastKernel.cpp",
Yair Schwarzbaum298b2c02022-02-01 08:55:56 +02001046 "src/runtime/NEON/functions/NECast.cpp",
1047 "src/cpu/kernels/cast/generic/neon/bfloat16.cpp"
1048 ],
1049 "neon":{
1050 "fp16":["src/cpu/kernels/cast/generic/neon/fp16.cpp"]
1051 }
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001052 }
1053 },
1054 "ChannelShuffle": {
1055 "files": {
1056 "common": [
1057 "src/core/NEON/kernels/NEChannelShuffleLayerKernel.cpp",
1058 "src/runtime/NEON/functions/NEChannelShuffleLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001059 ]
1060 }
1061 },
1062 "Concatenate": {
1063 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001064 "common": [
1065 "src/cpu/operators/CpuConcatenate.cpp",
Georgios Pinitas7891a732021-08-20 21:39:25 +01001066 "src/cpu/kernels/CpuConcatenateWidthKernel.cpp",
1067 "src/cpu/kernels/CpuConcatenateBatchKernel.cpp",
1068 "src/cpu/kernels/CpuConcatenateDepthKernel.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001069 "src/cpu/kernels/CpuConcatenateHeightKernel.cpp",
1070 "src/runtime/NEON/functions/NEConcatenateLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001071 ]
1072 }
1073 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001074 "Conv2d": {
1075 "deps": [
1076 "Activation",
1077 "ElementwiseBinary",
1078 "FFT2D",
1079 "Gemm",
1080 "Mul",
1081 "Pad",
1082 "Permute",
1083 "Reshape",
1084 "Reverse",
1085 "Slice"
1086 ],
Michalis Spyrou20fca522021-06-07 14:23:57 +01001087 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001088 "common": [
1089 "src/cpu/operators/CpuConv2d.cpp",
1090 "src/cpu/operators/CpuDirectConv2d.cpp",
1091 "src/cpu/operators/CpuGemmDirectConv2d.cpp",
1092 "src/cpu/operators/CpuGemmConv2d.cpp",
1093 "src/cpu/operators/CpuWinogradConv2d.cpp",
1094 "src/cpu/operators/internal/CpuGemmAssemblyDispatch.cpp",
1095 "src/cpu/kernels/CpuDirectConv2dKernel.cpp",
1096 "src/cpu/kernels/CpuDirectConv2dOutputStageKernel.cpp",
1097 "src/cpu/kernels/CpuWinogradConv2dKernel.cpp",
1098 "src/cpu/kernels/CpuCol2ImKernel.cpp",
1099 "src/cpu/kernels/CpuIm2ColKernel.cpp",
1100 "src/cpu/kernels/CpuWeightsReshapeKernel.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001101 "src/runtime/NEON/functions/NEConvolutionLayer.cpp",
1102 "src/runtime/NEON/functions/NEDirectConvolutionLayer.cpp",
1103 "src/runtime/NEON/functions/NEFFTConvolutionLayer.cpp",
1104 "src/runtime/NEON/functions/NEGEMMConv2d.cpp",
1105 "src/runtime/NEON/functions/NEGEMMConvolutionLayer.cpp",
1106 "src/runtime/NEON/functions/NEWinogradConvolutionLayer.cpp"
Motti Gondabi9d9ad332022-01-23 12:42:24 +02001107 ],
1108 "neon": {
1109 "common": [
1110 "src/core/NEON/kernels/convolution/common/padding.cpp",
1111 "src/core/NEON/kernels/convolution/common/qasymm8.cpp",
1112 "src/core/NEON/kernels/convolution/common/qsymm8.cpp",
1113 "src/core/NEON/kernels/convolution/common/utils.cpp",
ramelg01a1f78512022-06-29 16:28:10 +01001114 "src/core/NEON/kernels/convolution/winograd/input_transforms_fp16.cpp",
1115 "src/core/NEON/kernels/convolution/winograd/input_transforms_fp32.cpp",
1116 "src/core/NEON/kernels/convolution/winograd/output_transforms_fp16.cpp",
1117 "src/core/NEON/kernels/convolution/winograd/output_transforms_fp32.cpp",
1118 "src/core/NEON/kernels/convolution/winograd/weight_transforms_fp16.cpp",
1119 "src/core/NEON/kernels/convolution/winograd/weight_transforms_fp32.cpp",
1120 "src/core/NEON/kernels/convolution/winograd/winograd_fp16.cpp",
1121 "src/core/NEON/kernels/convolution/winograd/winograd_fp32.cpp",
1122 "src/core/NEON/kernels/convolution/winograd/input_transforms/a64_fp16_6x6.cpp",
1123 "src/core/NEON/kernels/convolution/winograd/input_transforms/a64_fp32_6x6.cpp",
1124 "src/core/NEON/kernels/convolution/winograd/input_transforms/arm_fp32_1x8.cpp",
1125 "src/core/NEON/kernels/convolution/winograd/input_transforms/arm_fp32_4x4.cpp",
1126 "src/core/NEON/kernels/convolution/winograd/input_transforms/arm_fp32_6x6.cpp",
ramelg01a1f78512022-06-29 16:28:10 +01001127 "src/core/NEON/kernels/convolution/winograd/output_transforms/a64_fp16_4x4_3x3.cpp",
1128 "src/core/NEON/kernels/convolution/winograd/output_transforms/arm_fp32_1x2_1x7.cpp",
1129 "src/core/NEON/kernels/convolution/winograd/output_transforms/arm_fp32_1x4_1x5.cpp",
1130 "src/core/NEON/kernels/convolution/winograd/output_transforms/arm_fp32_1x6_1x3.cpp",
1131 "src/core/NEON/kernels/convolution/winograd/output_transforms/arm_fp32_2x2_3x3.cpp",
1132 "src/core/NEON/kernels/convolution/winograd/output_transforms/arm_fp32_2x2_5x5.cpp",
1133 "src/core/NEON/kernels/convolution/winograd/output_transforms/arm_fp32_4x4_3x3.cpp",
1134 "src/core/NEON/kernels/convolution/winograd/weight_transforms/a64_fp16_4x4_3x3.cpp",
1135 "src/core/NEON/kernels/convolution/winograd/weight_transforms/arm_fp32_2x2_3x3.cpp",
1136 "src/core/NEON/kernels/convolution/winograd/weight_transforms/arm_fp32_2x2_5x5.cpp",
1137 "src/core/NEON/kernels/convolution/winograd/weight_transforms/arm_fp32_4x4_3x3.cpp",
1138 "src/core/NEON/kernels/convolution/winograd/weight_transforms/cpp_fp32_1x2_1x7.cpp",
1139 "src/core/NEON/kernels/convolution/winograd/weight_transforms/cpp_fp32_1x4_1x5.cpp",
1140 "src/core/NEON/kernels/convolution/winograd/weight_transforms/cpp_fp32_1x6_1x3.cpp",
alerah01c9e519d2022-01-31 19:04:10 +02001141 "src/cpu/kernels/directconv2d/nhwc/neon/impl.cpp",
1142 "src/cpu/kernels/directconv2d/nchw/all.cpp"
1143 ],
1144 "fp32": [
1145 "src/cpu/kernels/directconv2d/nhwc/neon/fp32.cpp"
Motti Gondabi9d9ad332022-01-23 12:42:24 +02001146 ]
ramelg0199c46472022-07-15 13:08:39 +01001147 },
1148 "sve": {
Viet-Hoa Do03b29712022-06-01 11:47:14 +01001149 "common": [
1150 "src/core/NEON/kernels/convolution/winograd/input_transforms/sve_fp32_6x6.cpp",
1151 "src/core/NEON/kernels/convolution/winograd/input_transforms/sme_fp32_mla_6x6.cpp",
1152 "src/core/NEON/kernels/convolution/winograd/output_transforms/sme_fp32_mopa_4x4_3x3.cpp"
1153 ]
Motti Gondabi9d9ad332022-01-23 12:42:24 +02001154 }
Michalis Spyroub55f8e82021-07-22 11:23:11 +01001155 }
1156 },
Michalis Spyrou20fca522021-06-07 14:23:57 +01001157 "Copy": {
1158 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001159 "common": [
1160 "src/cpu/operators/CpuCopy.cpp",
1161 "src/cpu/kernels/CpuCopyKernel.cpp",
1162 "src/runtime/NEON/functions/NECopy.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001163 ]
1164 }
1165 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001166 "CropResize": {
1167 "deps": [ "Scale" ],
Michalis Spyrou20fca522021-06-07 14:23:57 +01001168 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001169 "common": [
1170 "src/core/NEON/kernels/NECropKernel.cpp",
1171 "src/runtime/NEON/functions/NECropResize.cpp"
alerah0127619932021-11-24 17:21:43 +02001172 ],
1173 "neon": {
1174 "common": [ "src/cpu/kernels/crop/generic/neon/impl.cpp" ],
1175 "fp32": [ "src/cpu/kernels/crop/generic/neon/fp32.cpp" ],
1176 "fp16": [ "src/cpu/kernels/crop/generic/neon/fp16.cpp" ],
1177 "integer": [ "src/cpu/kernels/crop/generic/neon/integer.cpp" ]
Motti Gondabi9d9ad332022-01-23 12:42:24 +02001178 }
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001179 }
1180 },
1181 "Deconv2d": {
1182 "deps": [ "Conv2d", "Reverse", "Transpose"],
1183 "files": {
1184 "common": [
1185 "src/runtime/NEON/functions/NEDeconvolutionLayer.cpp"
1186 ]
1187 }
1188 },
1189 "DepthConvert": {
1190 "deps": [ "Cast"],
1191 "files": {
1192 "common": [
1193 "src/runtime/NEON/functions/NEDepthConvertLayer.cpp"
1194 ]
1195 }
1196 },
1197 "DepthToSpace": {
1198 "files": {
1199 "common": [
1200 "src/core/NEON/kernels/NEDepthToSpaceLayerKernel.cpp",
1201 "src/runtime/NEON/functions/NEDepthToSpaceLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001202 ]
1203 }
1204 },
1205 "DepthwiseConv2d": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001206 "deps": [ "Activation", "Permute" ],
Michalis Spyrou20fca522021-06-07 14:23:57 +01001207 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001208 "common": [
Georgios Pinitas7891a732021-08-20 21:39:25 +01001209 "src/cpu/operators/CpuDepthwiseConv2d.cpp",
1210 "src/cpu/operators/CpuDepthwiseConv2dAssemblyDispatch.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001211 "src/cpu/kernels/CpuDepthwiseConv2dNativeKernel.cpp",
1212 "src/cpu/kernels/internal/CpuDepthwiseConv2dAssemblyWrapperKernel.cpp",
Motti Gondabi9d9ad332022-01-23 12:42:24 +02001213 "src/runtime/NEON/functions/NEDepthwiseConvolutionLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001214 ],
Motti Gondabi9d9ad332022-01-23 12:42:24 +02001215 "neon": {
1216 "common": [
1217 "src/core/NEON/kernels/convolution/common/padding.cpp",
1218 "src/core/NEON/kernels/convolution/common/qasymm8.cpp",
1219 "src/core/NEON/kernels/convolution/common/qsymm8.cpp",
1220 "src/core/NEON/kernels/convolution/common/utils.cpp",
ramelg01c827e992022-04-08 03:52:28 +01001221 "src/core/NEON/kernels/arm_conv/addressing.cpp",
Pablo Marquez Tello4e2bbbb2023-01-09 17:21:01 +00001222 "src/core/NEON/kernels/arm_conv/depthwise/depthwise_common.cpp",
ramelg018a164882022-04-07 02:42:52 +01001223 "src/core/NEON/kernels/arm_conv/depthwise/depthwise_strategies_common.cpp",
Motti Gondabi9d9ad332022-01-23 12:42:24 +02001224 "src/core/NEON/kernels/arm_conv/depthwise/depthwise_u8q.cpp",
1225 "src/core/NEON/kernels/arm_conv/depthwise/depthwise_u8s8u8q.cpp",
Motti Gondabi9d9ad332022-01-23 12:42:24 +02001226 "src/core/NEON/kernels/arm_conv/depthwise/depthwise_s8q.cpp",
1227 "src/core/NEON/kernels/arm_conv/depthwise/depthwise_fp32.cpp",
1228 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_packed_to_nhwc_generic_with_multiplier_output2x8_mla_depthfirst/generic.cpp",
1229 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_packed_to_nhwc_3x3_s2_with_multiplier_output3x3_mla_depthfirst/generic.cpp",
1230 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_packed_to_nhwc_5x5_s1_with_multiplier_output2x4_mla_depthfirst/generic.cpp",
1231 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_packed_to_nhwc_generic_with_multiplier_output2x8_mla_depthfirst/generic.cpp",
1232 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_s8q_packed_to_nhwc_3x3_s2_with_multiplier_output2x4_dot_depthfirst/generic.cpp",
1233 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_s8q_packed_to_nhwc_5x5_s1_with_multiplier_output4x2_dot_depthfirst/generic.cpp",
1234 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_s8q_packed_to_nhwc_generic_with_multiplier_output2x8_mla_depthfirst/generic.cpp",
1235 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8q_packed_to_nhwc_3x3_s2_with_multiplier_output2x4_dot_depthfirst/generic.cpp",
1236 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8q_packed_to_nhwc_5x5_s1_with_multiplier_output4x2_dot_depthfirst/generic.cpp",
1237 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8q_packed_to_nhwc_generic_with_multiplier_output2x8_mla_depthfirst/generic.cpp",
1238 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8s8u8q_packed_to_nhwc_generic_with_multiplier_output2x8_mla_depthfirst/generic.cpp",
ramelg018a164882022-04-07 02:42:52 +01001239 "src/core/NEON/kernels/arm_conv/depthwise/depthwise_fp16.cpp",
Motti Gondabi9d9ad332022-01-23 12:42:24 +02001240 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_nhwc_3x3_s1_output2x2_mla_depthfirst/generic_direct.cpp",
1241 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_nhwc_3x3_s1_output2x2_mla_depthfirst/generic_indirect.cpp",
1242 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_nhwc_3x3_s1_output3x3_mla_depthfirst/generic_direct.cpp",
1243 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_nhwc_3x3_s1_output3x3_mla_depthfirst/generic_indirect.cpp",
1244 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_nhwc_3x3_s1_output4x4_mla_depthfirst/generic_direct.cpp",
1245 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_nhwc_3x3_s1_output4x4_mla_depthfirst/generic_indirect.cpp",
1246 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_nhwc_3x3_s2_output2x2_mla_depthfirst/generic_direct.cpp",
1247 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_nhwc_3x3_s2_output2x2_mla_depthfirst/generic_indirect.cpp",
1248 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_nhwc_5x5_s1_output2x2_mla_depthfirst/generic_direct.cpp",
1249 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_nhwc_5x5_s1_output2x2_mla_depthfirst/generic_indirect.cpp",
1250 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_nhwc_generic_output9_mla_depthfirst/generic.cpp",
1251 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_nhwc_3x3_s1_output2x2_mla_depthfirst/generic_direct.cpp",
1252 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_nhwc_3x3_s1_output2x2_mla_depthfirst/generic_indirect.cpp",
1253 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_nhwc_3x3_s1_output3x3_mla_depthfirst/generic_direct.cpp",
1254 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_nhwc_3x3_s1_output3x3_mla_depthfirst/generic_indirect.cpp",
1255 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_nhwc_3x3_s1_output4x4_mla_depthfirst/generic_direct.cpp",
1256 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_nhwc_3x3_s1_output4x4_mla_depthfirst/generic_indirect.cpp",
1257 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_nhwc_3x3_s2_output2x2_mla_depthfirst/generic_direct.cpp",
1258 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_nhwc_3x3_s2_output2x2_mla_depthfirst/generic_indirect.cpp",
1259 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_nhwc_5x5_s1_output2x2_mla_depthfirst/generic_direct.cpp",
1260 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_nhwc_5x5_s1_output2x2_mla_depthfirst/generic_indirect.cpp",
1261 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_nhwc_generic_output9_mla_depthfirst/generic.cpp",
1262 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_s8q_nhwc_3x3_s1_output2x2_dot_depthfirst/generic.cpp",
1263 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_s8q_nhwc_3x3_s1_output2x2_mla_depthfirst/generic.cpp",
1264 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_s8q_nhwc_3x3_s2_output2x2_mla_depthfirst/generic.cpp",
1265 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_s8q_nhwc_5x5_s1_output2x2_mla_depthfirst/generic.cpp",
1266 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_s8q_nhwc_generic_output9_mla_depthfirst/generic.cpp",
1267 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_s8qs_nhwc_3x3_s1_output2x2_dot_depthfirst/generic.cpp",
1268 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8q_nhwc_3x3_s1_output2x2_dot_depthfirst/generic.cpp",
1269 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8q_nhwc_3x3_s1_output2x2_mla_depthfirst/generic.cpp",
1270 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8q_nhwc_3x3_s2_output2x2_mla_depthfirst/generic.cpp",
1271 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8q_nhwc_5x5_s1_output2x2_mla_depthfirst/generic.cpp",
1272 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8q_nhwc_generic_output9_mla_depthfirst/generic.cpp",
1273 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8s8u8q_nhwc_3x3_s1_output2x2_mla_depthfirst/generic.cpp",
1274 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8s8u8q_nhwc_3x3_s2_output2x2_mla_depthfirst/generic.cpp",
1275 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8s8u8q_nhwc_5x5_s1_output2x2_mla_depthfirst/generic.cpp",
1276 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8s8u8q_nhwc_generic_output9_mla_depthfirst/generic.cpp",
ramelg018a164882022-04-07 02:42:52 +01001277 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8qa_nhwc_3x3_s1_output2x2_mla_depthfirst/generic.cpp",
1278 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8qa_nhwc_3x3_s2_output2x2_mla_depthfirst/generic.cpp",
1279 "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8qa_nhwc_5x5_s1_output2x2_mla_depthfirst/generic.cpp",
Motti Gondabi9d9ad332022-01-23 12:42:24 +02001280 "src/core/NEON/kernels/arm_conv/depthwise/interleaves/a64_s8q_3x3_dot.cpp",
ramelg01c827e992022-04-08 03:52:28 +01001281 "src/core/NEON/kernels/arm_conv/depthwise/interleaves/a64_u8q_3x3_dot.cpp",
ramelg018a164882022-04-07 02:42:52 +01001282 "src/core/NEON/kernels/arm_conv/depthwise/interleaves/generic.cpp",
1283 "src/core/NEON/kernels/arm_conv/depthwise/interleaves/generic_quantized_dot_product.cpp",
Dana Zlotnikebbae942022-02-03 12:52:15 +02001284 "src/cpu/kernels/depthwiseconv2d/generic/neon/impl.cpp"
ramelg01a1f78512022-06-29 16:28:10 +01001285 ],
Dana Zlotnikebbae942022-02-03 12:52:15 +02001286 "fp16":["src/cpu/kernels/depthwiseconv2d/generic/neon/fp16.cpp"],
ramelg01a1f78512022-06-29 16:28:10 +01001287 "fp32":["src/cpu/kernels/depthwiseconv2d/generic/neon/fp32.cpp"],
1288 "qasymm8":["src/cpu/kernels/depthwiseconv2d/generic/neon/qasymm8.cpp"],
Dana Zlotnikebbae942022-02-03 12:52:15 +02001289 "qasymm8_signed":["src/cpu/kernels/depthwiseconv2d/generic/neon/qasymm8_signed.cpp"]
Motti Gondabi9d9ad332022-01-23 12:42:24 +02001290 },
Michalis Spyrou20fca522021-06-07 14:23:57 +01001291 "sve": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001292 "common": [
Michalis Spyrou20fca522021-06-07 14:23:57 +01001293 "src/core/NEON/kernels/arm_conv/depthwise/interleaves/sve_s8q_3x3_dot.cpp",
1294 "src/core/NEON/kernels/arm_conv/depthwise/interleaves/sve_u8q_3x3_dot.cpp",
1295 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp16_nhwc_3x3_s1_output2x2_mla_depthfirst/generic_direct.cpp",
1296 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp16_nhwc_3x3_s1_output2x2_mla_depthfirst/generic_indirect.cpp",
1297 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp16_nhwc_3x3_s1_output3x3_mla_depthfirst/generic_direct.cpp",
1298 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp16_nhwc_3x3_s1_output3x3_mla_depthfirst/generic_indirect.cpp",
1299 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp16_nhwc_3x3_s1_output4x4_mla_depthfirst/generic_direct.cpp",
1300 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp16_nhwc_3x3_s1_output4x4_mla_depthfirst/generic_indirect.cpp",
1301 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp16_nhwc_3x3_s2_output2x2_mla_depthfirst/generic_direct.cpp",
1302 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp16_nhwc_3x3_s2_output2x2_mla_depthfirst/generic_indirect.cpp",
1303 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp16_nhwc_5x5_s1_output2x2_mla_depthfirst/generic_direct.cpp",
1304 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp16_nhwc_5x5_s1_output2x2_mla_depthfirst/generic_indirect.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +01001305 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_nhwc_3x3_s1_output2x2_mla_depthfirst/generic_direct.cpp",
1306 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_nhwc_3x3_s1_output2x2_mla_depthfirst/generic_indirect.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +01001307 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_nhwc_3x3_s1_output3x3_mla_depthfirst/generic_direct.cpp",
1308 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_nhwc_3x3_s1_output3x3_mla_depthfirst/generic_indirect.cpp",
1309 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_nhwc_3x3_s1_output4x4_mla_depthfirst/generic_direct.cpp",
1310 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_nhwc_3x3_s1_output4x4_mla_depthfirst/generic_indirect.cpp",
1311 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_nhwc_3x3_s2_output2x2_mla_depthfirst/generic_direct.cpp",
1312 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_nhwc_3x3_s2_output2x2_mla_depthfirst/generic_indirect.cpp",
1313 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_nhwc_5x5_s1_output2x2_mla_depthfirst/generic_direct.cpp",
1314 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_nhwc_5x5_s1_output2x2_mla_depthfirst/generic_indirect.cpp",
1315 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_nhwc_generic_output9_mla_depthfirst/generic.cpp",
1316 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_packed_to_nhwc_3x3_s2_with_multiplier_output3x3_mla_depthfirst/generic.cpp",
1317 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_packed_to_nhwc_5x5_s1_with_multiplier_output2x4_mla_depthfirst/generic.cpp",
1318 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_packed_to_nhwc_generic_with_multiplier_output2x8_mla_depthfirst/generic.cpp",
1319 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_s8q_nhwc_3x3_s1_output2x2_dot_depthfirst/generic.cpp",
1320 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_s8q_nhwc_3x3_s1_output2x2_mla_depthfirst/generic.cpp",
1321 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_s8q_nhwc_3x3_s2_output2x2_mla_depthfirst/generic.cpp",
1322 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_s8q_nhwc_5x5_s1_output2x2_mla_depthfirst/generic.cpp",
1323 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_s8q_packed_to_nhwc_3x3_s2_with_multiplier_output2x4_dot_depthfirst/generic.cpp",
1324 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_s8q_packed_to_nhwc_5x5_s1_with_multiplier_output4x2_dot_depthfirst/generic.cpp",
1325 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_s8qs_nhwc_3x3_s1_output2x2_dot_depthfirst/generic.cpp",
1326 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_u8q_nhwc_3x3_s1_output2x2_dot_depthfirst/generic.cpp",
1327 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_u8q_nhwc_3x3_s1_output2x2_mla_depthfirst/generic.cpp",
1328 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_u8q_nhwc_3x3_s2_output2x2_mla_depthfirst/generic.cpp",
1329 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_u8q_nhwc_5x5_s1_output2x2_mla_depthfirst/generic.cpp",
1330 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_u8q_packed_to_nhwc_3x3_s2_with_multiplier_output2x4_dot_depthfirst/generic.cpp",
1331 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_u8q_packed_to_nhwc_5x5_s1_with_multiplier_output4x2_dot_depthfirst/generic.cpp",
1332 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_u8s8u8q_nhwc_3x3_s1_output2x2_mla_depthfirst/generic.cpp",
1333 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_u8s8u8q_nhwc_3x3_s2_output2x2_mla_depthfirst/generic.cpp",
Viet-Hoa Do03b29712022-06-01 11:47:14 +01001334 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_u8s8u8q_nhwc_5x5_s1_output2x2_mla_depthfirst/generic.cpp",
David Mansellb2758f32023-03-30 19:10:52 +01001335 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp16_nhwc_3x3_s1_output2x2_mla_depthfirst/generic_direct.cpp",
1336 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp16_nhwc_3x3_s1_output2x2_mla_depthfirst/generic_indirect.cpp",
1337 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp16_nhwc_3x3_s1_output3x3_mla_depthfirst/generic_direct.cpp",
1338 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp16_nhwc_3x3_s1_output3x3_mla_depthfirst/generic_indirect.cpp",
1339 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp16_nhwc_3x3_s1_output4x4_mla_depthfirst/generic_direct.cpp",
1340 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp16_nhwc_3x3_s1_output4x4_mla_depthfirst/generic_indirect.cpp",
1341 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp16_nhwc_3x3_s2_output2x2_mla_depthfirst/generic_direct.cpp",
1342 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp16_nhwc_3x3_s2_output2x2_mla_depthfirst/generic_indirect.cpp",
1343 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp16_nhwc_5x5_s1_output2x2_mla_depthfirst/generic_direct.cpp",
1344 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp16_nhwc_5x5_s1_output2x2_mla_depthfirst/generic_indirect.cpp",
Viet-Hoa Do03b29712022-06-01 11:47:14 +01001345 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32_nhwc_3x3_s1_output2x2_mla_depthfirst/generic_direct.cpp",
1346 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32_nhwc_3x3_s1_output2x2_mla_depthfirst/generic_indirect.cpp",
1347 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32_nhwc_3x3_s1_output3x3_mla_depthfirst/generic_direct.cpp",
1348 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32_nhwc_3x3_s1_output3x3_mla_depthfirst/generic_indirect.cpp",
1349 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32_nhwc_3x3_s1_output4x4_mla_depthfirst/generic_direct.cpp",
1350 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32_nhwc_3x3_s1_output4x4_mla_depthfirst/generic_indirect.cpp",
1351 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32_nhwc_3x3_s2_output2x2_mla_depthfirst/generic_direct.cpp",
1352 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32_nhwc_3x3_s2_output2x2_mla_depthfirst/generic_indirect.cpp",
1353 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32_planar_3x3_s1_4rows_mla_za/generic.cpp",
1354 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32_planar_3x3_s2_4rows_mla_za/generic.cpp",
1355 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32_planar_5x5_s1_4rows_mla_za/generic.cpp",
1356 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32_planar_5x5_s2_4rows_mla_za/generic.cpp",
1357 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32bf16fp32_planar_3x3_s1_4rows_dot_za/generic.cpp",
1358 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32bf16fp32_planar_3x3_s2_4rows_dot_za/generic.cpp",
1359 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32bf16fp32_planar_5x5_s1_4rows_dot_za/generic.cpp",
1360 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32bf16fp32_planar_5x5_s2_4rows_dot_za/generic.cpp",
1361 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_s8q_planar_3x3_s1_4rows_dot_za/generic.cpp",
Viet-Hoa Do03b29712022-06-01 11:47:14 +01001362 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_s8q_planar_3x3_s2_4rows_dot_za/generic.cpp",
1363 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_s8q_planar_5x5_s1_4rows_dot_za/generic.cpp",
1364 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_s8q_planar_5x5_s2_4rows_dot_za/generic.cpp",
1365 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_u8q_planar_3x3_s1_4rows_dot_za/generic.cpp",
Viet-Hoa Do03b29712022-06-01 11:47:14 +01001366 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_u8q_planar_3x3_s2_4rows_dot_za/generic.cpp",
1367 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_u8q_planar_5x5_s1_4rows_dot_za/generic.cpp",
1368 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_u8q_planar_5x5_s2_4rows_dot_za/generic.cpp",
1369 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_u8s8u8q_planar_3x3_s1_4rows_dot_za/generic.cpp",
Viet-Hoa Do03b29712022-06-01 11:47:14 +01001370 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_u8s8u8q_planar_3x3_s2_4rows_dot_za/generic.cpp",
1371 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_u8s8u8q_planar_5x5_s1_4rows_dot_za/generic.cpp",
1372 "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_u8s8u8q_planar_5x5_s2_4rows_dot_za/generic.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001373 ]
1374 }
1375 }
1376 },
Michalis Spyrou20fca522021-06-07 14:23:57 +01001377 "Dequantize": {
1378 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001379 "common": [
1380 "src/cpu/operators/CpuDequantize.cpp",
1381 "src/cpu/kernels/CpuDequantizeKernel.cpp",
1382 "src/runtime/NEON/functions/NEDequantizationLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001383 ]
1384 }
1385 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001386 "DetectionPostProcess": {
1387 "deps": [ "Dequantize" ],
Michalis Spyrou20fca522021-06-07 14:23:57 +01001388 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001389 "common" : [ "src/runtime/NEON/functions/NEDetectionPostProcessLayer.cpp" ]
Michalis Spyrou20fca522021-06-07 14:23:57 +01001390 }
1391 },
Sheri Zhang6d9c9822021-09-24 16:02:57 +01001392 "Conv3d": {
1393 "deps": [
1394 "Activation"
1395 ],
1396 "files": {
1397 "common": [
1398 "src/cpu/operators/CpuDirectConv3d.cpp",
1399 "src/cpu/kernels/CpuDirectConv3dKernel.cpp",
1400 "src/runtime/NEON/functions/NEConv3D.cpp"
1401 ]
1402 }
1403 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001404 "ElementwiseBinary": {
Michalis Spyrou20fca522021-06-07 14:23:57 +01001405 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001406 "common": [
1407 "src/cpu/operators/CpuElementwise.cpp",
1408 "src/cpu/kernels/CpuElementwiseKernel.cpp",
Dana Zlotnik6a2df882022-01-17 09:54:26 +02001409 "src/runtime/NEON/functions/NEElementwiseOperations.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001410 ],
Dana Zlotnikd5c496d2021-11-28 14:46:12 +02001411 "neon":{
1412 "fp32": ["src/cpu/kernels/elementwise_binary/generic/neon/fp32.cpp"],
1413 "fp16": ["src/cpu/kernels/elementwise_binary/generic/neon/fp16.cpp"],
Dana Zlotnik6a2df882022-01-17 09:54:26 +02001414 "integer": ["src/cpu/kernels/elementwise_binary/generic/neon/integer.cpp"],
1415 "qasymm8": ["src/cpu/kernels/elementwise_binary/generic/neon/qasymm8.cpp"],
1416 "qasymm8_signed": ["src/cpu/kernels/elementwise_binary/generic/neon/qasymm8_signed.cpp"]
Dana Zlotnikd5c496d2021-11-28 14:46:12 +02001417 },
Michalis Spyrou20fca522021-06-07 14:23:57 +01001418 "sve": {
Dana Zlotnikd5c496d2021-11-28 14:46:12 +02001419 "common": ["src/cpu/kernels/elementwise_binary/generic/sve/impl.cpp" ],
1420 "integer": ["src/cpu/kernels/elementwise_binary/generic/sve/integer.cpp"],
1421 "fp32": ["src/cpu/kernels/elementwise_binary/generic/sve/fp32.cpp"],
Dana Zlotnik6a2df882022-01-17 09:54:26 +02001422 "fp16": ["src/cpu/kernels/elementwise_binary/generic/sve/fp16.cpp"]
1423
ramelg01a1f78512022-06-29 16:28:10 +01001424 },
Dana Zlotnik6a2df882022-01-17 09:54:26 +02001425 "sve2":{
Dana Zlotnikd5c496d2021-11-28 14:46:12 +02001426 "qasymm8": ["src/cpu/kernels/elementwise_binary/generic/sve2/qasymm8.cpp"],
1427 "qasymm8_signed": ["src/cpu/kernels/elementwise_binary/generic/sve2/qasymm8_signed.cpp"]
Michalis Spyrou20fca522021-06-07 14:23:57 +01001428 }
1429 }
1430 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001431 "ElementwiseUnary":{
Viet-Hoa Dofd472f02023-03-15 14:05:06 +00001432 "deps": [ "LUT" ],
Michalis Spyrou20fca522021-06-07 14:23:57 +01001433 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001434 "common": [
1435 "src/cpu/operators/CpuElementwiseUnary.cpp",
1436 "src/cpu/kernels/CpuElementwiseUnaryKernel.cpp",
1437 "src/runtime/NEON/functions/NEElementwiseUnaryLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001438 ],
Dana Zlotnikd5c496d2021-11-28 14:46:12 +02001439 "neon": {
Dana Zlotnika538ae52022-02-21 13:12:41 +02001440 "common":["src/cpu/kernels/elementwise_unary/generic/neon/impl.cpp"],
Dana Zlotnikd5c496d2021-11-28 14:46:12 +02001441 "integer": ["src/cpu/kernels/elementwise_unary/generic/neon/integer.cpp"],
1442 "fp32": ["src/cpu/kernels/elementwise_unary/generic/neon/fp32.cpp"],
Viet-Hoa Dofd472f02023-03-15 14:05:06 +00001443 "fp16": ["src/cpu/kernels/elementwise_unary/generic/neon/fp16.cpp"],
Ramy Elgammal8b7f42a2023-03-31 16:16:15 +01001444 "qasymm8": [
1445 "src/cpu/kernels/elementwise_unary/generic/neon/q8.cpp",
1446 "src/cpu/kernels/elementwise_unary/generic/neon/qasymm8.cpp"
1447 ],
1448 "qasymm8_signed": [
1449 "src/cpu/kernels/elementwise_unary/generic/neon/q8.cpp",
1450 "src/cpu/kernels/elementwise_unary/generic/neon/qasymm8_signed.cpp"
1451 ]
Dana Zlotnikd5c496d2021-11-28 14:46:12 +02001452 },
Michalis Spyrou20fca522021-06-07 14:23:57 +01001453 "sve": {
Dana Zlotnikd5c496d2021-11-28 14:46:12 +02001454 "common": ["src/cpu/kernels/elementwise_unary/generic/sve/impl.cpp" ],
1455 "integer": ["src/cpu/kernels/elementwise_unary/generic/sve/integer.cpp"],
1456 "fp32": ["src/cpu/kernels/elementwise_unary/generic/sve/fp32.cpp"],
SiCong Lic0463a22023-05-17 13:46:13 +01001457 "fp16": ["src/cpu/kernels/elementwise_unary/generic/sve/fp16.cpp"]
1458 },
1459 "sve2": {
1460 "qasymm8": ["src/cpu/kernels/elementwise_unary/generic/sve2/q8.cpp"],
1461 "qasymm8_signed": ["src/cpu/kernels/elementwise_unary/generic/sve2/q8.cpp"]
Michalis Spyrou20fca522021-06-07 14:23:57 +01001462 }
1463 }
1464 },
1465 "FFT1D": {
Freddie Liardet487d3902021-09-21 12:36:43 +01001466 "deps": [ "Reduction" ],
Michalis Spyrou20fca522021-06-07 14:23:57 +01001467 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001468 "common": [
Michalis Spyrou20fca522021-06-07 14:23:57 +01001469 "src/core/NEON/kernels/NEFFTDigitReverseKernel.cpp",
1470 "src/core/NEON/kernels/NEFFTRadixStageKernel.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001471 "src/core/NEON/kernels/NEFFTScaleKernel.cpp",
1472 "src/runtime/NEON/functions/NEFFT1D.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001473 ]
1474 }
1475 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001476 "FFT2D": {
1477 "deps": [ "FFT1D" ],
Michalis Spyrou20fca522021-06-07 14:23:57 +01001478 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001479 "common": [
1480 "src/runtime/NEON/functions/NEFFT2D.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001481 ]
1482 }
1483 },
1484 "Fill": {
1485 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001486 "common": [
1487 "src/cpu/operators/CpuFill.cpp",
1488 "src/cpu/kernels/CpuFillKernel.cpp",
1489 "src/runtime/NEON/functions/NEFill.cpp"
1490 ]
1491 }
1492 },
1493 "Flatten": {
 1494 "deps": [ "Reshape" ],
1495 "files": {
1496 "common": [
1497 "src/cpu/operators/CpuFlatten.cpp",
1498 "src/runtime/NEON/functions/NEFlattenLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001499 ]
1500 }
1501 },
1502 "Floor": {
1503 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001504 "common": [
1505 "src/cpu/operators/CpuFloor.cpp",
1506 "src/cpu/kernels/CpuFloorKernel.cpp",
1507 "src/runtime/NEON/functions/NEFloor.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001508 ],
1509 "neon": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001510 "fp32": [ "src/cpu/kernels/floor/neon/fp32.cpp" ],
1511 "fp16": [ "src/cpu/kernels/floor/neon/fp16.cpp" ]
Michalis Spyrou20fca522021-06-07 14:23:57 +01001512 }
1513 }
1514 },
Michele Di Giorgiod9cdf142021-07-02 15:17:08 +01001515 "FullyConnected": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001516 "deps": [ "Flatten", "Gemm", "Transpose"],
Michele Di Giorgiod9cdf142021-07-02 15:17:08 +01001517 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001518 "common": [
1519 "src/cpu/kernels/CpuConvertFullyConnectedWeightsKernel.cpp",
1520 "src/cpu/operators/CpuConvertFullyConnectedWeights.cpp",
1521 "src/cpu/operators/CpuFullyConnected.cpp",
1522 "src/runtime/NEON/functions/NEConvertFullyConnectedWeights.cpp",
1523 "src/runtime/NEON/functions/NEFullyConnectedLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001524 ]
1525 }
1526 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001527 "Gather": {
Michalis Spyrou20fca522021-06-07 14:23:57 +01001528 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001529 "common": [
1530 "src/core/NEON/kernels/NEGatherKernel.cpp",
1531 "src/runtime/NEON/functions/NEGather.cpp"
1532 ]
1533 }
1534 },
1535 "Gemm": {
Freddie Liardet487d3902021-09-21 12:36:43 +01001536 "deps": [ "Quantize", "Add"],
Francesco.Petrogalli@arm.com5fcf22d2022-04-05 10:31:08 +00001537 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001538 "common": [
1539 "src/cpu/kernels/CpuConvertQuantizedSignednessKernel.cpp",
Georgios Pinitas7891a732021-08-20 21:39:25 +01001540 "src/cpu/kernels/CpuGemmMatrixAdditionKernel.cpp",
1541 "src/cpu/kernels/CpuGemmMatrixMultiplyKernel.cpp",
1542 "src/cpu/kernels/CpuGemmTranspose1xWKernel.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001543 "src/cpu/kernels/CpuGemmInterleave4x4Kernel.cpp",
Georgios Pinitas7891a732021-08-20 21:39:25 +01001544 "src/cpu/kernels/CpuGemmLowpQuantizeDownInt32ScaleKernel.cpp",
1545 "src/cpu/kernels/CpuGemmLowpQuantizeDownInt32ToInt16ScaleByFixedPointKernel.cpp",
1546 "src/cpu/kernels/CpuGemmLowpQuantizeDownInt32ToInt8ScaleByFixedPointKernel.cpp",
1547 "src/cpu/kernels/CpuGemmLowpQuantizeDownInt32ToUint8ScaleByFixedPointKernel.cpp",
1548 "src/cpu/kernels/CpuGemmLowpMatrixMultiplyKernel.cpp",
1549 "src/cpu/kernels/CpuGemmLowpMatrixReductionKernel.cpp",
1550 "src/cpu/kernels/CpuGemmLowpOffsetContributionOutputStageKernel.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001551 "src/cpu/kernels/CpuGemmLowpOffsetContributionKernel.cpp",
1552 "src/cpu/operators/CpuGemm.cpp",
1553 "src/cpu/operators/CpuGemmLowpOutputStage.cpp",
1554 "src/cpu/operators/CpuGemmLowpMatrixMultiplyCore.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001555 "src/runtime/NEON/functions/NEGEMM.cpp",
1556 "src/runtime/NEON/functions/NEGEMMLowpMatrixMultiplyCore.cpp",
Motti Gondabi9d9ad332022-01-23 12:42:24 +02001557 "src/runtime/NEON/functions/NEGEMMLowpOutputStage.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001558 ],
1559 "neon": {
Motti Gondabi9d9ad332022-01-23 12:42:24 +02001560 "common": [
1561 "src/core/NEON/kernels/arm_gemm/gemm_bf16.cpp",
1562 "src/core/NEON/kernels/arm_gemm/gemm_fp16.cpp",
1563 "src/core/NEON/kernels/arm_gemm/gemm_fp32.cpp",
1564 "src/core/NEON/kernels/arm_gemm/gemm_int16.cpp",
1565 "src/core/NEON/kernels/arm_gemm/gemm_int8.cpp",
1566 "src/core/NEON/kernels/arm_gemm/gemm_qint8.cpp",
1567 "src/core/NEON/kernels/arm_gemm/gemm_quint8.cpp",
1568 "src/core/NEON/kernels/arm_gemm/gemm_uint16.cpp",
1569 "src/core/NEON/kernels/arm_gemm/gemm_uint8.cpp",
1570 "src/core/NEON/kernels/arm_gemm/interleave_indirect.cpp",
1571 "src/core/NEON/kernels/arm_gemm/mergeresults-fp16.cpp",
1572 "src/core/NEON/kernels/arm_gemm/mergeresults.cpp",
1573 "src/core/NEON/kernels/arm_gemm/misc.cpp",
1574 "src/core/NEON/kernels/arm_gemm/quantized.cpp",
1575 "src/core/NEON/kernels/arm_gemm/rowsum_indirect_s8.cpp",
1576 "src/core/NEON/kernels/arm_gemm/rowsum_indirect_u8.cpp",
1577 "src/core/NEON/kernels/arm_gemm/transform.cpp",
1578 "src/core/NEON/kernels/arm_gemm/kernels/a64_gemm_s16_8x12/generic.cpp",
1579 "src/core/NEON/kernels/arm_gemm/kernels/a64_gemm_s8_4x4/generic.cpp",
1580 "src/core/NEON/kernels/arm_gemm/kernels/a64_gemm_s8_8x12/a55r1.cpp",
1581 "src/core/NEON/kernels/arm_gemm/kernels/a64_gemm_s8_8x12/generic.cpp",
1582 "src/core/NEON/kernels/arm_gemm/kernels/a64_gemm_s8_8x12/x1.cpp",
1583 "src/core/NEON/kernels/arm_gemm/kernels/a64_gemm_u16_8x12/generic.cpp",
1584 "src/core/NEON/kernels/arm_gemm/kernels/a64_gemm_u8_4x4/generic.cpp",
1585 "src/core/NEON/kernels/arm_gemm/kernels/a64_gemm_u8_8x12/a55r1.cpp",
1586 "src/core/NEON/kernels/arm_gemm/kernels/a64_gemm_u8_8x12/generic.cpp",
1587 "src/core/NEON/kernels/arm_gemm/kernels/a64_gemm_u8_8x12/x1.cpp",
1588 "src/core/NEON/kernels/arm_gemm/kernels/a64_hgemm_8x24/a55r1.cpp",
1589 "src/core/NEON/kernels/arm_gemm/kernels/a64_hgemm_8x24/generic.cpp",
1590 "src/core/NEON/kernels/arm_gemm/kernels/a64_hgemm_8x24/x1.cpp",
1591 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_bf16fp32_dot_6x16/generic.cpp",
1592 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_bf16fp32_mmla_6x16/generic.cpp",
1593 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_fp16_mla_6x32/a55.cpp",
1594 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_fp16_mla_6x32/generic.cpp",
1595 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_fp32_mla_4x24/a55.cpp",
1596 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_fp32_mla_4x24/generic.cpp",
1597 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_fp32_mla_6x16/a55.cpp",
1598 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_fp32_mla_6x16/generic.cpp",
1599 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_fp32_mla_8x4/a55.cpp",
1600 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_fp32_mla_8x4/generic.cpp",
1601 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_fp32bf16fp32_mmla_4x24/generic.cpp",
1602 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_fp32bf16fp32_mmla_6x16/generic.cpp",
1603 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_s8qa_dot_4x16/a55.cpp",
1604 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_s8qa_dot_4x16/generic.cpp",
1605 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_s8qa_mmla_4x16/generic.cpp",
1606 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_s8qs_dot_6x16/a55.cpp",
1607 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_s8qs_dot_6x16/generic.cpp",
1608 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_s8qs_mmla_6x16/generic.cpp",
1609 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_s8s32_dot_6x16/a55.cpp",
1610 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_s8s32_dot_6x16/generic.cpp",
1611 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_s8s32_mmla_6x16/generic.cpp",
1612 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_u8qa_dot_4x16/a55.cpp",
1613 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_u8qa_dot_4x16/generic.cpp",
1614 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_u8qa_mmla_4x16/generic.cpp",
1615 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_u8u32_dot_6x16/a55.cpp",
1616 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_u8u32_dot_6x16/generic.cpp",
1617 "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_u8u32_mmla_6x16/generic.cpp",
1618 "src/core/NEON/kernels/arm_gemm/kernels/a64_interleaved_bf16fp32_dot_8x12/generic.cpp",
1619 "src/core/NEON/kernels/arm_gemm/kernels/a64_interleaved_bf16fp32_dot_8x12/x1.cpp",
1620 "src/core/NEON/kernels/arm_gemm/kernels/a64_interleaved_bf16fp32_mmla_8x12/generic.cpp",
1621 "src/core/NEON/kernels/arm_gemm/kernels/a64_interleaved_bf16fp32_mmla_8x12/a510.cpp",
1622 "src/core/NEON/kernels/arm_gemm/kernels/a64_interleaved_s8s32_mmla_8x12/generic.cpp",
1623 "src/core/NEON/kernels/arm_gemm/kernels/a64_interleaved_s8s32_mmla_8x12/a510.cpp",
1624 "src/core/NEON/kernels/arm_gemm/kernels/a64_interleaved_u8u32_mmla_8x12/generic.cpp",
1625 "src/core/NEON/kernels/arm_gemm/kernels/a64_interleaved_u8u32_mmla_8x12/a510.cpp",
1626 "src/core/NEON/kernels/arm_gemm/kernels/a64_sgemm_8x12/a53.cpp",
1627 "src/core/NEON/kernels/arm_gemm/kernels/a64_sgemm_8x12/a55.cpp",
1628 "src/core/NEON/kernels/arm_gemm/kernels/a64_sgemm_8x12/a55r1.cpp",
1629 "src/core/NEON/kernels/arm_gemm/kernels/a64_sgemm_8x12/generic.cpp",
1630 "src/core/NEON/kernels/arm_gemm/kernels/a64_sgemm_8x12/x1.cpp",
1631 "src/core/NEON/kernels/arm_gemm/kernels/a64_sgemm_8x6/generic.cpp",
1632 "src/core/NEON/kernels/arm_gemm/kernels/a64_smallK_hybrid_fp32_mla_6x4/generic.cpp",
1633 "src/core/NEON/kernels/arm_gemm/kernels/a64_smallK_hybrid_fp32_mla_8x4/generic.cpp",
1634 "src/core/NEON/kernels/arm_gemm/kernels/a64_smallK_hybrid_s8s32_dot_6x4/a55.cpp",
1635 "src/core/NEON/kernels/arm_gemm/kernels/a64_smallK_hybrid_s8s32_dot_6x4/generic.cpp",
1636 "src/core/NEON/kernels/arm_gemm/kernels/a64_smallK_hybrid_s8s32_dot_8x4/a55.cpp",
1637 "src/core/NEON/kernels/arm_gemm/kernels/a64_smallK_hybrid_s8s32_dot_8x4/generic.cpp",
1638 "src/core/NEON/kernels/arm_gemm/kernels/a64_smallK_hybrid_u8u32_dot_6x4/a55.cpp",
1639 "src/core/NEON/kernels/arm_gemm/kernels/a64_smallK_hybrid_u8u32_dot_6x4/generic.cpp",
1640 "src/core/NEON/kernels/arm_gemm/kernels/a64_smallK_hybrid_u8u32_dot_8x4/a55.cpp",
ramelg01a1f78512022-06-29 16:28:10 +01001641 "src/core/NEON/kernels/arm_gemm/kernels/a64_smallK_hybrid_u8u32_dot_8x4/generic.cpp",
Dana Zlotnik256ac622022-02-02 15:06:11 +02001642 "src/cpu/kernels/gemm_matrix_mul/generic/neon/impl.cpp",
1643 "src/cpu/kernels/gemm_matrix_add/generic/neon/impl.cpp"
Motti Gondabi9d9ad332022-01-23 12:42:24 +02001644 ],
Dana Zlotnik256ac622022-02-02 15:06:11 +02001645 "fp32":["src/cpu/kernels/gemm_matrix_mul/generic/neon/fp32.cpp",
1646 "src/cpu/kernels/gemm_matrix_add/generic/neon/fp32.cpp"],
1647 "fp16":["src/cpu/kernels/gemm_matrix_mul/generic/neon/fp16.cpp",
1648 "src/cpu/kernels/gemm_matrix_add/generic/neon/fp16.cpp"],
Michalis Spyrou20fca522021-06-07 14:23:57 +01001649 "estate32": [
1650 "src/core/NEON/kernels/arm_gemm/kernels/a32_sgemm_8x6/a53.cpp",
1651 "src/core/NEON/kernels/arm_gemm/kernels/a32_sgemm_8x6/a55r1.cpp",
1652 "src/core/NEON/kernels/arm_gemm/kernels/a32_sgemm_8x6/generic.cpp"
1653 ],
1654 "estate64": [
Freddie Liardet487d3902021-09-21 12:36:43 +01001655 "src/core/NEON/kernels/arm_gemm/kernels/a64_sgemv_pretransposed/generic.cpp"
Francesco.Petrogalli@arm.com5fcf22d2022-04-05 10:31:08 +00001656 ],
Nathan John Sircombed7113e42023-04-26 15:02:43 +01001657 "fixed_format_kernels": [
Francesco.Petrogalli@arm.com5fcf22d2022-04-05 10:31:08 +00001658 "src/core/NEON/kernels/arm_gemm/kernels/a64_ffhybrid_bf16fp32_mmla_6x16/generic.cpp",
1659 "src/core/NEON/kernels/arm_gemm/kernels/a64_ffhybrid_fp16_mla_6x32/generic.cpp",
1660 "src/core/NEON/kernels/arm_gemm/kernels/a64_ffhybrid_fp32_mla_6x16/generic.cpp",
1661 "src/core/NEON/kernels/arm_gemm/kernels/a64_ffhybrid_fp32bf16fp32_mmla_4x24/generic.cpp",
1662 "src/core/NEON/kernels/arm_gemm/kernels/a64_ffinterleaved_bf16fp32_dot_8x12/generic.cpp",
1663 "src/core/NEON/kernels/arm_gemm/kernels/a64_ffinterleaved_bf16fp32_mmla_8x12/generic.cpp",
1664 "src/core/NEON/kernels/arm_gemm/kernels/a64_ffinterleaved_fp16_mla_8x24/generic.cpp",
1665 "src/core/NEON/kernels/arm_gemm/kernels/a64_ffinterleaved_fp32_mla_8x12/generic.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001666 ]
1667 },
1668 "sve": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001669 "common": [
Viet-Hoa Do03b29712022-06-01 11:47:14 +01001670 "src/core/NEON/kernels/arm_gemm/interleave_indirect-sve.cpp",
1671 "src/core/NEON/kernels/arm_gemm/kernels/sme2_gemv_bf16fp32_dot_16VL/generic.cpp",
1672 "src/core/NEON/kernels/arm_gemm/kernels/sme2_gemv_fp32_mla_16VL/generic.cpp",
1673 "src/core/NEON/kernels/arm_gemm/kernels/sme2_gemv_fp32bf16fp32_dot_16VL/generic.cpp",
1674 "src/core/NEON/kernels/arm_gemm/kernels/sme2_gemv_s8qa_dot_16VL/generic.cpp",
1675 "src/core/NEON/kernels/arm_gemm/kernels/sme2_gemv_u8qa_dot_16VL/generic.cpp",
1676 "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_bf16fp32_mopa_1VLx4VL/generic.cpp",
1677 "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_bf16fp32_mopa_2VLx2VL/generic.cpp",
1678 "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_bf16fp32_mopa_4VLx1VL/generic.cpp",
David Mansellaaa9da12023-03-10 13:48:50 +00001679 "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_fp16fp32fp16_mopa_1VLx4VL/generic.cpp",
1680 "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_fp16fp32fp16_mopa_2VLx2VL/generic.cpp",
1681 "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_fp16fp32fp16_mopa_4VLx1VL/generic.cpp",
Viet-Hoa Do03b29712022-06-01 11:47:14 +01001682 "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_fp32_mopa_1VLx4VL/generic.cpp",
1683 "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_fp32_mopa_2VLx2VL/generic.cpp",
1684 "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_fp32_mopa_4VLx1VL/generic.cpp",
1685 "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_s8q_mopa_1VLx4VL/generic.cpp",
1686 "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_s8q_mopa_2VLx2VL/generic.cpp",
1687 "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_s8q_mopa_4VLx1VL/generic.cpp",
1688 "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_s8s32_mopa_1VLx4VL/generic.cpp",
1689 "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_s8s32_mopa_2VLx2VL/generic.cpp",
1690 "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_s8s32_mopa_4VLx1VL/generic.cpp",
1691 "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_u8q_mopa_1VLx4VL/generic.cpp",
1692 "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_u8q_mopa_2VLx2VL/generic.cpp",
1693 "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_u8q_mopa_4VLx1VL/generic.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +01001694 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_bf16fp32_dot_6x4VL/generic.cpp",
Georgios Pinitas4ee8b152021-07-16 16:16:43 +01001695 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_bf16fp32_mmla_6x4VL/generic.cpp",
1696 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_fp16_mla_6x4VL/a64fx.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +01001697 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_fp16_mla_6x4VL/generic.cpp",
Georgios Pinitas4ee8b152021-07-16 16:16:43 +01001698 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_fp32_mla_6x4VL/a64fx.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +01001699 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_fp32_mla_6x4VL/generic.cpp",
Georgios Pinitas4ee8b152021-07-16 16:16:43 +01001700 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_fp32_mla_8x1VL/a64fx.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +01001701 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_fp32_mla_8x1VL/generic.cpp",
Georgios Pinitas4ee8b152021-07-16 16:16:43 +01001702 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_fp32bf16fp32_mmla_4x6VL/generic.cpp",
1703 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_fp32bf16fp32_mmla_6x4VL/generic.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +01001704 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_s8qa_dot_4x4VL/generic.cpp",
Georgios Pinitas4ee8b152021-07-16 16:16:43 +01001705 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_s8qa_mmla_4x4VL/generic.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +01001706 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_s8qs_dot_6x4VL/generic.cpp",
Georgios Pinitas4ee8b152021-07-16 16:16:43 +01001707 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_s8qs_mmla_6x4VL/generic.cpp",
1708 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_s8s32_dot_6x4VL/a64fx.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +01001709 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_s8s32_dot_6x4VL/generic.cpp",
Georgios Pinitas4ee8b152021-07-16 16:16:43 +01001710 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_s8s32_mmla_6x4VL/generic.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +01001711 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_u8qa_dot_4x4VL/generic.cpp",
Georgios Pinitas4ee8b152021-07-16 16:16:43 +01001712 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_u8qa_mmla_4x4VL/generic.cpp",
1713 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_u8u32_dot_6x4VL/a64fx.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +01001714 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_u8u32_dot_6x4VL/generic.cpp",
Georgios Pinitas4ee8b152021-07-16 16:16:43 +01001715 "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_u8u32_mmla_6x4VL/generic.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +01001716 "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_bf16fp32_dot_8x3VL/generic.cpp",
1717 "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_bf16fp32_mmla_8x3VL/generic.cpp",
Georgios Pinitas4ee8b152021-07-16 16:16:43 +01001718 "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_fp16_mla_8x3VL/a64fx.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +01001719 "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_fp16_mla_8x3VL/generic.cpp",
Georgios Pinitas4ee8b152021-07-16 16:16:43 +01001720 "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_fp32_mla_8x3VL/a64fx.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +01001721 "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_fp32_mla_8x3VL/generic.cpp",
1722 "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_fp32_mmla_8x3VL/generic.cpp",
Georgios Pinitas4ee8b152021-07-16 16:16:43 +01001723 "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_s8s32_dot_8x3VL/a64fx.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +01001724 "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_s8s32_dot_8x3VL/generic.cpp",
1725 "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_s8s32_mmla_8x3VL/generic.cpp",
Georgios Pinitas4ee8b152021-07-16 16:16:43 +01001726 "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_u8u32_dot_8x3VL/a64fx.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +01001727 "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_u8u32_dot_8x3VL/generic.cpp",
1728 "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_u8u32_mmla_8x3VL/generic.cpp",
Georgios Pinitas4ee8b152021-07-16 16:16:43 +01001729 "src/core/NEON/kernels/arm_gemm/mergeresults-sve.cpp",
Viet-Hoa Do03b29712022-06-01 11:47:14 +01001730 "src/core/NEON/kernels/arm_gemm/transform-sve.cpp",
1731 "src/core/NEON/kernels/arm_gemm/misc-sve.cpp"
Francesco.Petrogalli@arm.com5fcf22d2022-04-05 10:31:08 +00001732 ],
Nathan John Sircombed7113e42023-04-26 15:02:43 +01001733 "fixed_format_kernels": [
Francesco.Petrogalli@arm.com5fcf22d2022-04-05 10:31:08 +00001734 "src/core/NEON/kernels/arm_gemm/kernels/sve_ffhybrid_bf16fp32_mmla_6x4VL/generic.cpp",
1735 "src/core/NEON/kernels/arm_gemm/kernels/sve_ffhybrid_fp16_mla_6x4VL/a64fx.cpp",
1736 "src/core/NEON/kernels/arm_gemm/kernels/sve_ffhybrid_fp16_mla_6x4VL/generic.cpp",
1737 "src/core/NEON/kernels/arm_gemm/kernels/sve_ffhybrid_fp32_mla_6x4VL/a64fx.cpp",
1738 "src/core/NEON/kernels/arm_gemm/kernels/sve_ffhybrid_fp32_mla_6x4VL/generic.cpp",
1739 "src/core/NEON/kernels/arm_gemm/kernels/sve_ffhybrid_fp32bf16fp32_mmla_4x6VL/generic.cpp",
1740 "src/core/NEON/kernels/arm_gemm/kernels/sve_ffinterleaved_bf16fp32_mmla_8x3VL/generic.cpp",
1741 "src/core/NEON/kernels/arm_gemm/kernels/sve_ffinterleaved_fp16_mla_8x3VL/a64fx.cpp",
1742 "src/core/NEON/kernels/arm_gemm/kernels/sve_ffinterleaved_fp16_mla_8x3VL/generic.cpp",
1743 "src/core/NEON/kernels/arm_gemm/kernels/sve_ffinterleaved_fp32_mla_8x3VL/a64fx.cpp",
1744 "src/core/NEON/kernels/arm_gemm/kernels/sve_ffinterleaved_fp32_mla_8x3VL/generic.cpp"
1745 ]
Michalis Spyrou20fca522021-06-07 14:23:57 +01001746 }
1747 }
1748 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001749 "GenerateProposals": {
1750 "deps": [ "BoundingBoxTransform", "Dequantize", "Pad", "Permute", "Quantize", "Reshape" ],
Michalis Spyrou20fca522021-06-07 14:23:57 +01001751 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001752 "common": [
1753 "src/core/NEON/kernels/NEGenerateProposalsLayerKernel.cpp",
1754 "src/runtime/NEON/functions/NEGenerateProposalsLayer.cpp"
Dana Zlotnik50ce2772021-12-29 13:55:56 +02001755 ],
1756 "neon":{
1757 "common":["src/cpu/kernels/genproposals/generic/neon/impl.cpp"],
1758 "fp16":["src/cpu/kernels/genproposals/generic/neon/fp16.cpp"],
1759 "fp32":["src/cpu/kernels/genproposals/generic/neon/fp32.cpp"],
1760 "qsymm16":["src/cpu/kernels/genproposals/generic/neon/qsymm16.cpp"]
1761 }
Michalis Spyrou20fca522021-06-07 14:23:57 +01001762 }
1763 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001764 "InstanceNormalize": {
1765 "deps": [ "Permute", "Reduction" ],
Michalis Spyrou20fca522021-06-07 14:23:57 +01001766 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001767 "common": [
1768 "src/core/NEON/kernels/NEInstanceNormalizationLayerKernel.cpp",
1769 "src/runtime/NEON/functions/NEInstanceNormalizationLayer.cpp"
ramelg01a1f78512022-06-29 16:28:10 +01001770 ],
Dana Zlotnikd7e2ec52022-01-03 10:59:41 +02001771 "neon":{
1772 "common":["src/cpu/kernels/instancenorm/generic/neon/impl.cpp"],
1773 "fp16":["src/cpu/kernels/instancenorm/generic/neon/fp16.cpp"],
1774 "fp32":["src/cpu/kernels/instancenorm/generic/neon/fp32.cpp"]
1775 }
Michalis Spyrou20fca522021-06-07 14:23:57 +01001776 }
1777 },
1778 "L2Normalize": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001779 "deps": [ "Reduction" ],
Michalis Spyrou20fca522021-06-07 14:23:57 +01001780 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001781 "common": [
1782 "src/core/NEON/kernels/NEL2NormalizeLayerKernel.cpp",
1783 "src/runtime/NEON/functions/NEL2NormalizeLayer.cpp"
Yair Schwarzbaum5e993182022-01-10 15:11:07 +02001784 ],
1785 "neon":{
1786 "common":["src/cpu/kernels/l2normlayer/generic/neon/impl.cpp"],
1787 "fp32":["src/cpu/kernels/l2normlayer/generic/neon/fp32.cpp"],
1788 "fp16":["src/cpu/kernels/l2normlayer/generic/neon/fp16.cpp"]
1789 }
Michalis Spyrou20fca522021-06-07 14:23:57 +01001790 }
1791 },
1792 "Logical": {
1793 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001794 "common": [
1795 "src/core/NEON/kernels/NELogicalKernel.cpp",
1796 "src/runtime/NEON/functions/NELogical.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001797 ]
1798 }
1799 },
Viet-Hoa Dofd472f02023-03-15 14:05:06 +00001800 "LUT": {
1801 "files": {
1802 "common": [],
1803 "neon":{
1804 "qasymm8": ["src/cpu/kernels/lut/generic/neon/u8.cpp"],
1805 "qasymm8_signed": ["src/cpu/kernels/lut/generic/neon/u8.cpp"]
1806 },
SiCong Lic0463a22023-05-17 13:46:13 +01001807 "sve2": {
1808 "qasymm8": ["src/cpu/kernels/lut/generic/sve2/u8.cpp"],
1809 "qasymm8_signed": ["src/cpu/kernels/lut/generic/sve2/u8.cpp"]
Viet-Hoa Dofd472f02023-03-15 14:05:06 +00001810 }
1811 }
1812 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001813 "LSTM": {
Michalis Spyrou20fca522021-06-07 14:23:57 +01001814 "deps": [
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001815 "Activation",
1816 "Concatenate",
1817 "Copy",
1818 "Dequantize",
1819 "ElementwiseBinary",
1820 "Fill",
1821 "FullyConnected",
1822 "Gemm",
1823 "MeanStdDevNormalize",
1824 "Mul",
1825 "Quantize",
1826 "Slice",
1827 "Transpose"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001828 ],
1829 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001830 "common": [
1831 "src/core/NEON/kernels/NEQLSTMLayerNormalizationKernel.cpp",
1832 "src/runtime/NEON/functions/NELSTMLayer.cpp",
1833 "src/runtime/NEON/functions/NELSTMLayerQuantized.cpp",
1834 "src/runtime/NEON/functions/NEQLSTMLayer.cpp"
1835 ]
1836 }
1837 },
1838 "MaxUnpool2d": {
1839 "deps": [ "Fill" ],
1840 "files": {
1841 "common": [
Dana Zlotnik149203b2022-01-26 12:38:03 +02001842 "src/cpu/kernels/CpuMaxUnpoolingLayerKernel.cpp",
ramelg01a1f78512022-06-29 16:28:10 +01001843 "src/runtime/NEON/functions/NEMaxUnpoolingLayer.cpp",
Dana Zlotnik149203b2022-01-26 12:38:03 +02001844 "src/cpu/operators/CpuMaxUnpooling.cpp"
Dana Zlotnik143310c2021-12-30 13:24:52 +02001845 ],
1846 "neon":{
Dana Zlotnik143310c2021-12-30 13:24:52 +02001847 "fp32":["src/cpu/kernels/maxunpool/generic/neon/fp32.cpp"],
1848 "fp16":["src/cpu/kernels/maxunpool/generic/neon/fp16.cpp"],
1849 "qasymm8":["src/cpu/kernels/maxunpool/generic/neon/qasymm8.cpp"],
Dana Zlotnik149203b2022-01-26 12:38:03 +02001850 "qasymm8_signed":[ "src/cpu/kernels/maxunpool/generic/neon/qasymm8_signed.cpp"],
1851 "common":["src/cpu/kernels/maxunpool/generic/neon/impl.cpp"]
Dana Zlotnik143310c2021-12-30 13:24:52 +02001852 }
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001853 }
1854 },
1855 "Mean": {
1856 "deps" : [ "Reduction" ],
1857 "files": {
1858 "common": [ "src/runtime/NEON/functions/NEReduceMean.cpp" ]
1859 }
1860 },
1861 "MeanStdDevNormalize": {
1862 "files": {
1863 "common": [
1864 "src/core/NEON/kernels/NEMeanStdDevNormalizationKernel.cpp",
1865 "src/runtime/NEON/functions/NEMeanStdDevNormalizationLayer.cpp"
Dana Zlotnik027bcef2021-12-27 17:35:00 +02001866 ],
1867 "neon":{
1868 "common":["src/cpu/kernels/meanstddevnorm/generic/neon/impl.cpp"],
1869 "fp32":["src/cpu/kernels/meanstddevnorm/generic/neon/fp32.cpp"],
Murray Kornelsen6e09e142022-07-13 21:40:26 -04001870 "fp16":["src/cpu/kernels/meanstddevnorm/generic/neon/fp16.cpp"],
1871 "qasymm8":["src/cpu/kernels/meanstddevnorm/generic/neon/qasymm8.cpp"]
Dana Zlotnik027bcef2021-12-27 17:35:00 +02001872 }
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001873 }
1874 },
Mohammed Suhail Munshia1b1e412023-03-23 22:21:31 +00001875 "MatMul" : {
Viet-Hoa Do99b6fd22023-04-27 17:06:10 +01001876 "deps": [ "Transpose" ],
Mohammed Suhail Munshia1b1e412023-03-23 22:21:31 +00001877 "files": {
1878 "common": [
1879 "src/cpu/operators/CpuMatMul.cpp",
1880 "src/runtime/NEON/functions/NEMatMul.cpp"
1881 ]
1882 }
1883 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001884 "Mul": {
1885 "files": {
1886 "common": [
1887 "src/cpu/operators/CpuMul.cpp",
1888 "src/cpu/kernels/CpuMulKernel.cpp",
1889 "src/runtime/NEON/functions/NEPixelWiseMultiplication.cpp"
1890 ]
1891 }
1892 },
1893 "Normalize": {
1894 "deps": [ "Mul" ],
1895 "files": {
1896 "common": [
1897 "src/core/NEON/kernels/NENormalizationLayerKernel.cpp",
1898 "src/runtime/NEON/functions/NENormalizationLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001899 ]
1900 }
1901 },
1902 "Pad": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001903 "deps": [ "Concatenate", "Copy", "StridedSlice" ],
Michalis Spyrou20fca522021-06-07 14:23:57 +01001904 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001905 "common": [
1906 "src/core/NEON/kernels/NEPadLayerKernel.cpp",
1907 "src/runtime/NEON/functions/NEPadLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001908 ]
1909 }
1910 },
1911 "Permute": {
1912 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001913 "common": [
1914 "src/cpu/operators/CpuPermute.cpp",
1915 "src/cpu/kernels/CpuPermuteKernel.cpp",
1916 "src/runtime/NEON/functions/NEPermute.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001917 ]
1918 }
1919 },
1920 "Pool2d": {
1921 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001922 "common": [
1923 "src/cpu/operators/CpuPool2d.cpp",
Georgios Pinitas7891a732021-08-20 21:39:25 +01001924 "src/cpu/kernels/CpuPool2dKernel.cpp",
1925 "src/cpu/kernels/internal/CpuPool2dAssemblyWrapperKernel.cpp",
Motti Gondabi9d9ad332022-01-23 12:42:24 +02001926 "src/runtime/NEON/functions/NEPoolingLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01001927 ],
1928 "neon": {
Motti Gondabi9d9ad332022-01-23 12:42:24 +02001929 "common": [
1930 "src/core/NEON/kernels/arm_conv/pooling/kernels/cpp_nhwc_1x1_stride_any_depthfirst/generic.cpp",
1931 "src/core/NEON/kernels/arm_conv/pooling/pooling_fp16.cpp",
1932 "src/core/NEON/kernels/arm_conv/pooling/pooling_fp32.cpp",
1933 "src/core/NEON/kernels/arm_conv/pooling/pooling_s8.cpp",
1934 "src/core/NEON/kernels/arm_conv/pooling/pooling_s8q.cpp",
1935 "src/core/NEON/kernels/arm_conv/pooling/pooling_u8.cpp",
1936 "src/core/NEON/kernels/arm_conv/pooling/pooling_u8q.cpp",
1937 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_fp16_nhwc_avg_3x3_s1_output2x2_depthfirst/generic.cpp",
1938 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_fp16_nhwc_avg_generic_depthfirst/generic.cpp",
1939 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_fp16_nhwc_max_2x2_s1_output2x2_depthfirst/generic.cpp",
1940 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_fp16_nhwc_max_generic_depthfirst/generic.cpp",
1941 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_fp32_nhwc_avg_3x3_s1_output2x2_depthfirst/generic.cpp",
1942 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_fp32_nhwc_avg_generic_depthfirst/generic.cpp",
1943 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_fp32_nhwc_max_2x2_s1_output2x2_depthfirst/generic.cpp",
1944 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_fp32_nhwc_max_generic_depthfirst/generic.cpp",
1945 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_s8_nhwc_avg_generic_depthfirst/generic.cpp",
1946 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_s8_nhwc_max_2x2_s1_output2x2_depthfirst/generic.cpp",
1947 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_s8_nhwc_max_generic_depthfirst/generic.cpp",
1948 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_s8q_nhwc_avg_generic_depthfirst/generic.cpp",
1949 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_s8q_nhwc_max_generic_depthfirst/generic.cpp",
1950 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_u8_nhwc_avg_generic_depthfirst/generic.cpp",
1951 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_u8_nhwc_max_2x2_s1_output2x2_depthfirst/generic.cpp",
1952 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_u8_nhwc_max_generic_depthfirst/generic.cpp",
1953 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_u8q_nhwc_avg_generic_depthfirst/generic.cpp",
ramelg01a1f78512022-06-29 16:28:10 +01001954 "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_u8q_nhwc_max_generic_depthfirst/generic.cpp"
Motti Gondabi9d9ad332022-01-23 12:42:24 +02001955 ],
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001956 "nchw": [ "src/cpu/kernels/pool2d/neon/nchw/all.cpp" ],
1957 "fp16": [ "src/cpu/kernels/pool2d/neon/fp16.cpp" ],
ramelg01a1f78512022-06-29 16:28:10 +01001958 "fp32": [ "src/cpu/kernels/pool2d/neon/fp32.cpp" ],
1959 "qasymm8":[ "src/cpu/kernels/pool2d/neon/qasymm8.cpp" ],
Dana Zlotnika538ae52022-02-21 13:12:41 +02001960 "qasymm8_signed":["src/cpu/kernels/pool2d/neon/qasymm8_signed.cpp"]
Michalis Spyrou20fca522021-06-07 14:23:57 +01001961 },
1962 "sve": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001963 "common": [
Michalis Spyrou20fca522021-06-07 14:23:57 +01001964 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_fp16_nhwc_avg_3x3_s1_output2x2_depthfirst/generic.cpp",
1965 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_fp16_nhwc_avg_generic_depthfirst/generic.cpp",
1966 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_fp16_nhwc_max_2x2_s1_output2x2_depthfirst/generic.cpp",
1967 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_fp16_nhwc_max_generic_depthfirst/generic.cpp",
Georgios Pinitasb6af4822021-09-14 12:33:34 +01001968 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_fp32_nhwc_avg_3x3_s1_output2x2_depthfirst/generic.cpp",
1969 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_fp32_nhwc_avg_generic_depthfirst/generic.cpp",
1970 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_fp32_nhwc_max_2x2_s1_output2x2_depthfirst/generic.cpp",
1971 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_fp32_nhwc_max_generic_depthfirst/generic.cpp",
Michalis Spyrou20fca522021-06-07 14:23:57 +01001972 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_s8_nhwc_avg_generic_depthfirst/generic.cpp",
1973 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_s8_nhwc_max_2x2_s1_output2x2_depthfirst/generic.cpp",
1974 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_s8_nhwc_max_generic_depthfirst/generic.cpp",
1975 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_s8q_nhwc_avg_generic_depthfirst/generic.cpp",
1976 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_s8q_nhwc_max_generic_depthfirst/generic.cpp",
1977 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_u8_nhwc_avg_generic_depthfirst/generic.cpp",
1978 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_u8_nhwc_max_2x2_s1_output2x2_depthfirst/generic.cpp",
1979 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_u8_nhwc_max_generic_depthfirst/generic.cpp",
1980 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_u8q_nhwc_avg_generic_depthfirst/generic.cpp",
Viet-Hoa Do03b29712022-06-01 11:47:14 +01001981 "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_u8q_nhwc_max_generic_depthfirst/generic.cpp",
1982 "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_fp16_nhwc_avg_3x3_s1_output2x2_depthfirst/generic.cpp",
1983 "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_fp16_nhwc_avg_generic_depthfirst/generic.cpp",
1984 "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_fp16_nhwc_max_2x2_s1_output2x2_depthfirst/generic.cpp",
1985 "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_fp16_nhwc_max_generic_depthfirst/generic.cpp",
1986 "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_fp32_nhwc_avg_3x3_s1_output2x2_depthfirst/generic.cpp",
1987 "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_fp32_nhwc_avg_generic_depthfirst/generic.cpp",
1988 "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_fp32_nhwc_max_2x2_s1_output2x2_depthfirst/generic.cpp",
1989 "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_fp32_nhwc_max_generic_depthfirst/generic.cpp",
1990 "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_s8_nhwc_avg_generic_depthfirst/generic.cpp",
1991 "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_s8_nhwc_max_2x2_s1_output2x2_depthfirst/generic.cpp",
1992 "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_s8_nhwc_max_generic_depthfirst/generic.cpp",
1993 "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_s8q_nhwc_avg_generic_depthfirst/generic.cpp",
1994 "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_s8q_nhwc_max_generic_depthfirst/generic.cpp",
1995 "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_u8_nhwc_avg_generic_depthfirst/generic.cpp",
1996 "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_u8_nhwc_max_2x2_s1_output2x2_depthfirst/generic.cpp",
1997 "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_u8_nhwc_max_generic_depthfirst/generic.cpp",
1998 "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_u8q_nhwc_avg_generic_depthfirst/generic.cpp",
1999 "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_u8q_nhwc_max_generic_depthfirst/generic.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01002000 ]
2001 }
2002 }
2003 },
Adnan AlSinan171fc3d2022-03-15 18:46:42 +00002004 "Pool3d": {
2005 "files": {
2006 "common": [
2007 "src/cpu/operators/CpuPool3d.cpp",
2008 "src/cpu/kernels/CpuPool3dKernel.cpp",
2009 "src/runtime/NEON/functions/NEPooling3dLayer.cpp"
2010 ],
2011 "neon": {
Adnan AlSinan9104cd52022-04-06 16:19:31 +01002012 "common": [ "src/cpu/kernels/pool3d/neon/impl.cpp" ],
2013 "fp16": [ "src/cpu/kernels/pool3d/neon/fp16.cpp" ],
2014 "fp32": [ "src/cpu/kernels/pool3d/neon/fp32.cpp" ],
2015 "qasymm8": [ "src/cpu/kernels/pool3d/neon/qasymm8.cpp" ],
2016 "qasymm8_signed": [ "src/cpu/kernels/pool3d/neon/qasymm8_signed.cpp" ]
Adnan AlSinan171fc3d2022-03-15 18:46:42 +00002017 }
2018 }
2019 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002020 "PRelu": {
2021 "deps": [ "ElementwiseBinary" ],
Michalis Spyrou20fca522021-06-07 14:23:57 +01002022 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002023 "common": [
2024 "src/runtime/NEON/functions/NEPReluLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01002025 ]
2026 }
2027 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002028 "PriorBox": {
Michalis Spyrou20fca522021-06-07 14:23:57 +01002029 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002030 "common": [
2031 "src/core/NEON/kernels/NEPriorBoxLayerKernel.cpp",
2032 "src/runtime/NEON/functions/NEPriorBoxLayer.cpp"
2033 ]
2034 }
2035 },
2036 "Quantize": {
2037 "files": {
2038 "common": [
2039 "src/cpu/operators/CpuQuantize.cpp",
2040 "src/cpu/kernels/CpuQuantizeKernel.cpp",
2041 "src/runtime/NEON/functions/NEQuantizationLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01002042 ]
2043 }
2044 },
2045 "Range": {
2046 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002047 "common": [
2048 "src/core/NEON/kernels/NERangeKernel.cpp",
2049 "src/runtime/NEON/functions/NERange.cpp"
Yair Schwarzbaum9e8a7702021-11-08 10:58:06 +02002050 ],
2051 "neon": {
2052 "common": [ "src/cpu/kernels/range/generic/neon/impl.cpp" ],
2053 "fp32": [ "src/cpu/kernels/range/generic/neon/fp32.cpp" ],
2054 "fp16": [ "src/cpu/kernels/range/generic/neon/fp16.cpp" ],
2055 "integer": [ "src/cpu/kernels/range/generic/neon/integer.cpp" ]
2056 }
Michalis Spyrou20fca522021-06-07 14:23:57 +01002057 }
2058 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002059 "Reduction":{
2060 "deps": [ "Reshape" ],
Michalis Spyrou20fca522021-06-07 14:23:57 +01002061 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002062 "common": [
2063 "src/core/NEON/kernels/NEReductionOperationKernel.cpp",
2064 "src/runtime/NEON/functions/NEReductionOperation.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01002065 ]
2066 }
2067 },
Michalis Spyrou20fca522021-06-07 14:23:57 +01002068 "Reorg": {
2069 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002070 "common": [
2071 "src/core/NEON/kernels/NEReorgLayerKernel.cpp",
2072 "src/runtime/NEON/functions/NEReorgLayer.cpp"
2073 ]
2074 }
2075 },
2076 "Reshape": {
2077 "files": {
2078 "common": [
2079 "src/cpu/operators/CpuReshape.cpp",
2080 "src/cpu/kernels/CpuReshapeKernel.cpp",
2081 "src/runtime/NEON/functions/NEReshapeLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01002082 ]
2083 }
2084 },
David Svantesson3b162e52023-03-28 14:13:32 +00002085 "Reorder": {
2086 "files": {
2087 "common": [
David Svantessonf0ff76d2023-04-28 16:34:52 +00002088 "src/runtime/NEON/functions/NEReorderLayer.cpp",
David Svantesson3b162e52023-03-28 14:13:32 +00002089 "src/core/NEON/kernels/NEReorderKernel.cpp"
2090 ]
2091 }
2092 },
Michalis Spyrou20fca522021-06-07 14:23:57 +01002093 "Reverse": {
2094 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002095 "common": [
2096 "src/core/NEON/kernels/NEReverseKernel.cpp",
2097 "src/runtime/NEON/functions/NEReverse.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01002098 ]
2099 }
2100 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002101 "RNN": {
2102 "deps": [ "Activation", "Add", "FullyConnected", "Gemm"],
2103 "files": {
2104 "common": [ "src/runtime/NEON/functions/NERNNLayer.cpp" ]
2105 }
2106 },
Michalis Spyrou20fca522021-06-07 14:23:57 +01002107 "ROIAlign": {
2108 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002109 "common": [
2110 "src/core/NEON/kernels/NEROIAlignLayerKernel.cpp",
2111 "src/runtime/NEON/functions/NEROIAlignLayer.cpp"
Dana Zlotnik9ae5a4e2022-01-03 16:22:47 +02002112 ],
2113 "neon":{
2114 "common":["src/cpu/kernels/roialign/generic/neon/impl.cpp"],
2115 "fp32":["src/cpu/kernels/roialign/generic/neon/fp32.cpp"],
2116 "fp16":["src/cpu/kernels/roialign/generic/neon/fp16.cpp"],
2117 "qasymm8":["src/cpu/kernels/roialign/generic/neon/qasymm8.cpp"],
2118 "qasymm8_signed":["src/cpu/kernels/roialign/generic/neon/qasymm8_signed.cpp"]
2119 }
Michalis Spyrou20fca522021-06-07 14:23:57 +01002120 }
2121 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002122 "ROIPool2d": {
Michalis Spyrou20fca522021-06-07 14:23:57 +01002123 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002124 "common": [
2125 "src/core/NEON/kernels/NEROIPoolingLayerKernel.cpp",
2126 "src/runtime/NEON/functions/NEROIPoolingLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01002127 ]
2128 }
2129 },
2130 "Scale": {
2131 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002132 "common": [
2133 "src/cpu/operators/CpuScale.cpp",
2134 "src/cpu/kernels/CpuScaleKernel.cpp",
2135 "src/runtime/NEON/functions/NEScale.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01002136 ],
2137 "sve": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002138 "fp16": [ "src/cpu/kernels/scale/sve/fp16.cpp" ],
2139 "fp32": [ "src/cpu/kernels/scale/sve/fp32.cpp" ],
2140 "integer": [ "src/cpu/kernels/scale/sve/integer.cpp" ],
2141 "qasymm8": [ "src/cpu/kernels/scale/sve/qasymm8.cpp" ],
2142 "qasymm8_signed": [ "src/cpu/kernels/scale/sve/qasymm8_signed.cpp" ]
Michalis Spyrou20fca522021-06-07 14:23:57 +01002143 },
2144 "neon": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002145 "fp16": [ "src/cpu/kernels/scale/neon/fp16.cpp" ],
2146 "integer": [ "src/cpu/kernels/scale/neon/integer.cpp" ],
Gunes Bayirc4f27432022-09-11 15:59:19 +01002147 "qasymm8": [ "src/cpu/kernels/scale/neon/qasymm8.cpp", "src/cpu/kernels/scale/neon/integer.cpp" ],
2148 "qasymm8_signed": [ "src/cpu/kernels/scale/neon/qasymm8_signed.cpp", "src/cpu/kernels/scale/neon/integer.cpp" ]
Michalis Spyrou20fca522021-06-07 14:23:57 +01002149 }
2150 }
2151 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002152 "Select": {
2153 "files": {
2154 "common": [
2155 "src/core/NEON/kernels/NESelectKernel.cpp",
2156 "src/runtime/NEON/functions/NESelect.cpp"
Anton Vainer8a9a0fb2022-01-09 14:37:12 +02002157 ],
2158 "neon": {
2159 "common": [ "src/cpu/kernels/select/generic/neon/impl.cpp" ],
2160 "fp32": [ "src/cpu/kernels/select/generic/neon/fp32.cpp" ],
2161 "fp16": [ "src/cpu/kernels/select/generic/neon/fp16.cpp" ],
2162 "integer": [ "src/cpu/kernels/select/generic/neon/integer.cpp" ]
2163 }
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002164 }
2165 },
2166 "Slice": {
2167 "deps": [ "StridedSlice" ],
2168 "files": {
2169 "common": [ "src/runtime/NEON/functions/NESlice.cpp" ]
2170 }
2171 },
Michalis Spyrou20fca522021-06-07 14:23:57 +01002172 "Softmax": {
2173 "deps": [
2174 "Permute"
2175 ],
2176 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002177 "common": [
2178 "src/cpu/operators/CpuSoftmax.cpp",
2179 "src/cpu/kernels/CpuSoftmaxKernel.cpp",
2180 "src/runtime/NEON/functions/NESoftmaxLayer.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01002181 ],
Dana Zlotnikc48a3e52021-12-21 13:34:42 +02002182 "neon":{
Dana Zlotnika538ae52022-02-21 13:12:41 +02002183 "common":["src/cpu/kernels/softmax/generic/neon/impl.cpp"],
Dana Zlotnikc48a3e52021-12-21 13:34:42 +02002184 "fp32": ["src/cpu/kernels/softmax/generic/neon/fp32.cpp"],
ramelg01a1f78512022-06-29 16:28:10 +01002185 "fp16": ["src/cpu/kernels/softmax/generic/neon/fp16.cpp"],
2186 "qasymm8":[ "src/cpu/kernels/softmax/generic/neon/qasymm8.cpp"],
Dana Zlotnik6a2df882022-01-17 09:54:26 +02002187 "qasymm8_signed":["src/cpu/kernels/softmax/generic/neon/qasymm8_signed.cpp"]
Dana Zlotnikc48a3e52021-12-21 13:34:42 +02002188 },
Michalis Spyrou20fca522021-06-07 14:23:57 +01002189 "sve": {
Dana Zlotnikc48a3e52021-12-21 13:34:42 +02002190 "common": [ "src/cpu/kernels/softmax/generic/sve/impl.cpp" ],
2191 "fp32": ["src/cpu/kernels/softmax/generic/sve/fp32.cpp"],
2192 "fp16": ["src/cpu/kernels/softmax/generic/sve/fp16.cpp"],
Dana Zlotnik6a2df882022-01-17 09:54:26 +02002193 "qasymm8": ["src/cpu/kernels/softmax/generic/sve/qasymm8.cpp" ],
2194 "qasymm8_signed": ["src/cpu/kernels/softmax/generic/sve/qasymm8_signed.cpp"]
2195 },
2196 "sve2":{
Dana Zlotnika538ae52022-02-21 13:12:41 +02002197 "common" :["src/cpu/kernels/softmax/generic/sve2/impl.cpp"],
ramelg01a1f78512022-06-29 16:28:10 +01002198 "qasymm8":[ "src/cpu/kernels/softmax/generic/sve2/qasymm8.cpp"],
Dana Zlotnik6a2df882022-01-17 09:54:26 +02002199 "qasymm8_signed":["src/cpu/kernels/softmax/generic/sve2/qasymm8_signed.cpp"]
Michalis Spyrou20fca522021-06-07 14:23:57 +01002200 }
2201 }
2202 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002203 "SpaceToBatch": {
2204 "files": {
2205 "common": [
2206 "src/core/NEON/kernels/NESpaceToBatchLayerKernel.cpp",
2207 "src/runtime/NEON/functions/NESpaceToBatchLayer.cpp"
2208 ]
2209 }
2210 },
2211 "SpaceToDepth": {
2212 "files": {
2213 "common": [
2214 "src/core/NEON/kernels/NESpaceToDepthLayerKernel.cpp",
2215 "src/runtime/NEON/functions/NESpaceToDepthLayer.cpp"
2216 ]
2217 }
2218 },
2219 "Split": {
2220 "deps": [ "StridedSlice" ],
2221 "files": {
2222 "common": [
2223 "src/runtime/NEON/functions/NESplit.cpp"
2224 ]
2225 }
2226 },
2227 "Stack": {
2228 "files": {
2229 "common": [
2230 "src/core/NEON/kernels/NEStackLayerKernel.cpp",
2231 "src/runtime/NEON/functions/NEStackLayer.cpp"
2232 ]
2233 }
2234 },
2235 "StridedSlice": {
2236 "files": {
2237 "common": [
2238 "src/core/NEON/kernels/NEStridedSliceKernel.cpp",
2239 "src/runtime/NEON/functions/NEStridedSlice.cpp"
2240 ]
2241 }
2242 },
Michalis Spyrou20fca522021-06-07 14:23:57 +01002243 "Sub": {
2244 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002245 "common": [
2246 "src/cpu/operators/CpuSub.cpp",
2247 "src/cpu/kernels/CpuSubKernel.cpp",
Freddie Liardet487d3902021-09-21 12:36:43 +01002248 "src/runtime/NEON/functions/NEArithmeticSubtraction.cpp",
2249 "src/cpu/kernels/sub/neon/qasymm8.cpp",
2250 "src/cpu/kernels/sub/neon/qasymm8_signed.cpp",
2251 "src/cpu/kernels/sub/neon/qsymm16.cpp"
2252 ]
Michalis Spyrou20fca522021-06-07 14:23:57 +01002253 }
2254 },
Michalis Spyrou20fca522021-06-07 14:23:57 +01002255 "Tile": {
2256 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002257 "common": [
2258 "src/core/NEON/kernels/NETileKernel.cpp",
2259 "src/runtime/NEON/functions/NETile.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01002260 ]
2261 }
2262 },
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002263 "Transpose": {
Michalis Spyrou20fca522021-06-07 14:23:57 +01002264 "files": {
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002265 "common": [
2266 "src/cpu/kernels/CpuTransposeKernel.cpp",
2267 "src/cpu/operators/CpuTranspose.cpp",
2268 "src/runtime/NEON/functions/NETranspose.cpp"
Michalis Spyrou20fca522021-06-07 14:23:57 +01002269 ]
2270 }
Georgios Pinitasb6af4822021-09-14 12:33:34 +01002271 },
2272 "Unstack": {
2273 "deps": [ "StridedSlice" ],
2274 "files": {
2275 "common": [ "src/runtime/NEON/functions/NEUnstack.cpp" ]
2276 }
Michalis Spyrou20fca522021-06-07 14:23:57 +01002277 }
2278 }
Giorgio Arena232c4522022-03-03 10:09:01 +00002279 },
2280 "experimental": {
2281 "dynamic_fusion": [
SiCong Lif44bbc52022-08-29 18:25:51 +01002282 "src/dynamic_fusion/runtime/gpu/cl/ClKernelRuntime.cpp",
2283 "src/dynamic_fusion/runtime/gpu/cl/ClWorkloadRuntime.cpp",
Gunes Bayir1dc6ff12022-12-06 20:48:31 +00002284 "src/dynamic_fusion/sketch/attributes/CastAttributes.cpp",
Jakub Sujak32741722022-11-25 16:43:18 +00002285 "src/dynamic_fusion/sketch/attributes/ClampAttributes.cpp",
SiCong Li5a63d1e2023-01-06 16:28:57 +00002286 "src/dynamic_fusion/sketch/attributes/Conv2dAttributes.cpp",
Gunes Bayir7dc02342022-11-21 21:46:50 +00002287 "src/dynamic_fusion/sketch/attributes/DepthwiseConv2dAttributes.cpp",
Mohammed Suhail Munshia18d85c2023-01-03 10:16:16 +00002288 "src/dynamic_fusion/sketch/attributes/Pool2dAttributes.cpp",
Jakub Sujak8ae57142022-12-02 16:09:06 +00002289 "src/dynamic_fusion/sketch/attributes/ResizeAttributes.cpp",
Gunes Bayiraecb5d92022-12-18 21:31:29 +00002290 "src/dynamic_fusion/sketch/attributes/SoftmaxAttributes.cpp",
Ramy Elgammalf800adf2022-12-14 15:39:29 +00002291 "src/dynamic_fusion/sketch/attributes/ReshapeAttributes.cpp",
SiCong Lif44bbc52022-08-29 18:25:51 +01002292 "src/dynamic_fusion/sketch/gpu/GpuKernelArgument.cpp",
2293 "src/dynamic_fusion/sketch/gpu/GpuKernelComponentGraph.cpp",
2294 "src/dynamic_fusion/sketch/gpu/GpuKernelComponentGroup.cpp",
2295 "src/dynamic_fusion/sketch/gpu/GpuKernelComponentStream.cpp",
2296 "src/dynamic_fusion/sketch/gpu/GpuLogicalKernel.cpp",
2297 "src/dynamic_fusion/sketch/gpu/GpuOperatorGroup.cpp",
2298 "src/dynamic_fusion/sketch/gpu/GpuWorkloadContext.cpp",
2299 "src/dynamic_fusion/sketch/gpu/GpuWorkloadSketch.cpp",
Jakub Sujak32741722022-11-25 16:43:18 +00002300 "src/dynamic_fusion/sketch/gpu/components/cl/ClComponentActivation.cpp",
Gunes Bayir1dc6ff12022-12-06 20:48:31 +00002301 "src/dynamic_fusion/sketch/gpu/components/cl/ClComponentCast.cpp",
Gunes Bayir7dc02342022-11-21 21:46:50 +00002302 "src/dynamic_fusion/sketch/gpu/components/cl/ClComponentDepthwiseConv2d.cpp",
SiCong Lif44bbc52022-08-29 18:25:51 +01002303 "src/dynamic_fusion/sketch/gpu/components/cl/ClComponentDirectConv2d.cpp",
Mohammed Suhail Munshia18d85c2023-01-03 10:16:16 +00002304 "src/dynamic_fusion/sketch/gpu/components/cl/ClComponentPool2d.cpp",
Ramy Elgammal404462a2022-11-08 02:14:46 +00002305 "src/dynamic_fusion/sketch/gpu/components/cl/ClComponentElementwiseBinary.cpp",
Gunes Bayiraecb5d92022-12-18 21:31:29 +00002306 "src/dynamic_fusion/sketch/gpu/components/cl/ClComponentLogits1DMaxShiftExpSum.cpp",
Ramy Elgammal002e6532023-01-11 18:48:04 +00002307 "src/dynamic_fusion/sketch/gpu/components/cl/ClComponentLogits1DNorm.cpp",
Ramy Elgammalf800adf2022-12-14 15:39:29 +00002308 "src/dynamic_fusion/sketch/gpu/components/cl/ClComponentReshape.cpp",
Jakub Sujak8ae57142022-12-02 16:09:06 +00002309 "src/dynamic_fusion/sketch/gpu/components/cl/ClComponentResize.cpp",
SiCong Lif44bbc52022-08-29 18:25:51 +01002310 "src/dynamic_fusion/sketch/gpu/components/cl/ClComponentStore.cpp",
Ramy Elgammal404462a2022-11-08 02:14:46 +00002311 "src/dynamic_fusion/sketch/gpu/operators/GpuAdd.cpp",
Gunes Bayir1dc6ff12022-12-06 20:48:31 +00002312 "src/dynamic_fusion/sketch/gpu/operators/GpuCast.cpp",
Jakub Sujak32741722022-11-25 16:43:18 +00002313 "src/dynamic_fusion/sketch/gpu/operators/GpuClamp.cpp",
Gunes Bayir1dc6ff12022-12-06 20:48:31 +00002314 "src/dynamic_fusion/sketch/gpu/operators/GpuConv2d.cpp",
Jakub Sujak7359a872023-01-05 14:24:13 +00002315 "src/dynamic_fusion/sketch/gpu/operators/GpuDepthwiseConv2d.cpp",
2316 "src/dynamic_fusion/sketch/gpu/operators/GpuMul.cpp",
Ramy Elgammalf800adf2022-12-14 15:39:29 +00002317 "src/dynamic_fusion/sketch/gpu/operators/GpuReshape.cpp",
Mohammed Suhail Munshia18d85c2023-01-03 10:16:16 +00002318 "src/dynamic_fusion/sketch/gpu/operators/GpuPool2d.cpp",
Viet-Hoa Dob84e2532022-12-13 13:09:10 +00002319 "src/dynamic_fusion/sketch/gpu/operators/GpuOutput.cpp",
Jakub Sujak8ae57142022-12-02 16:09:06 +00002320 "src/dynamic_fusion/sketch/gpu/operators/GpuResize.cpp",
Viet-Hoa Do98aca0f2023-03-02 17:43:45 +00002321 "src/dynamic_fusion/sketch/gpu/operators/GpuSigmoid.cpp",
Ramy Elgammal002e6532023-01-11 18:48:04 +00002322 "src/dynamic_fusion/sketch/gpu/operators/GpuSoftmax.cpp",
Ramy Elgammalec320d92022-12-14 09:20:09 +00002323 "src/dynamic_fusion/sketch/gpu/operators/GpuSub.cpp",
Viet-Hoa Do98aca0f2023-03-02 17:43:45 +00002324 "src/dynamic_fusion/sketch/gpu/operators/GpuTanh.cpp",
Ramy Elgammal404462a2022-11-08 02:14:46 +00002325 "src/dynamic_fusion/sketch/gpu/operators/internal/GpuElementwiseBinaryCommon.cpp",
Jakub Sujak32741722022-11-25 16:43:18 +00002326 "src/dynamic_fusion/sketch/gpu/template_writer/cl/ClTemplateActivation.cpp",
Gunes Bayir1dc6ff12022-12-06 20:48:31 +00002327 "src/dynamic_fusion/sketch/gpu/template_writer/cl/ClTemplateCast.cpp",
Gunes Bayir7dc02342022-11-21 21:46:50 +00002328 "src/dynamic_fusion/sketch/gpu/template_writer/cl/ClTemplateDepthwiseConv2d.cpp",
SiCong Lif44bbc52022-08-29 18:25:51 +01002329 "src/dynamic_fusion/sketch/gpu/template_writer/cl/ClTemplateDirectConv2d.cpp",
Mohammed Suhail Munshia18d85c2023-01-03 10:16:16 +00002330 "src/dynamic_fusion/sketch/gpu/template_writer/cl/ClTemplatePool2d.cpp",
Ramy Elgammal404462a2022-11-08 02:14:46 +00002331 "src/dynamic_fusion/sketch/gpu/template_writer/cl/ClTemplateElementwiseBinary.cpp",
Gunes Bayiraecb5d92022-12-18 21:31:29 +00002332 "src/dynamic_fusion/sketch/gpu/template_writer/cl/ClTemplateLogits1DMaxShiftExpSum.cpp",
Ramy Elgammal002e6532023-01-11 18:48:04 +00002333 "src/dynamic_fusion/sketch/gpu/template_writer/cl/ClTemplateLogits1DNorm.cpp",
Ramy Elgammalf800adf2022-12-14 15:39:29 +00002334 "src/dynamic_fusion/sketch/gpu/template_writer/cl/ClTemplateReshape.cpp",
Jakub Sujak8ae57142022-12-02 16:09:06 +00002335 "src/dynamic_fusion/sketch/gpu/template_writer/cl/ClTemplateResize.cpp",
SiCong Lif44bbc52022-08-29 18:25:51 +01002336 "src/dynamic_fusion/sketch/gpu/template_writer/cl/ClTemplateStore.cpp",
2337 "src/dynamic_fusion/sketch/gpu/template_writer/cl/ClTemplateWriter.cpp",
2338 "src/dynamic_fusion/sketch/gpu/template_writer/GpuKernelVariableTable.cpp"
Giorgio Arena232c4522022-03-03 10:09:01 +00002339 ]
Michalis Spyrou20fca522021-06-07 14:23:57 +01002340 }
ramelg018a164882022-04-07 02:42:52 +01002341}